/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */

/*
 * Copyright 2009 Sun Microsystems, Inc. All rights reserved.
 * Use is subject to license terms.
 */

/*
 * This file contains the functions for performing Fast Reboot -- a
 * reboot which bypasses the firmware and bootloader, considerably
 * reducing downtime.
 *
 * fastboot_load_kernel(): This function is invoked by mdpreboot() in the
 * reboot path. It loads the new kernel and boot archive into memory, builds
 * the data structure containing sufficient information about the new
 * kernel and boot archive to be passed to the fast reboot switcher
 * (see fb_swtch_src.s for details). When invoked the switcher relocates
 * the new kernel and boot archive to physically contiguous low memory,
 * similar to where the boot loader would have loaded them, and jumps to
 * the new kernel.
 *
 * If fastreboot_onpanic is enabled, fastboot_load_kernel() is called
 * by fastreboot_post_startup() to load the backup kernel in case of
 * panic.
 *
 * The physical addresses of the memory allocated for the new kernel, boot
 * archive and their page tables must be above where the boot archive ends
 * after it has been relocated by the switcher, otherwise the new files
 * and their page tables could be overwritten during relocation.
 *
 * fast_reboot(): This function is invoked by mdboot() once it's determined
 * that the system is capable of fast reboot. It jumps to the fast reboot
 * switcher with the data structure built by fastboot_load_kernel() as the
 * argument.
546bc8bc6aSSherry Moore */ 5519397407SSherry Moore 5619397407SSherry Moore #include <sys/types.h> 5719397407SSherry Moore #include <sys/param.h> 5819397407SSherry Moore #include <sys/segments.h> 5919397407SSherry Moore #include <sys/sysmacros.h> 6019397407SSherry Moore #include <sys/vm.h> 6119397407SSherry Moore 6219397407SSherry Moore #include <sys/proc.h> 6319397407SSherry Moore #include <sys/buf.h> 6419397407SSherry Moore #include <sys/kmem.h> 6519397407SSherry Moore 6619397407SSherry Moore #include <sys/reboot.h> 6719397407SSherry Moore #include <sys/uadmin.h> 6819397407SSherry Moore 6919397407SSherry Moore #include <sys/cred.h> 7019397407SSherry Moore #include <sys/vnode.h> 7119397407SSherry Moore #include <sys/file.h> 7219397407SSherry Moore 7319397407SSherry Moore #include <sys/cmn_err.h> 7419397407SSherry Moore #include <sys/dumphdr.h> 7519397407SSherry Moore #include <sys/bootconf.h> 7619397407SSherry Moore #include <sys/ddidmareq.h> 7719397407SSherry Moore #include <sys/varargs.h> 7819397407SSherry Moore #include <sys/promif.h> 7919397407SSherry Moore #include <sys/modctl.h> 8019397407SSherry Moore 8119397407SSherry Moore #include <vm/hat.h> 8219397407SSherry Moore #include <vm/as.h> 8319397407SSherry Moore #include <vm/page.h> 8419397407SSherry Moore #include <vm/seg.h> 8519397407SSherry Moore #include <vm/hat_i86.h> 8619397407SSherry Moore #include <sys/vm_machparam.h> 8719397407SSherry Moore #include <sys/archsystm.h> 8819397407SSherry Moore #include <sys/machsystm.h> 8919397407SSherry Moore #include <sys/mman.h> 9019397407SSherry Moore #include <sys/x86_archext.h> 91753a6d45SSherry Moore #include <sys/smp_impldefs.h> 92753a6d45SSherry Moore #include <sys/spl.h> 9319397407SSherry Moore 9419397407SSherry Moore #include <sys/fastboot.h> 9519397407SSherry Moore #include <sys/machelf.h> 9619397407SSherry Moore #include <sys/kobj.h> 9719397407SSherry Moore #include <sys/multiboot.h> 98753a6d45SSherry Moore #include <sys/kobj_lex.h> 99753a6d45SSherry Moore 
100753a6d45SSherry Moore /* 101753a6d45SSherry Moore * Macro to determine how many pages are needed for PTEs to map a particular 102753a6d45SSherry Moore * file. Allocate one extra page table entry for terminating the list. 103753a6d45SSherry Moore */ 104753a6d45SSherry Moore #define FASTBOOT_PTE_LIST_SIZE(fsize) \ 105753a6d45SSherry Moore P2ROUNDUP((((fsize) >> PAGESHIFT) + 1) * sizeof (x86pte_t), PAGESIZE) 10619397407SSherry Moore 1076bc8bc6aSSherry Moore /* 1086bc8bc6aSSherry Moore * Data structure containing necessary information for the fast reboot 1096bc8bc6aSSherry Moore * switcher to jump to the new kernel. 1106bc8bc6aSSherry Moore */ 11119397407SSherry Moore fastboot_info_t newkernel = { 0 }; 112753a6d45SSherry Moore char fastboot_args[OBP_MAXPATHLEN]; 1136bc8bc6aSSherry Moore 11419397407SSherry Moore static char fastboot_filename[2][OBP_MAXPATHLEN] = { { 0 }, { 0 }}; 11519397407SSherry Moore static x86pte_t ptp_bits = PT_VALID | PT_REF | PT_USER | PT_WRITABLE; 11619397407SSherry Moore static x86pte_t pte_bits = 11719397407SSherry Moore PT_VALID | PT_REF | PT_MOD | PT_NOCONSIST | PT_WRITABLE; 11819397407SSherry Moore static uint_t fastboot_shift_amt_pae[] = {12, 21, 30, 39}; 11919397407SSherry Moore 12019397407SSherry Moore int fastboot_debug = 0; 12119397407SSherry Moore int fastboot_contig = 0; 12219397407SSherry Moore 12319397407SSherry Moore /* 12419397407SSherry Moore * Fake starting va for new kernel and boot archive. 12519397407SSherry Moore */ 12619397407SSherry Moore static uintptr_t fake_va = FASTBOOT_FAKE_VA; 12719397407SSherry Moore 12819397407SSherry Moore /* 129753a6d45SSherry Moore * Reserve memory below PA 1G in preparation of fast reboot. 130753a6d45SSherry Moore * 131753a6d45SSherry Moore * This variable is only checked when fastreboot_capable is set, but 132753a6d45SSherry Moore * fastreboot_onpanic is not set. 
The amount of memory reserved 133753a6d45SSherry Moore * is negligible, but just in case we are really short of low memory, 134753a6d45SSherry Moore * this variable will give us a backdoor to not consume memory at all. 135753a6d45SSherry Moore */ 136753a6d45SSherry Moore int reserve_mem_enabled = 1; 137753a6d45SSherry Moore 138753a6d45SSherry Moore /* 139753a6d45SSherry Moore * Amount of memory below PA 1G to reserve for constructing the multiboot 140753a6d45SSherry Moore * data structure and the page tables as we tend to run out of those 141753a6d45SSherry Moore * when more drivers are loaded. 142753a6d45SSherry Moore */ 143753a6d45SSherry Moore static size_t fastboot_mbi_size = 0x2000; /* 8K */ 144753a6d45SSherry Moore static size_t fastboot_pagetable_size = 0x5000; /* 20K */ 145753a6d45SSherry Moore 146753a6d45SSherry Moore /* 147753a6d45SSherry Moore * Use below 1G for page tables as 148753a6d45SSherry Moore * 1. we are only doing 1:1 mapping of the bottom 1G of physical memory. 149753a6d45SSherry Moore * 2. we are using 2G as the fake virtual address for the new kernel and 150753a6d45SSherry Moore * boot archive. 
15119397407SSherry Moore */ 15219397407SSherry Moore static ddi_dma_attr_t fastboot_below_1G_dma_attr = { 15319397407SSherry Moore DMA_ATTR_V0, 15419397407SSherry Moore 0x0000000008000000ULL, /* dma_attr_addr_lo: 128MB */ 15519397407SSherry Moore 0x000000003FFFFFFFULL, /* dma_attr_addr_hi: 1G */ 15619397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_count_max */ 15719397407SSherry Moore 0x0000000000001000ULL, /* dma_attr_align: 4KB */ 15819397407SSherry Moore 1, /* dma_attr_burstsize */ 15919397407SSherry Moore 1, /* dma_attr_minxfer */ 16019397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_maxxfer */ 16119397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_seg */ 16219397407SSherry Moore 1, /* dma_attr_sgllen */ 16319397407SSherry Moore 0x1000ULL, /* dma_attr_granular */ 16419397407SSherry Moore 0, /* dma_attr_flags */ 16519397407SSherry Moore }; 16619397407SSherry Moore 16719397407SSherry Moore static ddi_dma_attr_t fastboot_dma_attr = { 16819397407SSherry Moore DMA_ATTR_V0, 16919397407SSherry Moore 0x0000000008000000ULL, /* dma_attr_addr_lo: 128MB */ 170877400d3SKonstantin Ananyev #ifdef __amd64 171877400d3SKonstantin Ananyev 0xFFFFFFFFFFFFFFFFULL, /* dma_attr_addr_hi: 2^64B */ 172877400d3SKonstantin Ananyev #else 17319397407SSherry Moore 0x0000000FFFFFFFFFULL, /* dma_attr_addr_hi: 64GB */ 174877400d3SKonstantin Ananyev #endif /* __amd64 */ 17519397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_count_max */ 17619397407SSherry Moore 0x0000000000001000ULL, /* dma_attr_align: 4KB */ 17719397407SSherry Moore 1, /* dma_attr_burstsize */ 17819397407SSherry Moore 1, /* dma_attr_minxfer */ 17919397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_maxxfer */ 18019397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_seg */ 18119397407SSherry Moore 1, /* dma_attr_sgllen */ 18219397407SSherry Moore 0x1000ULL, /* dma_attr_granular */ 18319397407SSherry Moore 0, /* dma_attr_flags */ 18419397407SSherry Moore }; 18519397407SSherry Moore 18619397407SSherry 
Moore /* 18719397407SSherry Moore * Various information saved from the previous boot to reconstruct 18819397407SSherry Moore * multiboot_info. 18919397407SSherry Moore */ 19019397407SSherry Moore extern multiboot_info_t saved_mbi; 19119397407SSherry Moore extern mb_memory_map_t saved_mmap[FASTBOOT_SAVED_MMAP_COUNT]; 192*6915124bSKonstantin Ananyev extern uint8_t saved_drives[FASTBOOT_SAVED_DRIVES_SIZE]; 19319397407SSherry Moore extern char saved_cmdline[FASTBOOT_SAVED_CMDLINE_LEN]; 19419397407SSherry Moore extern int saved_cmdline_len; 195753a6d45SSherry Moore extern size_t saved_file_size[]; 19619397407SSherry Moore 19719397407SSherry Moore extern void* contig_alloc(size_t size, ddi_dma_attr_t *attr, 19819397407SSherry Moore uintptr_t align, int cansleep); 1996bc8bc6aSSherry Moore extern void contig_free(void *addr, size_t size); 2006bc8bc6aSSherry Moore 20119397407SSherry Moore 20219397407SSherry Moore /* PRINTLIKE */ 20319397407SSherry Moore extern void vprintf(const char *, va_list); 20419397407SSherry Moore 20519397407SSherry Moore 20619397407SSherry Moore /* 20719397407SSherry Moore * Need to be able to get boot_archives from other places 20819397407SSherry Moore */ 20919397407SSherry Moore #define BOOTARCHIVE64 "/platform/i86pc/amd64/boot_archive" 21019397407SSherry Moore #define BOOTARCHIVE32 "/platform/i86pc/boot_archive" 211753a6d45SSherry Moore #define BOOTARCHIVE32_FAILSAFE "/boot/x86.miniroot-safe" 212753a6d45SSherry Moore #define BOOTARCHIVE64_FAILSAFE "/boot/amd64/x86.miniroot-safe" 213753a6d45SSherry Moore #define FAILSAFE_BOOTFILE32 "/boot/platform/i86pc/kernel/unix" 214753a6d45SSherry Moore #define FAILSAFE_BOOTFILE64 "/boot/platform/i86pc/kernel/amd64/unix" 21519397407SSherry Moore 21619397407SSherry Moore static uint_t fastboot_vatoindex(fastboot_info_t *, uintptr_t, int); 21719397407SSherry Moore static void fastboot_map_with_size(fastboot_info_t *, uintptr_t, 21819397407SSherry Moore paddr_t, size_t, int); 21919397407SSherry Moore static void 
fastboot_build_pagetables(fastboot_info_t *); 22019397407SSherry Moore static int fastboot_build_mbi(char *, fastboot_info_t *); 221753a6d45SSherry Moore static void fastboot_free_file(fastboot_file_t *); 22219397407SSherry Moore 22319397407SSherry Moore static const char fastboot_enomem_msg[] = "Fastboot: Couldn't allocate 0x%" 22419397407SSherry Moore PRIx64" bytes below %s to do fast reboot"; 22519397407SSherry Moore 22619397407SSherry Moore static void 22719397407SSherry Moore dprintf(char *fmt, ...) 22819397407SSherry Moore { 22919397407SSherry Moore va_list adx; 23019397407SSherry Moore 23119397407SSherry Moore if (!fastboot_debug) 23219397407SSherry Moore return; 23319397407SSherry Moore 23419397407SSherry Moore va_start(adx, fmt); 23519397407SSherry Moore vprintf(fmt, adx); 23619397407SSherry Moore va_end(adx); 23719397407SSherry Moore } 23819397407SSherry Moore 23919397407SSherry Moore 24019397407SSherry Moore /* 24119397407SSherry Moore * Return the index corresponding to a virt address at a given page table level. 24219397407SSherry Moore */ 24319397407SSherry Moore static uint_t 24419397407SSherry Moore fastboot_vatoindex(fastboot_info_t *nk, uintptr_t va, int level) 24519397407SSherry Moore { 24619397407SSherry Moore return ((va >> nk->fi_shift_amt[level]) & (nk->fi_ptes_per_table - 1)); 24719397407SSherry Moore } 24819397407SSherry Moore 24919397407SSherry Moore 25019397407SSherry Moore /* 25119397407SSherry Moore * Add mapping from vstart to pstart for the specified size. 252877400d3SKonstantin Ananyev * vstart, pstart and size should all have been aligned at 2M boundaries. 
25319397407SSherry Moore */ 25419397407SSherry Moore static void 25519397407SSherry Moore fastboot_map_with_size(fastboot_info_t *nk, uintptr_t vstart, paddr_t pstart, 25619397407SSherry Moore size_t size, int level) 25719397407SSherry Moore { 25819397407SSherry Moore x86pte_t pteval, *table; 25919397407SSherry Moore uintptr_t vaddr; 26019397407SSherry Moore paddr_t paddr; 26119397407SSherry Moore int index, l; 26219397407SSherry Moore 26319397407SSherry Moore table = (x86pte_t *)(nk->fi_pagetable_va); 26419397407SSherry Moore 26519397407SSherry Moore for (l = nk->fi_top_level; l >= level; l--) { 26619397407SSherry Moore 26719397407SSherry Moore index = fastboot_vatoindex(nk, vstart, l); 26819397407SSherry Moore 26919397407SSherry Moore if (l == level) { 27019397407SSherry Moore /* 27119397407SSherry Moore * Last level. Program the page table entries. 27219397407SSherry Moore */ 27319397407SSherry Moore for (vaddr = vstart, paddr = pstart; 27419397407SSherry Moore vaddr < vstart + size; 27519397407SSherry Moore vaddr += (1ULL << nk->fi_shift_amt[l]), 27619397407SSherry Moore paddr += (1ULL << nk->fi_shift_amt[l])) { 27719397407SSherry Moore 27819397407SSherry Moore uint_t index = fastboot_vatoindex(nk, vaddr, l); 27919397407SSherry Moore 28019397407SSherry Moore if (l > 0) 28119397407SSherry Moore pteval = paddr | pte_bits | PT_PAGESIZE; 28219397407SSherry Moore else 28319397407SSherry Moore pteval = paddr | pte_bits; 28419397407SSherry Moore 28519397407SSherry Moore table[index] = pteval; 28619397407SSherry Moore } 28719397407SSherry Moore } else if (table[index] & PT_VALID) { 28819397407SSherry Moore 28919397407SSherry Moore table = (x86pte_t *) 29019397407SSherry Moore ((uintptr_t)(((paddr_t)table[index] & MMU_PAGEMASK) 29119397407SSherry Moore - nk->fi_pagetable_pa) + nk->fi_pagetable_va); 29219397407SSherry Moore } else { 29319397407SSherry Moore /* 294877400d3SKonstantin Ananyev * Intermediate levels. 
295877400d3SKonstantin Ananyev * Program with either valid bit or PTP bits. 29619397407SSherry Moore */ 29719397407SSherry Moore if (l == nk->fi_top_level) { 298877400d3SKonstantin Ananyev #ifdef __amd64 299877400d3SKonstantin Ananyev ASSERT(nk->fi_top_level == 3); 300877400d3SKonstantin Ananyev table[index] = nk->fi_next_table_pa | ptp_bits; 301877400d3SKonstantin Ananyev #else 30219397407SSherry Moore table[index] = nk->fi_next_table_pa | PT_VALID; 303877400d3SKonstantin Ananyev #endif /* __amd64 */ 30419397407SSherry Moore } else { 30519397407SSherry Moore table[index] = nk->fi_next_table_pa | ptp_bits; 30619397407SSherry Moore } 30719397407SSherry Moore table = (x86pte_t *)(nk->fi_next_table_va); 30819397407SSherry Moore nk->fi_next_table_va += MMU_PAGESIZE; 30919397407SSherry Moore nk->fi_next_table_pa += MMU_PAGESIZE; 31019397407SSherry Moore } 31119397407SSherry Moore } 31219397407SSherry Moore } 31319397407SSherry Moore 31419397407SSherry Moore /* 31519397407SSherry Moore * Build page tables for the lower 1G of physical memory using 2M 31619397407SSherry Moore * pages, and prepare page tables for mapping new kernel and boot 31719397407SSherry Moore * archive pages using 4K pages. 31819397407SSherry Moore */ 31919397407SSherry Moore static void 32019397407SSherry Moore fastboot_build_pagetables(fastboot_info_t *nk) 32119397407SSherry Moore { 32219397407SSherry Moore /* 32319397407SSherry Moore * Map lower 1G physical memory. Use large pages. 32419397407SSherry Moore */ 32519397407SSherry Moore fastboot_map_with_size(nk, 0, 0, ONE_GIG, 1); 32619397407SSherry Moore 32719397407SSherry Moore /* 32819397407SSherry Moore * Map one 4K page to get the middle page tables set up. 
32919397407SSherry Moore */ 33019397407SSherry Moore fake_va = P2ALIGN_TYPED(fake_va, nk->fi_lpagesize, uintptr_t); 33119397407SSherry Moore fastboot_map_with_size(nk, fake_va, 33219397407SSherry Moore nk->fi_files[0].fb_pte_list_va[0] & MMU_PAGEMASK, PAGESIZE, 0); 33319397407SSherry Moore } 33419397407SSherry Moore 33519397407SSherry Moore 33619397407SSherry Moore /* 33719397407SSherry Moore * Sanity check. Look for dboot offset. 33819397407SSherry Moore */ 33919397407SSherry Moore static int 34019397407SSherry Moore fastboot_elf64_find_dboot_load_offset(void *img, off_t imgsz, uint32_t *offp) 34119397407SSherry Moore { 34219397407SSherry Moore Elf64_Ehdr *ehdr = (Elf64_Ehdr *)img; 34319397407SSherry Moore Elf64_Phdr *phdr; 34419397407SSherry Moore uint8_t *phdrbase; 34519397407SSherry Moore int i; 34619397407SSherry Moore 34719397407SSherry Moore if ((ehdr->e_phoff + ehdr->e_phnum * ehdr->e_phentsize) >= imgsz) 34819397407SSherry Moore return (-1); 34919397407SSherry Moore 35019397407SSherry Moore phdrbase = (uint8_t *)img + ehdr->e_phoff; 35119397407SSherry Moore 35219397407SSherry Moore for (i = 0; i < ehdr->e_phnum; i++) { 35319397407SSherry Moore phdr = (Elf64_Phdr *)(phdrbase + ehdr->e_phentsize * i); 35419397407SSherry Moore 35519397407SSherry Moore if (phdr->p_type == PT_LOAD) { 35619397407SSherry Moore if (phdr->p_vaddr == phdr->p_paddr && 35719397407SSherry Moore phdr->p_vaddr == DBOOT_ENTRY_ADDRESS) { 35819397407SSherry Moore ASSERT(phdr->p_offset <= UINT32_MAX); 35919397407SSherry Moore *offp = (uint32_t)phdr->p_offset; 36019397407SSherry Moore return (0); 36119397407SSherry Moore } 36219397407SSherry Moore } 36319397407SSherry Moore } 36419397407SSherry Moore 36519397407SSherry Moore return (-1); 36619397407SSherry Moore } 36719397407SSherry Moore 36819397407SSherry Moore 36919397407SSherry Moore /* 37019397407SSherry Moore * Initialize text and data section information for 32-bit kernel. 
371877400d3SKonstantin Ananyev * sectcntp - is both input/output parameter. 372877400d3SKonstantin Ananyev * On entry, *sectcntp contains maximum allowable number of sections; 373877400d3SKonstantin Ananyev * on return, it contains the actual number of sections filled. 37419397407SSherry Moore */ 37519397407SSherry Moore static int 37619397407SSherry Moore fastboot_elf32_find_loadables(void *img, off_t imgsz, fastboot_section_t *sectp, 37719397407SSherry Moore int *sectcntp, uint32_t *offp) 37819397407SSherry Moore { 37919397407SSherry Moore Elf32_Ehdr *ehdr = (Elf32_Ehdr *)img; 38019397407SSherry Moore Elf32_Phdr *phdr; 38119397407SSherry Moore uint8_t *phdrbase; 38219397407SSherry Moore int i; 38319397407SSherry Moore int used_sections = 0; 384877400d3SKonstantin Ananyev const int max_sectcnt = *sectcntp; 38519397407SSherry Moore 38619397407SSherry Moore if ((ehdr->e_phoff + ehdr->e_phnum * ehdr->e_phentsize) >= imgsz) 38719397407SSherry Moore return (-1); 38819397407SSherry Moore 38919397407SSherry Moore phdrbase = (uint8_t *)img + ehdr->e_phoff; 39019397407SSherry Moore 39119397407SSherry Moore for (i = 0; i < ehdr->e_phnum; i++) { 39219397407SSherry Moore phdr = (Elf32_Phdr *)(phdrbase + ehdr->e_phentsize * i); 39319397407SSherry Moore 39419397407SSherry Moore if (phdr->p_type == PT_INTERP) 39519397407SSherry Moore return (-1); 39619397407SSherry Moore 39719397407SSherry Moore if (phdr->p_type != PT_LOAD) 39819397407SSherry Moore continue; 39919397407SSherry Moore 40019397407SSherry Moore if (phdr->p_vaddr == phdr->p_paddr && 40119397407SSherry Moore phdr->p_paddr == DBOOT_ENTRY_ADDRESS) { 40219397407SSherry Moore *offp = (uint32_t)phdr->p_offset; 40319397407SSherry Moore } else { 404877400d3SKonstantin Ananyev if (max_sectcnt <= used_sections) 405877400d3SKonstantin Ananyev return (-1); 406877400d3SKonstantin Ananyev 40719397407SSherry Moore sectp[used_sections].fb_sec_offset = phdr->p_offset; 40819397407SSherry Moore sectp[used_sections].fb_sec_paddr = 
phdr->p_paddr; 40919397407SSherry Moore sectp[used_sections].fb_sec_size = phdr->p_filesz; 41019397407SSherry Moore sectp[used_sections].fb_sec_bss_size = 41119397407SSherry Moore (phdr->p_filesz < phdr->p_memsz) ? 41219397407SSherry Moore (phdr->p_memsz - phdr->p_filesz) : 0; 41319397407SSherry Moore 414877400d3SKonstantin Ananyev /* Extra sanity check for the input object file */ 415877400d3SKonstantin Ananyev if (sectp[used_sections].fb_sec_paddr + 416877400d3SKonstantin Ananyev sectp[used_sections].fb_sec_size + 417877400d3SKonstantin Ananyev sectp[used_sections].fb_sec_bss_size >= 418877400d3SKonstantin Ananyev DBOOT_ENTRY_ADDRESS) 419877400d3SKonstantin Ananyev return (-1); 420877400d3SKonstantin Ananyev 42119397407SSherry Moore used_sections++; 42219397407SSherry Moore } 42319397407SSherry Moore } 42419397407SSherry Moore 42519397407SSherry Moore *sectcntp = used_sections; 42619397407SSherry Moore return (0); 42719397407SSherry Moore } 42819397407SSherry Moore 42919397407SSherry Moore /* 4301a6f4459SKonstantin Ananyev * Create multiboot info structure (mbi) base on the saved mbi. 4311a6f4459SKonstantin Ananyev * Recalculate values of the pointer type fields in the data 4321a6f4459SKonstantin Ananyev * structure based on the new starting physical address of the 4331a6f4459SKonstantin Ananyev * data structure. 
43419397407SSherry Moore */ 43519397407SSherry Moore static int 43619397407SSherry Moore fastboot_build_mbi(char *mdep, fastboot_info_t *nk) 43719397407SSherry Moore { 43819397407SSherry Moore mb_module_t *mbp; 4391a6f4459SKonstantin Ananyev multiboot_info_t *mbi; /* pointer to multiboot structure */ 4401a6f4459SKonstantin Ananyev uintptr_t start_addr_va; /* starting VA of mbi */ 4411a6f4459SKonstantin Ananyev uintptr_t start_addr_pa; /* starting PA of mbi */ 4421a6f4459SKonstantin Ananyev size_t offs = 0; /* offset from the starting address */ 4431a6f4459SKonstantin Ananyev size_t arglen; /* length of the command line arg */ 4441a6f4459SKonstantin Ananyev size_t size; /* size of the memory reserved for mbi */ 4451a6f4459SKonstantin Ananyev size_t mdnsz; /* length of the boot archive name */ 44619397407SSherry Moore 4471a6f4459SKonstantin Ananyev /* 4481a6f4459SKonstantin Ananyev * If mdep is not NULL or empty, use the length of mdep + 1 4491a6f4459SKonstantin Ananyev * (for NULL terminating) as the length of the new command 4501a6f4459SKonstantin Ananyev * line; else use the saved command line length as the 4511a6f4459SKonstantin Ananyev * length for the new command line. 4521a6f4459SKonstantin Ananyev */ 4536bc8bc6aSSherry Moore if (mdep != NULL && strlen(mdep) != 0) { 45419397407SSherry Moore arglen = strlen(mdep) + 1; 45519397407SSherry Moore } else { 45619397407SSherry Moore arglen = saved_cmdline_len; 45719397407SSherry Moore } 45819397407SSherry Moore 4591a6f4459SKonstantin Ananyev /* 4601a6f4459SKonstantin Ananyev * Allocate memory for the new multiboot info structure (mbi). 4611a6f4459SKonstantin Ananyev * If we have reserved memory for mbi but it's not enough, 4621a6f4459SKonstantin Ananyev * free it and reallocate. 
4631a6f4459SKonstantin Ananyev */ 46419397407SSherry Moore size = PAGESIZE + P2ROUNDUP(arglen, PAGESIZE); 465753a6d45SSherry Moore if (nk->fi_mbi_size && nk->fi_mbi_size < size) { 466753a6d45SSherry Moore contig_free((void *)nk->fi_new_mbi_va, nk->fi_mbi_size); 467753a6d45SSherry Moore nk->fi_mbi_size = 0; 46819397407SSherry Moore } 46919397407SSherry Moore 470753a6d45SSherry Moore if (nk->fi_mbi_size == 0) { 471753a6d45SSherry Moore if ((nk->fi_new_mbi_va = 472753a6d45SSherry Moore (uintptr_t)contig_alloc(size, &fastboot_below_1G_dma_attr, 473753a6d45SSherry Moore PAGESIZE, 0)) == NULL) { 474753a6d45SSherry Moore cmn_err(CE_WARN, fastboot_enomem_msg, 475753a6d45SSherry Moore (uint64_t)size, "1G"); 476753a6d45SSherry Moore return (-1); 477753a6d45SSherry Moore } 478753a6d45SSherry Moore /* 479753a6d45SSherry Moore * fi_mbi_size must be set after the allocation succeeds 480753a6d45SSherry Moore * as it's used to determine how much memory to free. 481753a6d45SSherry Moore */ 482753a6d45SSherry Moore nk->fi_mbi_size = size; 483753a6d45SSherry Moore } 48419397407SSherry Moore 4851a6f4459SKonstantin Ananyev /* 4861a6f4459SKonstantin Ananyev * Initalize memory 4871a6f4459SKonstantin Ananyev */ 488753a6d45SSherry Moore bzero((void *)nk->fi_new_mbi_va, nk->fi_mbi_size); 48919397407SSherry Moore 4901a6f4459SKonstantin Ananyev /* 4911a6f4459SKonstantin Ananyev * Get PA for the new mbi 4921a6f4459SKonstantin Ananyev */ 4931a6f4459SKonstantin Ananyev start_addr_va = nk->fi_new_mbi_va; 4941a6f4459SKonstantin Ananyev start_addr_pa = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat, 4951a6f4459SKonstantin Ananyev (caddr_t)start_addr_va)); 4961a6f4459SKonstantin Ananyev nk->fi_new_mbi_pa = (paddr_t)start_addr_pa; 497753a6d45SSherry Moore 498753a6d45SSherry Moore /* 4991a6f4459SKonstantin Ananyev * Populate the rest of the fields in the data structure 500753a6d45SSherry Moore */ 501753a6d45SSherry Moore 5021a6f4459SKonstantin Ananyev /* 5031a6f4459SKonstantin Ananyev * Copy from the saved 
mbi to preserve all non-pointer type fields. 5041a6f4459SKonstantin Ananyev */ 5051a6f4459SKonstantin Ananyev mbi = (multiboot_info_t *)start_addr_va; 5061a6f4459SKonstantin Ananyev bcopy(&saved_mbi, mbi, sizeof (*mbi)); 50719397407SSherry Moore 5081a6f4459SKonstantin Ananyev /* 5091a6f4459SKonstantin Ananyev * Recalculate mods_addr. Set mod_start and mod_end based on 5101a6f4459SKonstantin Ananyev * the physical address of the new boot archive. Set mod_name 5111a6f4459SKonstantin Ananyev * to the name of the new boto archive. 5121a6f4459SKonstantin Ananyev */ 5131a6f4459SKonstantin Ananyev offs += sizeof (multiboot_info_t); 5141a6f4459SKonstantin Ananyev mbi->mods_addr = start_addr_pa + offs; 5151a6f4459SKonstantin Ananyev mbp = (mb_module_t *)(start_addr_va + offs); 516753a6d45SSherry Moore mbp->mod_start = nk->fi_files[FASTBOOT_BOOTARCHIVE].fb_dest_pa; 517753a6d45SSherry Moore mbp->mod_end = nk->fi_files[FASTBOOT_BOOTARCHIVE].fb_next_pa; 51819397407SSherry Moore 5191a6f4459SKonstantin Ananyev offs += sizeof (mb_module_t); 5201a6f4459SKonstantin Ananyev mdnsz = strlen(fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE]) + 1; 5211a6f4459SKonstantin Ananyev bcopy(fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE], 5221a6f4459SKonstantin Ananyev (void *)(start_addr_va + offs), mdnsz); 5231a6f4459SKonstantin Ananyev mbp->mod_name = start_addr_pa + offs; 52419397407SSherry Moore mbp->reserved = 0; 52519397407SSherry Moore 5261a6f4459SKonstantin Ananyev /* 5271a6f4459SKonstantin Ananyev * Make sure the offset is 16-byte aligned to avoid unaligned access. 
5281a6f4459SKonstantin Ananyev */ 5291a6f4459SKonstantin Ananyev offs += mdnsz; 5301a6f4459SKonstantin Ananyev offs = P2ROUNDUP_TYPED(offs, 16, size_t); 5311a6f4459SKonstantin Ananyev 5321a6f4459SKonstantin Ananyev /* 5331a6f4459SKonstantin Ananyev * Recalculate mmap_addr 5341a6f4459SKonstantin Ananyev */ 5351a6f4459SKonstantin Ananyev mbi->mmap_addr = start_addr_pa + offs; 5361a6f4459SKonstantin Ananyev bcopy((void *)(uintptr_t)saved_mmap, (void *)(start_addr_va + offs), 53719397407SSherry Moore saved_mbi.mmap_length); 5381a6f4459SKonstantin Ananyev offs += saved_mbi.mmap_length; 53919397407SSherry Moore 5401a6f4459SKonstantin Ananyev /* 5411a6f4459SKonstantin Ananyev * Recalculate drives_addr 5421a6f4459SKonstantin Ananyev */ 5431a6f4459SKonstantin Ananyev mbi->drives_addr = start_addr_pa + offs; 5441a6f4459SKonstantin Ananyev bcopy((void *)(uintptr_t)saved_drives, (void *)(start_addr_va + offs), 54519397407SSherry Moore saved_mbi.drives_length); 5461a6f4459SKonstantin Ananyev offs += saved_mbi.drives_length; 54719397407SSherry Moore 5481a6f4459SKonstantin Ananyev /* 5491a6f4459SKonstantin Ananyev * Recalculate the address of cmdline. Set cmdline to contain the 5501a6f4459SKonstantin Ananyev * new boot argument. 
5511a6f4459SKonstantin Ananyev */ 5521a6f4459SKonstantin Ananyev mbi->cmdline = start_addr_pa + offs; 55319397407SSherry Moore 5546bc8bc6aSSherry Moore if (mdep != NULL && strlen(mdep) != 0) { 5551a6f4459SKonstantin Ananyev bcopy(mdep, (void *)(start_addr_va + offs), arglen); 55619397407SSherry Moore } else { 5571a6f4459SKonstantin Ananyev bcopy((void *)saved_cmdline, (void *)(start_addr_va + offs), 5581a6f4459SKonstantin Ananyev arglen); 55919397407SSherry Moore } 56019397407SSherry Moore 561*6915124bSKonstantin Ananyev /* clear fields and flags that are not copied */ 562*6915124bSKonstantin Ananyev bzero(&mbi->config_table, 563*6915124bSKonstantin Ananyev sizeof (*mbi) - offsetof(multiboot_info_t, config_table)); 564*6915124bSKonstantin Ananyev mbi->flags &= ~(MB_INFO_CONFIG_TABLE | MB_INFO_BOOT_LOADER_NAME | 565*6915124bSKonstantin Ananyev MB_INFO_APM_TABLE | MB_INFO_VIDEO_INFO); 566*6915124bSKonstantin Ananyev 56719397407SSherry Moore return (0); 56819397407SSherry Moore } 56919397407SSherry Moore 5706bc8bc6aSSherry Moore /* 5716bc8bc6aSSherry Moore * Initialize HAT related fields 5726bc8bc6aSSherry Moore */ 5736bc8bc6aSSherry Moore static void 5746bc8bc6aSSherry Moore fastboot_init_fields(fastboot_info_t *nk) 57519397407SSherry Moore { 57619397407SSherry Moore if (x86_feature & X86_PAE) { 5776bc8bc6aSSherry Moore nk->fi_has_pae = 1; 5786bc8bc6aSSherry Moore nk->fi_shift_amt = fastboot_shift_amt_pae; 5796bc8bc6aSSherry Moore nk->fi_ptes_per_table = 512; 5806bc8bc6aSSherry Moore nk->fi_lpagesize = (2 << 20); /* 2M */ 581877400d3SKonstantin Ananyev #ifdef __amd64 582877400d3SKonstantin Ananyev nk->fi_top_level = 3; 583877400d3SKonstantin Ananyev #else 5846bc8bc6aSSherry Moore nk->fi_top_level = 2; 585877400d3SKonstantin Ananyev #endif /* __amd64 */ 5866bc8bc6aSSherry Moore } 58719397407SSherry Moore } 58819397407SSherry Moore 5896bc8bc6aSSherry Moore /* 5906bc8bc6aSSherry Moore * Process boot argument 5916bc8bc6aSSherry Moore */ 5926bc8bc6aSSherry Moore static 
void 5936bc8bc6aSSherry Moore fastboot_parse_mdep(char *mdep, char *kern_bootpath, int *bootpath_len, 5946bc8bc6aSSherry Moore char *bootargs) 5956bc8bc6aSSherry Moore { 5966bc8bc6aSSherry Moore int i; 59719397407SSherry Moore 59819397407SSherry Moore /* 59919397407SSherry Moore * If mdep is not NULL, it comes in the format of 60019397407SSherry Moore * mountpoint unix args 60119397407SSherry Moore */ 6026bc8bc6aSSherry Moore if (mdep != NULL && strlen(mdep) != 0) { 60319397407SSherry Moore if (mdep[0] != '-') { 60419397407SSherry Moore /* First get the root argument */ 60519397407SSherry Moore i = 0; 60619397407SSherry Moore while (mdep[i] != '\0' && mdep[i] != ' ') { 60719397407SSherry Moore i++; 60819397407SSherry Moore } 60919397407SSherry Moore 61019397407SSherry Moore if (i < 4 || strncmp(&mdep[i-4], "unix", 4) != 0) { 61119397407SSherry Moore /* mount point */ 61219397407SSherry Moore bcopy(mdep, kern_bootpath, i); 61319397407SSherry Moore kern_bootpath[i] = '\0'; 6146bc8bc6aSSherry Moore *bootpath_len = i; 61519397407SSherry Moore 61619397407SSherry Moore /* 61719397407SSherry Moore * Get the next argument. It should be unix as 61819397407SSherry Moore * we have validated in in halt.c. 
61919397407SSherry Moore */ 62019397407SSherry Moore if (strlen(mdep) > i) { 62119397407SSherry Moore mdep += (i + 1); 62219397407SSherry Moore i = 0; 62319397407SSherry Moore while (mdep[i] != '\0' && 62419397407SSherry Moore mdep[i] != ' ') { 62519397407SSherry Moore i++; 62619397407SSherry Moore } 62719397407SSherry Moore } 62819397407SSherry Moore 62919397407SSherry Moore } 63019397407SSherry Moore bcopy(mdep, kern_bootfile, i); 63119397407SSherry Moore kern_bootfile[i] = '\0'; 6326bc8bc6aSSherry Moore bcopy(mdep, bootargs, strlen(mdep)); 63319397407SSherry Moore } else { 63419397407SSherry Moore int off = strlen(kern_bootfile); 63519397407SSherry Moore bcopy(kern_bootfile, bootargs, off); 63619397407SSherry Moore bcopy(" ", &bootargs[off++], 1); 63719397407SSherry Moore bcopy(mdep, &bootargs[off], strlen(mdep)); 63819397407SSherry Moore off += strlen(mdep); 63919397407SSherry Moore bootargs[off] = '\0'; 64019397407SSherry Moore } 64119397407SSherry Moore } 6426bc8bc6aSSherry Moore } 6436bc8bc6aSSherry Moore 6446bc8bc6aSSherry Moore /* 645753a6d45SSherry Moore * Reserve memory under PA 1G for mapping the new kernel and boot archive. 646753a6d45SSherry Moore * This function is only called if fastreboot_onpanic is *not* set. 647753a6d45SSherry Moore */ 648753a6d45SSherry Moore static void 649753a6d45SSherry Moore fastboot_reserve_mem(fastboot_info_t *nk) 650753a6d45SSherry Moore { 651753a6d45SSherry Moore int i; 652753a6d45SSherry Moore 653753a6d45SSherry Moore /* 654753a6d45SSherry Moore * A valid kernel is in place. No need to reserve any memory. 655753a6d45SSherry Moore */ 656753a6d45SSherry Moore if (nk->fi_valid) 657753a6d45SSherry Moore return; 658753a6d45SSherry Moore 659753a6d45SSherry Moore /* 660753a6d45SSherry Moore * Reserve memory under PA 1G for PTE lists. 
661753a6d45SSherry Moore */ 662753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 663753a6d45SSherry Moore fastboot_file_t *fb = &nk->fi_files[i]; 664753a6d45SSherry Moore size_t fsize_roundup, size; 665753a6d45SSherry Moore 666753a6d45SSherry Moore fsize_roundup = P2ROUNDUP_TYPED(saved_file_size[i], 667753a6d45SSherry Moore PAGESIZE, size_t); 668753a6d45SSherry Moore size = FASTBOOT_PTE_LIST_SIZE(fsize_roundup); 669753a6d45SSherry Moore if ((fb->fb_pte_list_va = contig_alloc(size, 670753a6d45SSherry Moore &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) { 671753a6d45SSherry Moore return; 672753a6d45SSherry Moore } 673753a6d45SSherry Moore fb->fb_pte_list_size = size; 674753a6d45SSherry Moore } 675753a6d45SSherry Moore 676753a6d45SSherry Moore /* 677753a6d45SSherry Moore * Reserve memory under PA 1G for page tables. 678753a6d45SSherry Moore */ 679753a6d45SSherry Moore if ((nk->fi_pagetable_va = 680753a6d45SSherry Moore (uintptr_t)contig_alloc(fastboot_pagetable_size, 681753a6d45SSherry Moore &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) { 682753a6d45SSherry Moore return; 683753a6d45SSherry Moore } 684753a6d45SSherry Moore nk->fi_pagetable_size = fastboot_pagetable_size; 685753a6d45SSherry Moore 686753a6d45SSherry Moore /* 687753a6d45SSherry Moore * Reserve memory under PA 1G for multiboot structure. 688753a6d45SSherry Moore */ 689753a6d45SSherry Moore if ((nk->fi_new_mbi_va = (uintptr_t)contig_alloc(fastboot_mbi_size, 690753a6d45SSherry Moore &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) { 691753a6d45SSherry Moore return; 692753a6d45SSherry Moore } 693753a6d45SSherry Moore nk->fi_mbi_size = fastboot_mbi_size; 694753a6d45SSherry Moore } 695753a6d45SSherry Moore 696753a6d45SSherry Moore /* 697753a6d45SSherry Moore * Calculate MD5 digest for the given fastboot_file. 698753a6d45SSherry Moore * Assumes that the file is allready loaded properly. 
699753a6d45SSherry Moore */ 700753a6d45SSherry Moore static void 701753a6d45SSherry Moore fastboot_cksum_file(fastboot_file_t *fb, uchar_t *md5_hash) 702753a6d45SSherry Moore { 703753a6d45SSherry Moore MD5_CTX md5_ctx; 704753a6d45SSherry Moore 705753a6d45SSherry Moore MD5Init(&md5_ctx); 706753a6d45SSherry Moore MD5Update(&md5_ctx, (void *)fb->fb_va, fb->fb_size); 707753a6d45SSherry Moore MD5Final(md5_hash, &md5_ctx); 708753a6d45SSherry Moore } 709753a6d45SSherry Moore 710753a6d45SSherry Moore /* 711753a6d45SSherry Moore * Free up the memory we have allocated for a file 7126bc8bc6aSSherry Moore */ 7136bc8bc6aSSherry Moore static void 7146bc8bc6aSSherry Moore fastboot_free_file(fastboot_file_t *fb) 7156bc8bc6aSSherry Moore { 716753a6d45SSherry Moore size_t fsize_roundup; 7176bc8bc6aSSherry Moore 7186bc8bc6aSSherry Moore fsize_roundup = P2ROUNDUP_TYPED(fb->fb_size, PAGESIZE, size_t); 719753a6d45SSherry Moore if (fsize_roundup) { 7206bc8bc6aSSherry Moore contig_free((void *)fb->fb_va, fsize_roundup); 721753a6d45SSherry Moore fb->fb_va = NULL; 722753a6d45SSherry Moore fb->fb_size = 0; 723753a6d45SSherry Moore } 724753a6d45SSherry Moore } 7256bc8bc6aSSherry Moore 726753a6d45SSherry Moore /* 727753a6d45SSherry Moore * Free up memory used by the PTEs for a file. 
728753a6d45SSherry Moore */ 729753a6d45SSherry Moore static void 730753a6d45SSherry Moore fastboot_free_file_pte(fastboot_file_t *fb, uint64_t endaddr) 731753a6d45SSherry Moore { 732753a6d45SSherry Moore if (fb->fb_pte_list_size && fb->fb_pte_list_pa < endaddr) { 733753a6d45SSherry Moore contig_free((void *)fb->fb_pte_list_va, fb->fb_pte_list_size); 734753a6d45SSherry Moore fb->fb_pte_list_va = 0; 735753a6d45SSherry Moore fb->fb_pte_list_pa = 0; 736753a6d45SSherry Moore fb->fb_pte_list_size = 0; 737753a6d45SSherry Moore } 738753a6d45SSherry Moore } 739753a6d45SSherry Moore 740753a6d45SSherry Moore /* 741753a6d45SSherry Moore * Free up all the memory used for representing a kernel with 742753a6d45SSherry Moore * fastboot_info_t. 743753a6d45SSherry Moore */ 744753a6d45SSherry Moore static void 745753a6d45SSherry Moore fastboot_free_mem(fastboot_info_t *nk, uint64_t endaddr) 746753a6d45SSherry Moore { 747753a6d45SSherry Moore int i; 748753a6d45SSherry Moore 749753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 750753a6d45SSherry Moore fastboot_free_file(nk->fi_files + i); 751753a6d45SSherry Moore fastboot_free_file_pte(nk->fi_files + i, endaddr); 752753a6d45SSherry Moore } 753753a6d45SSherry Moore 754753a6d45SSherry Moore if (nk->fi_pagetable_size && nk->fi_pagetable_pa < endaddr) { 755753a6d45SSherry Moore contig_free((void *)nk->fi_pagetable_va, nk->fi_pagetable_size); 756753a6d45SSherry Moore nk->fi_pagetable_va = 0; 757753a6d45SSherry Moore nk->fi_pagetable_pa = 0; 758753a6d45SSherry Moore nk->fi_pagetable_size = 0; 759753a6d45SSherry Moore } 760753a6d45SSherry Moore 761753a6d45SSherry Moore if (nk->fi_mbi_size && nk->fi_new_mbi_pa < endaddr) { 762753a6d45SSherry Moore contig_free((void *)nk->fi_new_mbi_va, nk->fi_mbi_size); 763753a6d45SSherry Moore nk->fi_new_mbi_va = 0; 764753a6d45SSherry Moore nk->fi_new_mbi_pa = 0; 765753a6d45SSherry Moore nk->fi_mbi_size = 0; 766753a6d45SSherry Moore } 767753a6d45SSherry Moore } 768753a6d45SSherry Moore 
769753a6d45SSherry Moore /* 770753a6d45SSherry Moore * Only free up the memory allocated for the kernel and boot archive, 771753a6d45SSherry Moore * but not for the page tables. 772753a6d45SSherry Moore */ 773753a6d45SSherry Moore void 774753a6d45SSherry Moore fastboot_free_newkernel(fastboot_info_t *nk) 775753a6d45SSherry Moore { 776753a6d45SSherry Moore int i; 777753a6d45SSherry Moore 778753a6d45SSherry Moore nk->fi_valid = 0; 779753a6d45SSherry Moore /* 780753a6d45SSherry Moore * Free the memory we have allocated 781753a6d45SSherry Moore */ 782753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 783753a6d45SSherry Moore fastboot_free_file(&(nk->fi_files[i])); 784753a6d45SSherry Moore } 785753a6d45SSherry Moore } 786753a6d45SSherry Moore 787753a6d45SSherry Moore static void 788753a6d45SSherry Moore fastboot_cksum_cdata(fastboot_info_t *nk, uchar_t *md5_hash) 789753a6d45SSherry Moore { 790753a6d45SSherry Moore int i; 791753a6d45SSherry Moore MD5_CTX md5_ctx; 792753a6d45SSherry Moore 793753a6d45SSherry Moore MD5Init(&md5_ctx); 794753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 795753a6d45SSherry Moore MD5Update(&md5_ctx, nk->fi_files[i].fb_pte_list_va, 796753a6d45SSherry Moore nk->fi_files[i].fb_pte_list_size); 797753a6d45SSherry Moore } 798753a6d45SSherry Moore MD5Update(&md5_ctx, (void *)nk->fi_pagetable_va, nk->fi_pagetable_size); 799753a6d45SSherry Moore MD5Update(&md5_ctx, (void *)nk->fi_new_mbi_va, nk->fi_mbi_size); 800753a6d45SSherry Moore 801753a6d45SSherry Moore MD5Final(md5_hash, &md5_ctx); 802753a6d45SSherry Moore } 803753a6d45SSherry Moore 804753a6d45SSherry Moore /* 805753a6d45SSherry Moore * Generate MD5 checksum of the given kernel. 
806753a6d45SSherry Moore */ 807753a6d45SSherry Moore static void 808753a6d45SSherry Moore fastboot_cksum_generate(fastboot_info_t *nk) 809753a6d45SSherry Moore { 810753a6d45SSherry Moore int i; 811753a6d45SSherry Moore 812753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 813753a6d45SSherry Moore fastboot_cksum_file(nk->fi_files + i, nk->fi_md5_hash[i]); 814753a6d45SSherry Moore } 815753a6d45SSherry Moore fastboot_cksum_cdata(nk, nk->fi_md5_hash[i]); 816753a6d45SSherry Moore } 817753a6d45SSherry Moore 818753a6d45SSherry Moore /* 819753a6d45SSherry Moore * Calculate MD5 checksum of the given kernel and verify that 820753a6d45SSherry Moore * it matches with what was calculated before. 821753a6d45SSherry Moore */ 822753a6d45SSherry Moore int 823753a6d45SSherry Moore fastboot_cksum_verify(fastboot_info_t *nk) 824753a6d45SSherry Moore { 825753a6d45SSherry Moore int i; 826753a6d45SSherry Moore uchar_t md5_hash[MD5_DIGEST_LENGTH]; 827753a6d45SSherry Moore 828753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 829753a6d45SSherry Moore fastboot_cksum_file(nk->fi_files + i, md5_hash); 830753a6d45SSherry Moore if (bcmp(nk->fi_md5_hash[i], md5_hash, 831753a6d45SSherry Moore sizeof (nk->fi_md5_hash[i])) != 0) 832753a6d45SSherry Moore return (i + 1); 833753a6d45SSherry Moore } 834753a6d45SSherry Moore 835753a6d45SSherry Moore fastboot_cksum_cdata(nk, md5_hash); 836753a6d45SSherry Moore if (bcmp(nk->fi_md5_hash[i], md5_hash, 837753a6d45SSherry Moore sizeof (nk->fi_md5_hash[i])) != 0) 838753a6d45SSherry Moore return (i + 1); 839753a6d45SSherry Moore 840753a6d45SSherry Moore return (0); 8416bc8bc6aSSherry Moore } 8426bc8bc6aSSherry Moore 8436bc8bc6aSSherry Moore /* 8446bc8bc6aSSherry Moore * This function performs the following tasks: 8456bc8bc6aSSherry Moore * - Read the sizes of the new kernel and boot archive. 8466bc8bc6aSSherry Moore * - Allocate memory for the new kernel and boot archive. 
8476bc8bc6aSSherry Moore * - Allocate memory for page tables necessary for mapping the memory 8486bc8bc6aSSherry Moore * allocated for the files. 8496bc8bc6aSSherry Moore * - Read the new kernel and boot archive into memory. 8506bc8bc6aSSherry Moore * - Map in the fast reboot switcher. 8516bc8bc6aSSherry Moore * - Load the fast reboot switcher to FASTBOOT_SWTCH_PA. 8526bc8bc6aSSherry Moore * - Build the new multiboot_info structure 8536bc8bc6aSSherry Moore * - Build page tables for the low 1G of physical memory. 8546bc8bc6aSSherry Moore * - Mark the data structure as valid if all steps have succeeded. 8556bc8bc6aSSherry Moore */ 8566bc8bc6aSSherry Moore void 857753a6d45SSherry Moore fastboot_load_kernel(char *mdep) 8586bc8bc6aSSherry Moore { 8596bc8bc6aSSherry Moore void *buf = NULL; 8606bc8bc6aSSherry Moore int i; 8616bc8bc6aSSherry Moore fastboot_file_t *fb; 8626bc8bc6aSSherry Moore uint32_t dboot_start_offset; 8636bc8bc6aSSherry Moore char kern_bootpath[OBP_MAXPATHLEN]; 8646bc8bc6aSSherry Moore extern uintptr_t postbootkernelbase; 865753a6d45SSherry Moore uintptr_t saved_kernelbase; 8666bc8bc6aSSherry Moore int bootpath_len = 0; 8676bc8bc6aSSherry Moore int is_failsafe = 0; 8686bc8bc6aSSherry Moore int is_retry = 0; 8696bc8bc6aSSherry Moore uint64_t end_addr; 8706bc8bc6aSSherry Moore 8716bc8bc6aSSherry Moore ASSERT(fastreboot_capable); 8726bc8bc6aSSherry Moore 873753a6d45SSherry Moore if (newkernel.fi_valid) 874753a6d45SSherry Moore fastboot_free_newkernel(&newkernel); 875753a6d45SSherry Moore 876753a6d45SSherry Moore saved_kernelbase = postbootkernelbase; 877753a6d45SSherry Moore 8786bc8bc6aSSherry Moore postbootkernelbase = 0; 8796bc8bc6aSSherry Moore 8806bc8bc6aSSherry Moore /* 8816bc8bc6aSSherry Moore * Initialize various HAT related fields in the data structure 8826bc8bc6aSSherry Moore */ 8836bc8bc6aSSherry Moore fastboot_init_fields(&newkernel); 8846bc8bc6aSSherry Moore 8856bc8bc6aSSherry Moore bzero(kern_bootpath, OBP_MAXPATHLEN); 8866bc8bc6aSSherry Moore 
8876bc8bc6aSSherry Moore /* 8886bc8bc6aSSherry Moore * Process the boot argument 8896bc8bc6aSSherry Moore */ 890753a6d45SSherry Moore bzero(fastboot_args, OBP_MAXPATHLEN); 891753a6d45SSherry Moore fastboot_parse_mdep(mdep, kern_bootpath, &bootpath_len, fastboot_args); 89219397407SSherry Moore 89319397407SSherry Moore /* 89419397407SSherry Moore * Make sure we get the null character 89519397407SSherry Moore */ 89619397407SSherry Moore bcopy(kern_bootpath, fastboot_filename[FASTBOOT_NAME_UNIX], 89719397407SSherry Moore bootpath_len); 89819397407SSherry Moore bcopy(kern_bootfile, 89919397407SSherry Moore &fastboot_filename[FASTBOOT_NAME_UNIX][bootpath_len], 90019397407SSherry Moore strlen(kern_bootfile) + 1); 90119397407SSherry Moore 90219397407SSherry Moore bcopy(kern_bootpath, fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE], 90319397407SSherry Moore bootpath_len); 90419397407SSherry Moore 905753a6d45SSherry Moore if (bcmp(kern_bootfile, FAILSAFE_BOOTFILE32, 906753a6d45SSherry Moore (sizeof (FAILSAFE_BOOTFILE32) - 1)) == 0 || 907753a6d45SSherry Moore bcmp(kern_bootfile, FAILSAFE_BOOTFILE64, 908753a6d45SSherry Moore (sizeof (FAILSAFE_BOOTFILE64) - 1)) == 0) { 90919397407SSherry Moore is_failsafe = 1; 91019397407SSherry Moore } 91119397407SSherry Moore 9126bc8bc6aSSherry Moore load_kernel_retry: 91319397407SSherry Moore /* 91419397407SSherry Moore * Read in unix and boot_archive 91519397407SSherry Moore */ 9166bc8bc6aSSherry Moore end_addr = DBOOT_ENTRY_ADDRESS; 91719397407SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 9186bc8bc6aSSherry Moore struct _buf *file; 9196bc8bc6aSSherry Moore uintptr_t va; 92019397407SSherry Moore uint64_t fsize; 92119397407SSherry Moore size_t fsize_roundup, pt_size; 92219397407SSherry Moore int page_index; 92319397407SSherry Moore uintptr_t offset; 92419397407SSherry Moore ddi_dma_attr_t dma_attr = fastboot_dma_attr; 92519397407SSherry Moore 9266bc8bc6aSSherry Moore 92719397407SSherry Moore dprintf("fastboot_filename[%d] = 
%s\n", 92819397407SSherry Moore i, fastboot_filename[i]); 92919397407SSherry Moore 93019397407SSherry Moore if ((file = kobj_open_file(fastboot_filename[i])) == 93119397407SSherry Moore (struct _buf *)-1) { 93219397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Couldn't open %s", 93319397407SSherry Moore fastboot_filename[i]); 93419397407SSherry Moore goto err_out; 93519397407SSherry Moore } 93619397407SSherry Moore 93719397407SSherry Moore if (kobj_get_filesize(file, &fsize) != 0) { 93819397407SSherry Moore cmn_err(CE_WARN, 93919397407SSherry Moore "Fastboot: Couldn't get filesize for %s", 94019397407SSherry Moore fastboot_filename[i]); 94119397407SSherry Moore goto err_out; 94219397407SSherry Moore } 94319397407SSherry Moore 9446bc8bc6aSSherry Moore fsize_roundup = P2ROUNDUP_TYPED(fsize, PAGESIZE, size_t); 9456bc8bc6aSSherry Moore 9466bc8bc6aSSherry Moore /* 9476bc8bc6aSSherry Moore * Where the files end in physical memory after being 9486bc8bc6aSSherry Moore * relocated by the fast boot switcher. 9496bc8bc6aSSherry Moore */ 9506bc8bc6aSSherry Moore end_addr += fsize_roundup; 9516bc8bc6aSSherry Moore if (end_addr > fastboot_below_1G_dma_attr.dma_attr_addr_hi) { 9526bc8bc6aSSherry Moore cmn_err(CE_WARN, "Fastboot: boot archive is too big"); 9536bc8bc6aSSherry Moore goto err_out; 95419397407SSherry Moore } 95519397407SSherry Moore 9566bc8bc6aSSherry Moore /* 9576bc8bc6aSSherry Moore * Adjust dma_attr_addr_lo so that the new kernel and boot 9586bc8bc6aSSherry Moore * archive will not be overridden during relocation. 9596bc8bc6aSSherry Moore */ 9606bc8bc6aSSherry Moore if (end_addr > fastboot_dma_attr.dma_attr_addr_lo || 9616bc8bc6aSSherry Moore end_addr > fastboot_below_1G_dma_attr.dma_attr_addr_lo) { 9626bc8bc6aSSherry Moore 9636bc8bc6aSSherry Moore if (is_retry) { 9646bc8bc6aSSherry Moore /* 9656bc8bc6aSSherry Moore * If we have already tried and didn't succeed, 9666bc8bc6aSSherry Moore * just give up. 
9676bc8bc6aSSherry Moore */ 9686bc8bc6aSSherry Moore cmn_err(CE_WARN, 9696bc8bc6aSSherry Moore "Fastboot: boot archive is too big"); 9706bc8bc6aSSherry Moore goto err_out; 9716bc8bc6aSSherry Moore } else { 9726bc8bc6aSSherry Moore /* Set the flag so we don't keep retrying */ 9736bc8bc6aSSherry Moore is_retry++; 9746bc8bc6aSSherry Moore 9756bc8bc6aSSherry Moore /* Adjust dma_attr_addr_lo */ 9766bc8bc6aSSherry Moore fastboot_dma_attr.dma_attr_addr_lo = end_addr; 9776bc8bc6aSSherry Moore fastboot_below_1G_dma_attr.dma_attr_addr_lo = 9786bc8bc6aSSherry Moore end_addr; 9796bc8bc6aSSherry Moore 9806bc8bc6aSSherry Moore /* 9816bc8bc6aSSherry Moore * Free the memory we have already allocated 9826bc8bc6aSSherry Moore * whose physical addresses might not fit 9836bc8bc6aSSherry Moore * the new lo and hi constraints. 9846bc8bc6aSSherry Moore */ 985753a6d45SSherry Moore fastboot_free_mem(&newkernel, end_addr); 9866bc8bc6aSSherry Moore goto load_kernel_retry; 9876bc8bc6aSSherry Moore } 9886bc8bc6aSSherry Moore } 9896bc8bc6aSSherry Moore 9906bc8bc6aSSherry Moore 99119397407SSherry Moore if (!fastboot_contig) 99219397407SSherry Moore dma_attr.dma_attr_sgllen = (fsize / PAGESIZE) + 99319397407SSherry Moore (((fsize % PAGESIZE) == 0) ? 
0 : 1); 99419397407SSherry Moore 99519397407SSherry Moore if ((buf = contig_alloc(fsize, &dma_attr, PAGESIZE, 0)) 99619397407SSherry Moore == NULL) { 9976bc8bc6aSSherry Moore cmn_err(CE_WARN, fastboot_enomem_msg, fsize, "64G"); 99819397407SSherry Moore goto err_out; 99919397407SSherry Moore } 100019397407SSherry Moore 100119397407SSherry Moore va = P2ROUNDUP_TYPED((uintptr_t)buf, PAGESIZE, uintptr_t); 100219397407SSherry Moore 100319397407SSherry Moore if (kobj_read_file(file, (char *)va, fsize, 0) < 0) { 100419397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Couldn't read %s", 100519397407SSherry Moore fastboot_filename[i]); 100619397407SSherry Moore goto err_out; 100719397407SSherry Moore } 100819397407SSherry Moore 100919397407SSherry Moore fb = &newkernel.fi_files[i]; 101019397407SSherry Moore fb->fb_va = va; 101119397407SSherry Moore fb->fb_size = fsize; 101219397407SSherry Moore fb->fb_sectcnt = 0; 101319397407SSherry Moore 1014753a6d45SSherry Moore pt_size = FASTBOOT_PTE_LIST_SIZE(fsize_roundup); 101519397407SSherry Moore 1016753a6d45SSherry Moore /* 1017753a6d45SSherry Moore * If we have reserved memory but it not enough, free it. 
1018753a6d45SSherry Moore */ 1019753a6d45SSherry Moore if (fb->fb_pte_list_size && fb->fb_pte_list_size < pt_size) { 1020753a6d45SSherry Moore contig_free((void *)fb->fb_pte_list_va, 1021753a6d45SSherry Moore fb->fb_pte_list_size); 1022753a6d45SSherry Moore fb->fb_pte_list_size = 0; 1023753a6d45SSherry Moore } 1024753a6d45SSherry Moore 1025753a6d45SSherry Moore if (fb->fb_pte_list_size == 0) { 102619397407SSherry Moore if ((fb->fb_pte_list_va = 102719397407SSherry Moore (x86pte_t *)contig_alloc(pt_size, 1028753a6d45SSherry Moore &fastboot_below_1G_dma_attr, PAGESIZE, 0)) 1029753a6d45SSherry Moore == NULL) { 103019397407SSherry Moore cmn_err(CE_WARN, fastboot_enomem_msg, 103119397407SSherry Moore (uint64_t)pt_size, "1G"); 103219397407SSherry Moore goto err_out; 103319397407SSherry Moore } 1034753a6d45SSherry Moore /* 1035753a6d45SSherry Moore * fb_pte_list_size must be set after the allocation 1036753a6d45SSherry Moore * succeeds as it's used to determine how much memory to 1037753a6d45SSherry Moore * free. 
1038753a6d45SSherry Moore */ 1039753a6d45SSherry Moore fb->fb_pte_list_size = pt_size; 1040753a6d45SSherry Moore } 104119397407SSherry Moore 1042753a6d45SSherry Moore bzero((void *)(fb->fb_pte_list_va), fb->fb_pte_list_size); 104319397407SSherry Moore 104419397407SSherry Moore fb->fb_pte_list_pa = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat, 104519397407SSherry Moore (caddr_t)fb->fb_pte_list_va)); 104619397407SSherry Moore 104719397407SSherry Moore for (page_index = 0, offset = 0; offset < fb->fb_size; 104819397407SSherry Moore offset += PAGESIZE) { 104919397407SSherry Moore uint64_t paddr; 105019397407SSherry Moore 105119397407SSherry Moore paddr = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat, 105219397407SSherry Moore (caddr_t)fb->fb_va + offset)); 105319397407SSherry Moore 105419397407SSherry Moore ASSERT(paddr >= fastboot_dma_attr.dma_attr_addr_lo); 105519397407SSherry Moore 105619397407SSherry Moore /* 105719397407SSherry Moore * Include the pte_bits so we don't have to make 105819397407SSherry Moore * it in assembly. 
105919397407SSherry Moore */ 106019397407SSherry Moore fb->fb_pte_list_va[page_index++] = (x86pte_t) 106119397407SSherry Moore (paddr | pte_bits); 106219397407SSherry Moore } 106319397407SSherry Moore 106419397407SSherry Moore fb->fb_pte_list_va[page_index] = FASTBOOT_TERMINATE; 106519397407SSherry Moore 106619397407SSherry Moore if (i == FASTBOOT_UNIX) { 10676bc8bc6aSSherry Moore Ehdr *ehdr = (Ehdr *)va; 10686bc8bc6aSSherry Moore int j; 106919397407SSherry Moore 107019397407SSherry Moore /* 107119397407SSherry Moore * Sanity checks: 107219397407SSherry Moore */ 107319397407SSherry Moore for (j = 0; j < SELFMAG; j++) { 107419397407SSherry Moore if (ehdr->e_ident[j] != ELFMAG[j]) { 107519397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Bad ELF " 107619397407SSherry Moore "signature"); 107719397407SSherry Moore goto err_out; 107819397407SSherry Moore } 107919397407SSherry Moore } 108019397407SSherry Moore 108119397407SSherry Moore if (ehdr->e_ident[EI_CLASS] == ELFCLASS32 && 108219397407SSherry Moore ehdr->e_ident[EI_DATA] == ELFDATA2LSB && 108319397407SSherry Moore ehdr->e_machine == EM_386) { 108419397407SSherry Moore 1085877400d3SKonstantin Ananyev fb->fb_sectcnt = sizeof (fb->fb_sections) / 1086877400d3SKonstantin Ananyev sizeof (fb->fb_sections[0]); 1087877400d3SKonstantin Ananyev 108819397407SSherry Moore if (fastboot_elf32_find_loadables((void *)va, 108919397407SSherry Moore fsize, &fb->fb_sections[0], 109019397407SSherry Moore &fb->fb_sectcnt, &dboot_start_offset) < 0) { 109119397407SSherry Moore cmn_err(CE_WARN, "Fastboot: ELF32 " 109219397407SSherry Moore "program section failure"); 109319397407SSherry Moore goto err_out; 109419397407SSherry Moore } 109519397407SSherry Moore 109619397407SSherry Moore if (fb->fb_sectcnt == 0) { 109719397407SSherry Moore cmn_err(CE_WARN, "Fastboot: No ELF32 " 109819397407SSherry Moore "program sections found"); 109919397407SSherry Moore goto err_out; 110019397407SSherry Moore } 110119397407SSherry Moore 110219397407SSherry 
Moore if (is_failsafe) { 110319397407SSherry Moore /* Failsafe boot_archive */ 1104753a6d45SSherry Moore bcopy(BOOTARCHIVE32_FAILSAFE, 110519397407SSherry Moore &fastboot_filename 110619397407SSherry Moore [FASTBOOT_NAME_BOOTARCHIVE] 110719397407SSherry Moore [bootpath_len], 1108753a6d45SSherry Moore sizeof (BOOTARCHIVE32_FAILSAFE)); 110919397407SSherry Moore } else { 111019397407SSherry Moore bcopy(BOOTARCHIVE32, 111119397407SSherry Moore &fastboot_filename 111219397407SSherry Moore [FASTBOOT_NAME_BOOTARCHIVE] 111319397407SSherry Moore [bootpath_len], 111419397407SSherry Moore sizeof (BOOTARCHIVE32)); 111519397407SSherry Moore } 111619397407SSherry Moore 111719397407SSherry Moore } else if (ehdr->e_ident[EI_CLASS] == ELFCLASS64 && 111819397407SSherry Moore ehdr->e_ident[EI_DATA] == ELFDATA2LSB && 111919397407SSherry Moore ehdr->e_machine == EM_AMD64) { 112019397407SSherry Moore 112119397407SSherry Moore if (fastboot_elf64_find_dboot_load_offset( 112219397407SSherry Moore (void *)va, fsize, &dboot_start_offset) 112319397407SSherry Moore != 0) { 112419397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Couldn't " 112519397407SSherry Moore "find ELF64 dboot entry offset"); 112619397407SSherry Moore goto err_out; 112719397407SSherry Moore } 112819397407SSherry Moore 112919397407SSherry Moore if ((x86_feature & X86_64) == 0 || 1130877400d3SKonstantin Ananyev (x86_feature & X86_PAE) == 0) { 113119397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Cannot " 113219397407SSherry Moore "reboot to %s: " 113319397407SSherry Moore "not a 64-bit capable system", 113419397407SSherry Moore kern_bootfile); 113519397407SSherry Moore goto err_out; 113619397407SSherry Moore } 113719397407SSherry Moore 1138753a6d45SSherry Moore if (is_failsafe) { 1139753a6d45SSherry Moore /* Failsafe boot_archive */ 1140753a6d45SSherry Moore bcopy(BOOTARCHIVE64_FAILSAFE, 1141753a6d45SSherry Moore &fastboot_filename 1142753a6d45SSherry Moore [FASTBOOT_NAME_BOOTARCHIVE] 1143753a6d45SSherry Moore [bootpath_len], 
1144753a6d45SSherry Moore sizeof (BOOTARCHIVE64_FAILSAFE)); 1145753a6d45SSherry Moore } else { 114619397407SSherry Moore bcopy(BOOTARCHIVE64, 114719397407SSherry Moore &fastboot_filename 1148753a6d45SSherry Moore [FASTBOOT_NAME_BOOTARCHIVE] 1149753a6d45SSherry Moore [bootpath_len], 115019397407SSherry Moore sizeof (BOOTARCHIVE64)); 1151753a6d45SSherry Moore } 115219397407SSherry Moore } else { 115319397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Unknown ELF type"); 115419397407SSherry Moore goto err_out; 115519397407SSherry Moore } 115619397407SSherry Moore 115719397407SSherry Moore fb->fb_dest_pa = DBOOT_ENTRY_ADDRESS - 115819397407SSherry Moore dboot_start_offset; 115919397407SSherry Moore 116019397407SSherry Moore fb->fb_next_pa = DBOOT_ENTRY_ADDRESS + fsize_roundup; 116119397407SSherry Moore } else { 116219397407SSherry Moore fb->fb_dest_pa = newkernel.fi_files[i - 1].fb_next_pa; 116319397407SSherry Moore fb->fb_next_pa = fb->fb_dest_pa + fsize_roundup; 116419397407SSherry Moore } 116519397407SSherry Moore 116619397407SSherry Moore kobj_close_file(file); 116719397407SSherry Moore 11686bc8bc6aSSherry Moore } 11696bc8bc6aSSherry Moore 117019397407SSherry Moore /* 117119397407SSherry Moore * Add the function that will switch us to 32-bit protected mode 117219397407SSherry Moore */ 117319397407SSherry Moore fb = &newkernel.fi_files[FASTBOOT_SWTCH]; 117419397407SSherry Moore fb->fb_va = fb->fb_dest_pa = FASTBOOT_SWTCH_PA; 1175877400d3SKonstantin Ananyev fb->fb_size = MMU_PAGESIZE; 117619397407SSherry Moore 1177753a6d45SSherry Moore hat_devload(kas.a_hat, (caddr_t)fb->fb_va, 1178753a6d45SSherry Moore MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa), 1179753a6d45SSherry Moore PROT_READ | PROT_WRITE | PROT_EXEC, 1180753a6d45SSherry Moore HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK); 118119397407SSherry Moore 118219397407SSherry Moore /* 118319397407SSherry Moore * Build the new multiboot_info structure 118419397407SSherry Moore */ 1185753a6d45SSherry Moore if 
(fastboot_build_mbi(fastboot_args, &newkernel) != 0) { 118619397407SSherry Moore goto err_out; 118719397407SSherry Moore } 118819397407SSherry Moore 118919397407SSherry Moore /* 119019397407SSherry Moore * Build page table for low 1G physical memory. Use big pages. 1191877400d3SKonstantin Ananyev * Allocate 4 (5 for amd64) pages for the page tables. 1192877400d3SKonstantin Ananyev * 1 page for PML4 (amd64) 119319397407SSherry Moore * 1 page for Page-Directory-Pointer Table 1194877400d3SKonstantin Ananyev * 2 pages for Page Directory 119519397407SSherry Moore * 1 page for Page Table. 119619397407SSherry Moore * The page table entry will be rewritten to map the physical 119719397407SSherry Moore * address as we do the copying. 119819397407SSherry Moore */ 119919397407SSherry Moore if (newkernel.fi_has_pae) { 1200877400d3SKonstantin Ananyev #ifdef __amd64 1201877400d3SKonstantin Ananyev size_t size = MMU_PAGESIZE * 5; 1202877400d3SKonstantin Ananyev #else 120319397407SSherry Moore size_t size = MMU_PAGESIZE * 4; 1204877400d3SKonstantin Ananyev #endif /* __amd64 */ 120519397407SSherry Moore 1206753a6d45SSherry Moore if (newkernel.fi_pagetable_size && newkernel.fi_pagetable_size 1207753a6d45SSherry Moore < size) { 1208753a6d45SSherry Moore contig_free((void *)newkernel.fi_pagetable_va, 1209753a6d45SSherry Moore newkernel.fi_pagetable_size); 1210753a6d45SSherry Moore newkernel.fi_pagetable_size = 0; 1211753a6d45SSherry Moore } 1212753a6d45SSherry Moore 1213753a6d45SSherry Moore if (newkernel.fi_pagetable_size == 0) { 121419397407SSherry Moore if ((newkernel.fi_pagetable_va = (uintptr_t) 121519397407SSherry Moore contig_alloc(size, &fastboot_below_1G_dma_attr, 1216877400d3SKonstantin Ananyev MMU_PAGESIZE, 0)) == NULL) { 121719397407SSherry Moore cmn_err(CE_WARN, fastboot_enomem_msg, 121819397407SSherry Moore (uint64_t)size, "1G"); 121919397407SSherry Moore goto err_out; 122019397407SSherry Moore } 1221753a6d45SSherry Moore /* 1222753a6d45SSherry Moore * fi_pagetable_size 
must be set after the allocation 1223753a6d45SSherry Moore * succeeds as it's used to determine how much memory to 1224753a6d45SSherry Moore * free. 1225753a6d45SSherry Moore */ 1226753a6d45SSherry Moore newkernel.fi_pagetable_size = size; 1227753a6d45SSherry Moore } 122819397407SSherry Moore 122919397407SSherry Moore bzero((void *)(newkernel.fi_pagetable_va), size); 123019397407SSherry Moore 123119397407SSherry Moore newkernel.fi_pagetable_pa = 123219397407SSherry Moore mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat, 123319397407SSherry Moore (caddr_t)newkernel.fi_pagetable_va)); 123419397407SSherry Moore 123519397407SSherry Moore newkernel.fi_last_table_pa = newkernel.fi_pagetable_pa + 1236877400d3SKonstantin Ananyev size - MMU_PAGESIZE; 123719397407SSherry Moore 123819397407SSherry Moore newkernel.fi_next_table_va = newkernel.fi_pagetable_va + 123919397407SSherry Moore MMU_PAGESIZE; 124019397407SSherry Moore newkernel.fi_next_table_pa = newkernel.fi_pagetable_pa + 124119397407SSherry Moore MMU_PAGESIZE; 124219397407SSherry Moore 124319397407SSherry Moore fastboot_build_pagetables(&newkernel); 124419397407SSherry Moore } 124519397407SSherry Moore 124619397407SSherry Moore 1247753a6d45SSherry Moore /* Generate MD5 checksums */ 1248753a6d45SSherry Moore fastboot_cksum_generate(&newkernel); 1249753a6d45SSherry Moore 125019397407SSherry Moore /* Mark it as valid */ 125119397407SSherry Moore newkernel.fi_valid = 1; 125219397407SSherry Moore newkernel.fi_magic = FASTBOOT_MAGIC; 125319397407SSherry Moore 1254753a6d45SSherry Moore postbootkernelbase = saved_kernelbase; 125519397407SSherry Moore return; 125619397407SSherry Moore 125719397407SSherry Moore err_out: 1258753a6d45SSherry Moore postbootkernelbase = saved_kernelbase; 125919397407SSherry Moore newkernel.fi_valid = 0; 1260753a6d45SSherry Moore fastboot_free_newkernel(&newkernel); 1261753a6d45SSherry Moore } 1262753a6d45SSherry Moore 1263753a6d45SSherry Moore 1264753a6d45SSherry Moore /* ARGSUSED */ 1265753a6d45SSherry 
Moore static int 1266753a6d45SSherry Moore fastboot_xc_func(fastboot_info_t *nk, xc_arg_t unused2, xc_arg_t unused3) 1267753a6d45SSherry Moore { 1268753a6d45SSherry Moore void (*fastboot_func)(fastboot_info_t *); 1269753a6d45SSherry Moore fastboot_file_t *fb = &nk->fi_files[FASTBOOT_SWTCH]; 1270753a6d45SSherry Moore fastboot_func = (void (*)())(fb->fb_va); 1271753a6d45SSherry Moore kthread_t *t_intr = curthread->t_intr; 1272753a6d45SSherry Moore 1273753a6d45SSherry Moore if (&kas != curproc->p_as) { 1274753a6d45SSherry Moore hat_devload(curproc->p_as->a_hat, (caddr_t)fb->fb_va, 1275753a6d45SSherry Moore MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa), 1276753a6d45SSherry Moore PROT_READ | PROT_WRITE | PROT_EXEC, 1277753a6d45SSherry Moore HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK); 1278753a6d45SSherry Moore } 1279753a6d45SSherry Moore 1280753a6d45SSherry Moore /* 1281753a6d45SSherry Moore * If we have pinned a thread, make sure the address is mapped 1282753a6d45SSherry Moore * in the address space of the pinned thread. 1283753a6d45SSherry Moore */ 1284753a6d45SSherry Moore if (t_intr && t_intr->t_procp->p_as->a_hat != curproc->p_as->a_hat && 1285753a6d45SSherry Moore t_intr->t_procp->p_as != &kas) 1286753a6d45SSherry Moore hat_devload(t_intr->t_procp->p_as->a_hat, (caddr_t)fb->fb_va, 1287753a6d45SSherry Moore MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa), 1288753a6d45SSherry Moore PROT_READ | PROT_WRITE | PROT_EXEC, 1289753a6d45SSherry Moore HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK); 1290753a6d45SSherry Moore 1291753a6d45SSherry Moore (*psm_shutdownf)(A_SHUTDOWN, AD_FASTREBOOT); 1292753a6d45SSherry Moore (*fastboot_func)(nk); 1293753a6d45SSherry Moore 1294753a6d45SSherry Moore /*NOTREACHED*/ 1295753a6d45SSherry Moore return (0); 129619397407SSherry Moore } 129719397407SSherry Moore 12986bc8bc6aSSherry Moore /* 12996bc8bc6aSSherry Moore * Jump to the fast reboot switcher. This function never returns. 
13006bc8bc6aSSherry Moore */ 130119397407SSherry Moore void 130219397407SSherry Moore fast_reboot() 130319397407SSherry Moore { 1304753a6d45SSherry Moore processorid_t bootcpuid = 0; 1305753a6d45SSherry Moore extern uintptr_t postbootkernelbase; 1306753a6d45SSherry Moore extern char fb_swtch_image[]; 1307753a6d45SSherry Moore fastboot_file_t *fb; 1308753a6d45SSherry Moore int i; 130919397407SSherry Moore 1310753a6d45SSherry Moore postbootkernelbase = 0; 1311753a6d45SSherry Moore 1312753a6d45SSherry Moore fb = &newkernel.fi_files[FASTBOOT_SWTCH]; 1313753a6d45SSherry Moore 1314753a6d45SSherry Moore /* 1315753a6d45SSherry Moore * Map the address into both the current proc's address 1316753a6d45SSherry Moore * space and the kernel's address space in case the panic 1317753a6d45SSherry Moore * is forced by kmdb. 1318753a6d45SSherry Moore */ 1319753a6d45SSherry Moore if (&kas != curproc->p_as) { 1320753a6d45SSherry Moore hat_devload(curproc->p_as->a_hat, (caddr_t)fb->fb_va, 1321753a6d45SSherry Moore MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa), 1322753a6d45SSherry Moore PROT_READ | PROT_WRITE | PROT_EXEC, 1323753a6d45SSherry Moore HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK); 1324753a6d45SSherry Moore } 1325753a6d45SSherry Moore 1326753a6d45SSherry Moore bcopy((void *)fb_swtch_image, (void *)fb->fb_va, fb->fb_size); 1327753a6d45SSherry Moore 1328753a6d45SSherry Moore 1329753a6d45SSherry Moore /* 1330753a6d45SSherry Moore * Set fb_va to fake_va 1331753a6d45SSherry Moore */ 1332753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 1333753a6d45SSherry Moore newkernel.fi_files[i].fb_va = fake_va; 1334753a6d45SSherry Moore 1335753a6d45SSherry Moore } 1336753a6d45SSherry Moore 1337753a6d45SSherry Moore if (panicstr && CPU->cpu_id != bootcpuid && 1338753a6d45SSherry Moore CPU_ACTIVE(cpu_get(bootcpuid))) { 1339f34a7178SJoe Bonasera extern void panic_idle(void); 1340753a6d45SSherry Moore cpuset_t cpuset; 1341753a6d45SSherry Moore 1342753a6d45SSherry Moore CPUSET_ZERO(cpuset); 
1343753a6d45SSherry Moore CPUSET_ADD(cpuset, bootcpuid); 1344f34a7178SJoe Bonasera xc_priority((xc_arg_t)&newkernel, 0, 0, CPUSET2BV(cpuset), 1345753a6d45SSherry Moore (xc_func_t)fastboot_xc_func); 1346753a6d45SSherry Moore 1347f34a7178SJoe Bonasera panic_idle(); 1348753a6d45SSherry Moore } else 1349753a6d45SSherry Moore (void) fastboot_xc_func(&newkernel, 0, 0); 1350753a6d45SSherry Moore } 1351753a6d45SSherry Moore 1352753a6d45SSherry Moore 1353753a6d45SSherry Moore /* 1354753a6d45SSherry Moore * Get boot property value for fastreboot_onpanic. 1355753a6d45SSherry Moore * 1356753a6d45SSherry Moore * NOTE: If fastreboot_onpanic is set to non-zero in /etc/system, 1357753a6d45SSherry Moore * new setting passed in via "-B fastreboot_onpanic" is ignored. 1358753a6d45SSherry Moore * This order of precedence is to enable developers debugging panics 1359753a6d45SSherry Moore * that occur early in boot to utilize Fast Reboot on panic. 1360753a6d45SSherry Moore */ 1361753a6d45SSherry Moore static void 1362753a6d45SSherry Moore fastboot_get_bootprop(void) 1363753a6d45SSherry Moore { 1364753a6d45SSherry Moore int val = 0xaa, len, ret; 1365753a6d45SSherry Moore dev_info_t *devi; 1366753a6d45SSherry Moore char *propstr = NULL; 1367753a6d45SSherry Moore 1368753a6d45SSherry Moore devi = ddi_root_node(); 1369753a6d45SSherry Moore 1370753a6d45SSherry Moore ret = ddi_prop_lookup_string(DDI_DEV_T_ANY, devi, DDI_PROP_DONTPASS, 1371753a6d45SSherry Moore FASTREBOOT_ONPANIC, &propstr); 1372753a6d45SSherry Moore 1373753a6d45SSherry Moore if (ret == DDI_PROP_SUCCESS) { 1374753a6d45SSherry Moore if (FASTREBOOT_ONPANIC_NOTSET(propstr)) 1375753a6d45SSherry Moore val = 0; 1376753a6d45SSherry Moore else if (FASTREBOOT_ONPANIC_ISSET(propstr)) 1377753a6d45SSherry Moore val = UA_FASTREBOOT_ONPANIC; 1378753a6d45SSherry Moore 1379753a6d45SSherry Moore /* 1380753a6d45SSherry Moore * Only set fastreboot_onpanic to the value passed in 1381753a6d45SSherry Moore * if it's not already set to non-zero, and 
the value 1382753a6d45SSherry Moore * has indeed been passed in via command line. 1383753a6d45SSherry Moore */ 1384753a6d45SSherry Moore if (!fastreboot_onpanic && val != 0xaa) 1385753a6d45SSherry Moore fastreboot_onpanic = val; 1386753a6d45SSherry Moore ddi_prop_free(propstr); 1387753a6d45SSherry Moore } else if (ret != DDI_PROP_NOT_FOUND && ret != DDI_PROP_UNDEFINED) { 1388753a6d45SSherry Moore cmn_err(CE_WARN, "%s value is invalid, will be ignored", 1389753a6d45SSherry Moore FASTREBOOT_ONPANIC); 1390753a6d45SSherry Moore } 1391753a6d45SSherry Moore 1392753a6d45SSherry Moore len = sizeof (fastreboot_onpanic_cmdline); 1393753a6d45SSherry Moore ret = ddi_getlongprop_buf(DDI_DEV_T_ANY, devi, DDI_PROP_DONTPASS, 1394753a6d45SSherry Moore FASTREBOOT_ONPANIC_CMDLINE, fastreboot_onpanic_cmdline, &len); 1395753a6d45SSherry Moore 1396753a6d45SSherry Moore if (ret == DDI_PROP_BUF_TOO_SMALL) 1397753a6d45SSherry Moore cmn_err(CE_WARN, "%s value is too long, will be ignored", 1398753a6d45SSherry Moore FASTREBOOT_ONPANIC_CMDLINE); 1399753a6d45SSherry Moore } 1400753a6d45SSherry Moore 1401753a6d45SSherry Moore /* 1402753a6d45SSherry Moore * This function is called by main() to either load the backup kernel for panic 1403753a6d45SSherry Moore * fast reboot, or to reserve low physical memory for fast reboot. 
1404753a6d45SSherry Moore */ 1405753a6d45SSherry Moore void 1406753a6d45SSherry Moore fastboot_post_startup() 1407753a6d45SSherry Moore { 1408753a6d45SSherry Moore if (!fastreboot_capable) 1409753a6d45SSherry Moore return; 1410753a6d45SSherry Moore 1411753a6d45SSherry Moore fastboot_get_bootprop(); 1412753a6d45SSherry Moore 1413753a6d45SSherry Moore if (fastreboot_onpanic) 1414753a6d45SSherry Moore fastboot_load_kernel(fastreboot_onpanic_cmdline); 1415753a6d45SSherry Moore else if (reserve_mem_enabled) 1416753a6d45SSherry Moore fastboot_reserve_mem(&newkernel); 1417753a6d45SSherry Moore } 1418753a6d45SSherry Moore 1419753a6d45SSherry Moore /* 1420753a6d45SSherry Moore * Update boot configuration settings. 1421753a6d45SSherry Moore * If the new fastreboot_onpanic setting is false, and a kernel has 1422753a6d45SSherry Moore * been preloaded, free the memory; 1423753a6d45SSherry Moore * if the new fastreboot_onpanic setting is true and newkernel is 1424753a6d45SSherry Moore * not valid, load the new kernel. 1425753a6d45SSherry Moore */ 1426753a6d45SSherry Moore void 1427753a6d45SSherry Moore fastboot_update_config(const char *mdep) 1428753a6d45SSherry Moore { 1429753a6d45SSherry Moore uint8_t boot_config = (uint8_t)*mdep; 1430753a6d45SSherry Moore int cur_fastreboot_onpanic = fastreboot_onpanic; 1431753a6d45SSherry Moore 1432753a6d45SSherry Moore if (!fastreboot_capable) 1433753a6d45SSherry Moore return; 1434753a6d45SSherry Moore 1435753a6d45SSherry Moore fastreboot_onpanic = boot_config & UA_FASTREBOOT_ONPANIC; 1436753a6d45SSherry Moore if (fastreboot_onpanic && (!cur_fastreboot_onpanic || 1437753a6d45SSherry Moore !newkernel.fi_valid)) 1438753a6d45SSherry Moore fastboot_load_kernel(fastreboot_onpanic_cmdline); 1439753a6d45SSherry Moore if (cur_fastreboot_onpanic && !fastreboot_onpanic) 1440753a6d45SSherry Moore fastboot_free_newkernel(&newkernel); 144119397407SSherry Moore } 1442