119397407SSherry Moore /* 219397407SSherry Moore * CDDL HEADER START 319397407SSherry Moore * 419397407SSherry Moore * The contents of this file are subject to the terms of the 519397407SSherry Moore * Common Development and Distribution License (the "License"). 619397407SSherry Moore * You may not use this file except in compliance with the License. 719397407SSherry Moore * 819397407SSherry Moore * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 919397407SSherry Moore * or http://www.opensolaris.org/os/licensing. 1019397407SSherry Moore * See the License for the specific language governing permissions 1119397407SSherry Moore * and limitations under the License. 1219397407SSherry Moore * 1319397407SSherry Moore * When distributing Covered Code, include this CDDL HEADER in each 1419397407SSherry Moore * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 1519397407SSherry Moore * If applicable, add the following below this CDDL HEADER, with the 1619397407SSherry Moore * fields enclosed by brackets "[]" replaced with your own identifying 1719397407SSherry Moore * information: Portions Copyright [yyyy] [name of copyright owner] 1819397407SSherry Moore * 1919397407SSherry Moore * CDDL HEADER END 2019397407SSherry Moore */ 2119397407SSherry Moore 2219397407SSherry Moore /* 23753a6d45SSherry Moore * Copyright 2009 Sun Microsystems, Inc. All rights reserved. 2419397407SSherry Moore * Use is subject to license terms. 2519397407SSherry Moore */ 2619397407SSherry Moore 276bc8bc6aSSherry Moore /* 286bc8bc6aSSherry Moore * This file contains the functions for performing Fast Reboot -- a 296bc8bc6aSSherry Moore * reboot which bypasses the firmware and bootloader, considerably 306bc8bc6aSSherry Moore * reducing downtime. 316bc8bc6aSSherry Moore * 32753a6d45SSherry Moore * fastboot_load_kernel(): This function is invoked by mdpreboot() in the 33753a6d45SSherry Moore * reboot path. It loads the new kernel and boot archive into memory, builds 346bc8bc6aSSherry Moore * the data structure containing sufficient information about the new 356bc8bc6aSSherry Moore * kernel and boot archive to be passed to the fast reboot switcher 366bc8bc6aSSherry Moore * (see fb_swtch_src.s for details). When invoked the switcher relocates 376bc8bc6aSSherry Moore * the new kernel and boot archive to physically contiguous low memory, 386bc8bc6aSSherry Moore * similar to where the boot loader would have loaded them, and jumps to 396bc8bc6aSSherry Moore * the new kernel. 406bc8bc6aSSherry Moore * 41753a6d45SSherry Moore * If fastreboot_onpanic is enabled, fastboot_load_kernel() is called 42753a6d45SSherry Moore * by fastreboot_post_startup() to load the back up kernel in case of 43753a6d45SSherry Moore * panic. 44753a6d45SSherry Moore * 456bc8bc6aSSherry Moore * The physical addresses of the memory allocated for the new kernel, boot 466bc8bc6aSSherry Moore * archive and their page tables must be above where the boot archive ends 476bc8bc6aSSherry Moore * after it has been relocated by the switcher, otherwise the new files 486bc8bc6aSSherry Moore * and their page tables could be overridden during relocation. 496bc8bc6aSSherry Moore * 506bc8bc6aSSherry Moore * fast_reboot(): This function is invoked by mdboot() once it's determined 516bc8bc6aSSherry Moore * that the system is capable of fast reboot. It jumps to the fast reboot 52753a6d45SSherry Moore * switcher with the data structure built by fastboot_load_kernel() as the 53753a6d45SSherry Moore * argument. 546bc8bc6aSSherry Moore */ 5519397407SSherry Moore 5619397407SSherry Moore #include <sys/types.h> 5719397407SSherry Moore #include <sys/param.h> 5819397407SSherry Moore #include <sys/segments.h> 5919397407SSherry Moore #include <sys/sysmacros.h> 6019397407SSherry Moore #include <sys/vm.h> 6119397407SSherry Moore 6219397407SSherry Moore #include <sys/proc.h> 6319397407SSherry Moore #include <sys/buf.h> 6419397407SSherry Moore #include <sys/kmem.h> 6519397407SSherry Moore 6619397407SSherry Moore #include <sys/reboot.h> 6719397407SSherry Moore #include <sys/uadmin.h> 6819397407SSherry Moore 6919397407SSherry Moore #include <sys/cred.h> 7019397407SSherry Moore #include <sys/vnode.h> 7119397407SSherry Moore #include <sys/file.h> 7219397407SSherry Moore 7319397407SSherry Moore #include <sys/cmn_err.h> 7419397407SSherry Moore #include <sys/dumphdr.h> 7519397407SSherry Moore #include <sys/bootconf.h> 7619397407SSherry Moore #include <sys/ddidmareq.h> 7719397407SSherry Moore #include <sys/varargs.h> 7819397407SSherry Moore #include <sys/promif.h> 7919397407SSherry Moore #include <sys/modctl.h> 8019397407SSherry Moore 8119397407SSherry Moore #include <vm/hat.h> 8219397407SSherry Moore #include <vm/as.h> 8319397407SSherry Moore #include <vm/page.h> 8419397407SSherry Moore #include <vm/seg.h> 8519397407SSherry Moore #include <vm/hat_i86.h> 8619397407SSherry Moore #include <sys/vm_machparam.h> 8719397407SSherry Moore #include <sys/archsystm.h> 8819397407SSherry Moore #include <sys/machsystm.h> 8919397407SSherry Moore #include <sys/mman.h> 9019397407SSherry Moore #include <sys/x86_archext.h> 91753a6d45SSherry Moore #include <sys/smp_impldefs.h> 92753a6d45SSherry Moore #include <sys/spl.h> 9319397407SSherry Moore 9419397407SSherry Moore #include <sys/fastboot.h> 9519397407SSherry Moore #include <sys/machelf.h> 9619397407SSherry Moore #include <sys/kobj.h> 9719397407SSherry Moore #include <sys/multiboot.h> 98753a6d45SSherry Moore #include <sys/kobj_lex.h> 99753a6d45SSherry Moore 100753a6d45SSherry Moore /* 101753a6d45SSherry Moore * Macro to determine how many pages are needed for PTEs to map a particular 102753a6d45SSherry Moore * file. Allocate one extra page table entry for terminating the list. 103753a6d45SSherry Moore */ 104753a6d45SSherry Moore #define FASTBOOT_PTE_LIST_SIZE(fsize) \ 105753a6d45SSherry Moore P2ROUNDUP((((fsize) >> PAGESHIFT) + 1) * sizeof (x86pte_t), PAGESIZE) 10619397407SSherry Moore 1076bc8bc6aSSherry Moore /* 1086bc8bc6aSSherry Moore * Data structure containing necessary information for the fast reboot 1096bc8bc6aSSherry Moore * switcher to jump to the new kernel. 1106bc8bc6aSSherry Moore */ 11119397407SSherry Moore fastboot_info_t newkernel = { 0 }; 112753a6d45SSherry Moore char fastboot_args[OBP_MAXPATHLEN]; 1136bc8bc6aSSherry Moore 11419397407SSherry Moore static char fastboot_filename[2][OBP_MAXPATHLEN] = { { 0 }, { 0 }}; 11519397407SSherry Moore static x86pte_t ptp_bits = PT_VALID | PT_REF | PT_USER | PT_WRITABLE; 11619397407SSherry Moore static x86pte_t pte_bits = 11719397407SSherry Moore PT_VALID | PT_REF | PT_MOD | PT_NOCONSIST | PT_WRITABLE; 11819397407SSherry Moore static uint_t fastboot_shift_amt_pae[] = {12, 21, 30, 39}; 11919397407SSherry Moore 12019397407SSherry Moore int fastboot_debug = 0; 12119397407SSherry Moore int fastboot_contig = 0; 12219397407SSherry Moore 12319397407SSherry Moore /* 12419397407SSherry Moore * Fake starting va for new kernel and boot archive. 12519397407SSherry Moore */ 12619397407SSherry Moore static uintptr_t fake_va = FASTBOOT_FAKE_VA; 12719397407SSherry Moore 12819397407SSherry Moore /* 129753a6d45SSherry Moore * Reserve memory below PA 1G in preparation of fast reboot. 130753a6d45SSherry Moore * 131753a6d45SSherry Moore * This variable is only checked when fastreboot_capable is set, but 132753a6d45SSherry Moore * fastreboot_onpanic is not set. The amount of memory reserved 133753a6d45SSherry Moore * is negligible, but just in case we are really short of low memory, 134753a6d45SSherry Moore * this variable will give us a backdoor to not consume memory at all. 135753a6d45SSherry Moore */ 136753a6d45SSherry Moore int reserve_mem_enabled = 1; 137753a6d45SSherry Moore 138753a6d45SSherry Moore /* 139*c90a5fbeSSherry Moore * Mutex to protect fastreboot_onpanic. 140*c90a5fbeSSherry Moore */ 141*c90a5fbeSSherry Moore kmutex_t fastreboot_config_mutex; 142*c90a5fbeSSherry Moore 143*c90a5fbeSSherry Moore /* 144753a6d45SSherry Moore * Amount of memory below PA 1G to reserve for constructing the multiboot 145753a6d45SSherry Moore * data structure and the page tables as we tend to run out of those 146753a6d45SSherry Moore * when more drivers are loaded. 147753a6d45SSherry Moore */ 148753a6d45SSherry Moore static size_t fastboot_mbi_size = 0x2000; /* 8K */ 149753a6d45SSherry Moore static size_t fastboot_pagetable_size = 0x5000; /* 20K */ 150753a6d45SSherry Moore 151753a6d45SSherry Moore /* 152753a6d45SSherry Moore * Use below 1G for page tables as 153753a6d45SSherry Moore * 1. we are only doing 1:1 mapping of the bottom 1G of physical memory. 154753a6d45SSherry Moore * 2. we are using 2G as the fake virtual address for the new kernel and 155753a6d45SSherry Moore * boot archive. 15619397407SSherry Moore */ 15719397407SSherry Moore static ddi_dma_attr_t fastboot_below_1G_dma_attr = { 15819397407SSherry Moore DMA_ATTR_V0, 15919397407SSherry Moore 0x0000000008000000ULL, /* dma_attr_addr_lo: 128MB */ 16019397407SSherry Moore 0x000000003FFFFFFFULL, /* dma_attr_addr_hi: 1G */ 16119397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_count_max */ 16219397407SSherry Moore 0x0000000000001000ULL, /* dma_attr_align: 4KB */ 16319397407SSherry Moore 1, /* dma_attr_burstsize */ 16419397407SSherry Moore 1, /* dma_attr_minxfer */ 16519397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_maxxfer */ 16619397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_seg */ 16719397407SSherry Moore 1, /* dma_attr_sgllen */ 16819397407SSherry Moore 0x1000ULL, /* dma_attr_granular */ 16919397407SSherry Moore 0, /* dma_attr_flags */ 17019397407SSherry Moore }; 17119397407SSherry Moore 17219397407SSherry Moore static ddi_dma_attr_t fastboot_dma_attr = { 17319397407SSherry Moore DMA_ATTR_V0, 17419397407SSherry Moore 0x0000000008000000ULL, /* dma_attr_addr_lo: 128MB */ 175877400d3SKonstantin Ananyev #ifdef __amd64 176877400d3SKonstantin Ananyev 0xFFFFFFFFFFFFFFFFULL, /* dma_attr_addr_hi: 2^64B */ 177877400d3SKonstantin Ananyev #else 17819397407SSherry Moore 0x0000000FFFFFFFFFULL, /* dma_attr_addr_hi: 64GB */ 179877400d3SKonstantin Ananyev #endif /* __amd64 */ 18019397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_count_max */ 18119397407SSherry Moore 0x0000000000001000ULL, /* dma_attr_align: 4KB */ 18219397407SSherry Moore 1, /* dma_attr_burstsize */ 18319397407SSherry Moore 1, /* dma_attr_minxfer */ 18419397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_maxxfer */ 18519397407SSherry Moore 0x00000000FFFFFFFFULL, /* dma_attr_seg */ 18619397407SSherry Moore 1, /* dma_attr_sgllen */ 18719397407SSherry Moore 0x1000ULL, /* dma_attr_granular */ 18819397407SSherry Moore 0, /* dma_attr_flags */ 18919397407SSherry Moore }; 19019397407SSherry Moore 19119397407SSherry Moore /* 19219397407SSherry Moore * Various information saved from the previous boot to reconstruct 19319397407SSherry Moore * multiboot_info. 19419397407SSherry Moore */ 19519397407SSherry Moore extern multiboot_info_t saved_mbi; 19619397407SSherry Moore extern mb_memory_map_t saved_mmap[FASTBOOT_SAVED_MMAP_COUNT]; 1976915124bSKonstantin Ananyev extern uint8_t saved_drives[FASTBOOT_SAVED_DRIVES_SIZE]; 19819397407SSherry Moore extern char saved_cmdline[FASTBOOT_SAVED_CMDLINE_LEN]; 19919397407SSherry Moore extern int saved_cmdline_len; 200753a6d45SSherry Moore extern size_t saved_file_size[]; 20119397407SSherry Moore 20219397407SSherry Moore extern void* contig_alloc(size_t size, ddi_dma_attr_t *attr, 20319397407SSherry Moore uintptr_t align, int cansleep); 2046bc8bc6aSSherry Moore extern void contig_free(void *addr, size_t size); 2056bc8bc6aSSherry Moore 20619397407SSherry Moore 20719397407SSherry Moore /* PRINTLIKE */ 20819397407SSherry Moore extern void vprintf(const char *, va_list); 20919397407SSherry Moore 21019397407SSherry Moore 21119397407SSherry Moore /* 21219397407SSherry Moore * Need to be able to get boot_archives from other places 21319397407SSherry Moore */ 21419397407SSherry Moore #define BOOTARCHIVE64 "/platform/i86pc/amd64/boot_archive" 21519397407SSherry Moore #define BOOTARCHIVE32 "/platform/i86pc/boot_archive" 216753a6d45SSherry Moore #define BOOTARCHIVE32_FAILSAFE "/boot/x86.miniroot-safe" 217753a6d45SSherry Moore #define BOOTARCHIVE64_FAILSAFE "/boot/amd64/x86.miniroot-safe" 218753a6d45SSherry Moore #define FAILSAFE_BOOTFILE32 "/boot/platform/i86pc/kernel/unix" 219753a6d45SSherry Moore #define FAILSAFE_BOOTFILE64 "/boot/platform/i86pc/kernel/amd64/unix" 22019397407SSherry Moore 22119397407SSherry Moore static uint_t fastboot_vatoindex(fastboot_info_t *, uintptr_t, int); 22219397407SSherry Moore static void fastboot_map_with_size(fastboot_info_t *, uintptr_t, 22319397407SSherry Moore paddr_t, size_t, int); 22419397407SSherry Moore static void fastboot_build_pagetables(fastboot_info_t *); 22519397407SSherry Moore static int fastboot_build_mbi(char *, fastboot_info_t *); 226753a6d45SSherry Moore static void fastboot_free_file(fastboot_file_t *); 22719397407SSherry Moore 22819397407SSherry Moore static const char fastboot_enomem_msg[] = "Fastboot: Couldn't allocate 0x%" 22919397407SSherry Moore PRIx64" bytes below %s to do fast reboot"; 23019397407SSherry Moore 23119397407SSherry Moore static void 23219397407SSherry Moore dprintf(char *fmt, ...) 23319397407SSherry Moore { 23419397407SSherry Moore va_list adx; 23519397407SSherry Moore 23619397407SSherry Moore if (!fastboot_debug) 23719397407SSherry Moore return; 23819397407SSherry Moore 23919397407SSherry Moore va_start(adx, fmt); 24019397407SSherry Moore vprintf(fmt, adx); 24119397407SSherry Moore va_end(adx); 24219397407SSherry Moore } 24319397407SSherry Moore 24419397407SSherry Moore 24519397407SSherry Moore /* 24619397407SSherry Moore * Return the index corresponding to a virt address at a given page table level. 24719397407SSherry Moore */ 24819397407SSherry Moore static uint_t 24919397407SSherry Moore fastboot_vatoindex(fastboot_info_t *nk, uintptr_t va, int level) 25019397407SSherry Moore { 25119397407SSherry Moore return ((va >> nk->fi_shift_amt[level]) & (nk->fi_ptes_per_table - 1)); 25219397407SSherry Moore } 25319397407SSherry Moore 25419397407SSherry Moore 25519397407SSherry Moore /* 25619397407SSherry Moore * Add mapping from vstart to pstart for the specified size. 257877400d3SKonstantin Ananyev * vstart, pstart and size should all have been aligned at 2M boundaries. 25819397407SSherry Moore */ 25919397407SSherry Moore static void 26019397407SSherry Moore fastboot_map_with_size(fastboot_info_t *nk, uintptr_t vstart, paddr_t pstart, 26119397407SSherry Moore size_t size, int level) 26219397407SSherry Moore { 26319397407SSherry Moore x86pte_t pteval, *table; 26419397407SSherry Moore uintptr_t vaddr; 26519397407SSherry Moore paddr_t paddr; 26619397407SSherry Moore int index, l; 26719397407SSherry Moore 26819397407SSherry Moore table = (x86pte_t *)(nk->fi_pagetable_va); 26919397407SSherry Moore 27019397407SSherry Moore for (l = nk->fi_top_level; l >= level; l--) { 27119397407SSherry Moore 27219397407SSherry Moore index = fastboot_vatoindex(nk, vstart, l); 27319397407SSherry Moore 27419397407SSherry Moore if (l == level) { 27519397407SSherry Moore /* 27619397407SSherry Moore * Last level. Program the page table entries. 27719397407SSherry Moore */ 27819397407SSherry Moore for (vaddr = vstart, paddr = pstart; 27919397407SSherry Moore vaddr < vstart + size; 28019397407SSherry Moore vaddr += (1ULL << nk->fi_shift_amt[l]), 28119397407SSherry Moore paddr += (1ULL << nk->fi_shift_amt[l])) { 28219397407SSherry Moore 28319397407SSherry Moore uint_t index = fastboot_vatoindex(nk, vaddr, l); 28419397407SSherry Moore 28519397407SSherry Moore if (l > 0) 28619397407SSherry Moore pteval = paddr | pte_bits | PT_PAGESIZE; 28719397407SSherry Moore else 28819397407SSherry Moore pteval = paddr | pte_bits; 28919397407SSherry Moore 29019397407SSherry Moore table[index] = pteval; 29119397407SSherry Moore } 29219397407SSherry Moore } else if (table[index] & PT_VALID) { 29319397407SSherry Moore 29419397407SSherry Moore table = (x86pte_t *) 29519397407SSherry Moore ((uintptr_t)(((paddr_t)table[index] & MMU_PAGEMASK) 29619397407SSherry Moore - nk->fi_pagetable_pa) + nk->fi_pagetable_va); 29719397407SSherry Moore } else { 29819397407SSherry Moore /* 299877400d3SKonstantin Ananyev * Intermediate levels. 300877400d3SKonstantin Ananyev * Program with either valid bit or PTP bits. 30119397407SSherry Moore */ 30219397407SSherry Moore if (l == nk->fi_top_level) { 303877400d3SKonstantin Ananyev #ifdef __amd64 304877400d3SKonstantin Ananyev ASSERT(nk->fi_top_level == 3); 305877400d3SKonstantin Ananyev table[index] = nk->fi_next_table_pa | ptp_bits; 306877400d3SKonstantin Ananyev #else 30719397407SSherry Moore table[index] = nk->fi_next_table_pa | PT_VALID; 308877400d3SKonstantin Ananyev #endif /* __amd64 */ 30919397407SSherry Moore } else { 31019397407SSherry Moore table[index] = nk->fi_next_table_pa | ptp_bits; 31119397407SSherry Moore } 31219397407SSherry Moore table = (x86pte_t *)(nk->fi_next_table_va); 31319397407SSherry Moore nk->fi_next_table_va += MMU_PAGESIZE; 31419397407SSherry Moore nk->fi_next_table_pa += MMU_PAGESIZE; 31519397407SSherry Moore } 31619397407SSherry Moore } 31719397407SSherry Moore } 31819397407SSherry Moore 31919397407SSherry Moore /* 32019397407SSherry Moore * Build page tables for the lower 1G of physical memory using 2M 32119397407SSherry Moore * pages, and prepare page tables for mapping new kernel and boot 32219397407SSherry Moore * archive pages using 4K pages. 32319397407SSherry Moore */ 32419397407SSherry Moore static void 32519397407SSherry Moore fastboot_build_pagetables(fastboot_info_t *nk) 32619397407SSherry Moore { 32719397407SSherry Moore /* 32819397407SSherry Moore * Map lower 1G physical memory. Use large pages. 32919397407SSherry Moore */ 33019397407SSherry Moore fastboot_map_with_size(nk, 0, 0, ONE_GIG, 1); 33119397407SSherry Moore 33219397407SSherry Moore /* 33319397407SSherry Moore * Map one 4K page to get the middle page tables set up. 33419397407SSherry Moore */ 33519397407SSherry Moore fake_va = P2ALIGN_TYPED(fake_va, nk->fi_lpagesize, uintptr_t); 33619397407SSherry Moore fastboot_map_with_size(nk, fake_va, 33719397407SSherry Moore nk->fi_files[0].fb_pte_list_va[0] & MMU_PAGEMASK, PAGESIZE, 0); 33819397407SSherry Moore } 33919397407SSherry Moore 34019397407SSherry Moore 34119397407SSherry Moore /* 34219397407SSherry Moore * Sanity check. Look for dboot offset. 34319397407SSherry Moore */ 34419397407SSherry Moore static int 34519397407SSherry Moore fastboot_elf64_find_dboot_load_offset(void *img, off_t imgsz, uint32_t *offp) 34619397407SSherry Moore { 34719397407SSherry Moore Elf64_Ehdr *ehdr = (Elf64_Ehdr *)img; 34819397407SSherry Moore Elf64_Phdr *phdr; 34919397407SSherry Moore uint8_t *phdrbase; 35019397407SSherry Moore int i; 35119397407SSherry Moore 35219397407SSherry Moore if ((ehdr->e_phoff + ehdr->e_phnum * ehdr->e_phentsize) >= imgsz) 35319397407SSherry Moore return (-1); 35419397407SSherry Moore 35519397407SSherry Moore phdrbase = (uint8_t *)img + ehdr->e_phoff; 35619397407SSherry Moore 35719397407SSherry Moore for (i = 0; i < ehdr->e_phnum; i++) { 35819397407SSherry Moore phdr = (Elf64_Phdr *)(phdrbase + ehdr->e_phentsize * i); 35919397407SSherry Moore 36019397407SSherry Moore if (phdr->p_type == PT_LOAD) { 36119397407SSherry Moore if (phdr->p_vaddr == phdr->p_paddr && 36219397407SSherry Moore phdr->p_vaddr == DBOOT_ENTRY_ADDRESS) { 36319397407SSherry Moore ASSERT(phdr->p_offset <= UINT32_MAX); 36419397407SSherry Moore *offp = (uint32_t)phdr->p_offset; 36519397407SSherry Moore return (0); 36619397407SSherry Moore } 36719397407SSherry Moore } 36819397407SSherry Moore } 36919397407SSherry Moore 37019397407SSherry Moore return (-1); 37119397407SSherry Moore } 37219397407SSherry Moore 37319397407SSherry Moore 37419397407SSherry Moore /* 37519397407SSherry Moore * Initialize text and data section information for 32-bit kernel. 376877400d3SKonstantin Ananyev * sectcntp - is both input/output parameter. 377877400d3SKonstantin Ananyev * On entry, *sectcntp contains maximum allowable number of sections; 378877400d3SKonstantin Ananyev * on return, it contains the actual number of sections filled. 37919397407SSherry Moore */ 38019397407SSherry Moore static int 38119397407SSherry Moore fastboot_elf32_find_loadables(void *img, off_t imgsz, fastboot_section_t *sectp, 38219397407SSherry Moore int *sectcntp, uint32_t *offp) 38319397407SSherry Moore { 38419397407SSherry Moore Elf32_Ehdr *ehdr = (Elf32_Ehdr *)img; 38519397407SSherry Moore Elf32_Phdr *phdr; 38619397407SSherry Moore uint8_t *phdrbase; 38719397407SSherry Moore int i; 38819397407SSherry Moore int used_sections = 0; 389877400d3SKonstantin Ananyev const int max_sectcnt = *sectcntp; 39019397407SSherry Moore 39119397407SSherry Moore if ((ehdr->e_phoff + ehdr->e_phnum * ehdr->e_phentsize) >= imgsz) 39219397407SSherry Moore return (-1); 39319397407SSherry Moore 39419397407SSherry Moore phdrbase = (uint8_t *)img + ehdr->e_phoff; 39519397407SSherry Moore 39619397407SSherry Moore for (i = 0; i < ehdr->e_phnum; i++) { 39719397407SSherry Moore phdr = (Elf32_Phdr *)(phdrbase + ehdr->e_phentsize * i); 39819397407SSherry Moore 39919397407SSherry Moore if (phdr->p_type == PT_INTERP) 40019397407SSherry Moore return (-1); 40119397407SSherry Moore 40219397407SSherry Moore if (phdr->p_type != PT_LOAD) 40319397407SSherry Moore continue; 40419397407SSherry Moore 40519397407SSherry Moore if (phdr->p_vaddr == phdr->p_paddr && 40619397407SSherry Moore phdr->p_paddr == DBOOT_ENTRY_ADDRESS) { 40719397407SSherry Moore *offp = (uint32_t)phdr->p_offset; 40819397407SSherry Moore } else { 409877400d3SKonstantin Ananyev if (max_sectcnt <= used_sections) 410877400d3SKonstantin Ananyev return (-1); 411877400d3SKonstantin Ananyev 41219397407SSherry Moore sectp[used_sections].fb_sec_offset = phdr->p_offset; 41319397407SSherry Moore sectp[used_sections].fb_sec_paddr = phdr->p_paddr; 41419397407SSherry Moore sectp[used_sections].fb_sec_size = phdr->p_filesz; 41519397407SSherry Moore sectp[used_sections].fb_sec_bss_size = 41619397407SSherry Moore (phdr->p_filesz < phdr->p_memsz) ? 41719397407SSherry Moore (phdr->p_memsz - phdr->p_filesz) : 0; 41819397407SSherry Moore 419877400d3SKonstantin Ananyev /* Extra sanity check for the input object file */ 420877400d3SKonstantin Ananyev if (sectp[used_sections].fb_sec_paddr + 421877400d3SKonstantin Ananyev sectp[used_sections].fb_sec_size + 422877400d3SKonstantin Ananyev sectp[used_sections].fb_sec_bss_size >= 423877400d3SKonstantin Ananyev DBOOT_ENTRY_ADDRESS) 424877400d3SKonstantin Ananyev return (-1); 425877400d3SKonstantin Ananyev 42619397407SSherry Moore used_sections++; 42719397407SSherry Moore } 42819397407SSherry Moore } 42919397407SSherry Moore 43019397407SSherry Moore *sectcntp = used_sections; 43119397407SSherry Moore return (0); 43219397407SSherry Moore } 43319397407SSherry Moore 43419397407SSherry Moore /* 4351a6f4459SKonstantin Ananyev * Create multiboot info structure (mbi) base on the saved mbi. 4361a6f4459SKonstantin Ananyev * Recalculate values of the pointer type fields in the data 4371a6f4459SKonstantin Ananyev * structure based on the new starting physical address of the 4381a6f4459SKonstantin Ananyev * data structure. 43919397407SSherry Moore */ 44019397407SSherry Moore static int 44119397407SSherry Moore fastboot_build_mbi(char *mdep, fastboot_info_t *nk) 44219397407SSherry Moore { 44319397407SSherry Moore mb_module_t *mbp; 4441a6f4459SKonstantin Ananyev multiboot_info_t *mbi; /* pointer to multiboot structure */ 4451a6f4459SKonstantin Ananyev uintptr_t start_addr_va; /* starting VA of mbi */ 4461a6f4459SKonstantin Ananyev uintptr_t start_addr_pa; /* starting PA of mbi */ 4471a6f4459SKonstantin Ananyev size_t offs = 0; /* offset from the starting address */ 4481a6f4459SKonstantin Ananyev size_t arglen; /* length of the command line arg */ 4491a6f4459SKonstantin Ananyev size_t size; /* size of the memory reserved for mbi */ 4501a6f4459SKonstantin Ananyev size_t mdnsz; /* length of the boot archive name */ 45119397407SSherry Moore 4521a6f4459SKonstantin Ananyev /* 4531a6f4459SKonstantin Ananyev * If mdep is not NULL or empty, use the length of mdep + 1 4541a6f4459SKonstantin Ananyev * (for NULL terminating) as the length of the new command 4551a6f4459SKonstantin Ananyev * line; else use the saved command line length as the 4561a6f4459SKonstantin Ananyev * length for the new command line. 4571a6f4459SKonstantin Ananyev */ 4586bc8bc6aSSherry Moore if (mdep != NULL && strlen(mdep) != 0) { 45919397407SSherry Moore arglen = strlen(mdep) + 1; 46019397407SSherry Moore } else { 46119397407SSherry Moore arglen = saved_cmdline_len; 46219397407SSherry Moore } 46319397407SSherry Moore 4641a6f4459SKonstantin Ananyev /* 4651a6f4459SKonstantin Ananyev * Allocate memory for the new multiboot info structure (mbi). 4661a6f4459SKonstantin Ananyev * If we have reserved memory for mbi but it's not enough, 4671a6f4459SKonstantin Ananyev * free it and reallocate. 4681a6f4459SKonstantin Ananyev */ 46919397407SSherry Moore size = PAGESIZE + P2ROUNDUP(arglen, PAGESIZE); 470753a6d45SSherry Moore if (nk->fi_mbi_size && nk->fi_mbi_size < size) { 471753a6d45SSherry Moore contig_free((void *)nk->fi_new_mbi_va, nk->fi_mbi_size); 472753a6d45SSherry Moore nk->fi_mbi_size = 0; 47319397407SSherry Moore } 47419397407SSherry Moore 475753a6d45SSherry Moore if (nk->fi_mbi_size == 0) { 476753a6d45SSherry Moore if ((nk->fi_new_mbi_va = 477753a6d45SSherry Moore (uintptr_t)contig_alloc(size, &fastboot_below_1G_dma_attr, 478753a6d45SSherry Moore PAGESIZE, 0)) == NULL) { 479753a6d45SSherry Moore cmn_err(CE_WARN, fastboot_enomem_msg, 480753a6d45SSherry Moore (uint64_t)size, "1G"); 481753a6d45SSherry Moore return (-1); 482753a6d45SSherry Moore } 483753a6d45SSherry Moore /* 484753a6d45SSherry Moore * fi_mbi_size must be set after the allocation succeeds 485753a6d45SSherry Moore * as it's used to determine how much memory to free. 486753a6d45SSherry Moore */ 487753a6d45SSherry Moore nk->fi_mbi_size = size; 488753a6d45SSherry Moore } 48919397407SSherry Moore 4901a6f4459SKonstantin Ananyev /* 4911a6f4459SKonstantin Ananyev * Initalize memory 4921a6f4459SKonstantin Ananyev */ 493753a6d45SSherry Moore bzero((void *)nk->fi_new_mbi_va, nk->fi_mbi_size); 49419397407SSherry Moore 4951a6f4459SKonstantin Ananyev /* 4961a6f4459SKonstantin Ananyev * Get PA for the new mbi 4971a6f4459SKonstantin Ananyev */ 4981a6f4459SKonstantin Ananyev start_addr_va = nk->fi_new_mbi_va; 4991a6f4459SKonstantin Ananyev start_addr_pa = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat, 5001a6f4459SKonstantin Ananyev (caddr_t)start_addr_va)); 5011a6f4459SKonstantin Ananyev nk->fi_new_mbi_pa = (paddr_t)start_addr_pa; 502753a6d45SSherry Moore 503753a6d45SSherry Moore /* 5041a6f4459SKonstantin Ananyev * Populate the rest of the fields in the data structure 505753a6d45SSherry Moore */ 506753a6d45SSherry Moore 5071a6f4459SKonstantin Ananyev /* 5081a6f4459SKonstantin Ananyev * Copy from the saved mbi to preserve all non-pointer type fields. 5091a6f4459SKonstantin Ananyev */ 5101a6f4459SKonstantin Ananyev mbi = (multiboot_info_t *)start_addr_va; 5111a6f4459SKonstantin Ananyev bcopy(&saved_mbi, mbi, sizeof (*mbi)); 51219397407SSherry Moore 5131a6f4459SKonstantin Ananyev /* 5141a6f4459SKonstantin Ananyev * Recalculate mods_addr. Set mod_start and mod_end based on 5151a6f4459SKonstantin Ananyev * the physical address of the new boot archive. Set mod_name 5161a6f4459SKonstantin Ananyev * to the name of the new boto archive. 5171a6f4459SKonstantin Ananyev */ 5181a6f4459SKonstantin Ananyev offs += sizeof (multiboot_info_t); 5191a6f4459SKonstantin Ananyev mbi->mods_addr = start_addr_pa + offs; 5201a6f4459SKonstantin Ananyev mbp = (mb_module_t *)(start_addr_va + offs); 521753a6d45SSherry Moore mbp->mod_start = nk->fi_files[FASTBOOT_BOOTARCHIVE].fb_dest_pa; 522753a6d45SSherry Moore mbp->mod_end = nk->fi_files[FASTBOOT_BOOTARCHIVE].fb_next_pa; 52319397407SSherry Moore 5241a6f4459SKonstantin Ananyev offs += sizeof (mb_module_t); 5251a6f4459SKonstantin Ananyev mdnsz = strlen(fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE]) + 1; 5261a6f4459SKonstantin Ananyev bcopy(fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE], 5271a6f4459SKonstantin Ananyev (void *)(start_addr_va + offs), mdnsz); 5281a6f4459SKonstantin Ananyev mbp->mod_name = start_addr_pa + offs; 52919397407SSherry Moore mbp->reserved = 0; 53019397407SSherry Moore 5311a6f4459SKonstantin Ananyev /* 5321a6f4459SKonstantin Ananyev * Make sure the offset is 16-byte aligned to avoid unaligned access. 5331a6f4459SKonstantin Ananyev */ 5341a6f4459SKonstantin Ananyev offs += mdnsz; 5351a6f4459SKonstantin Ananyev offs = P2ROUNDUP_TYPED(offs, 16, size_t); 5361a6f4459SKonstantin Ananyev 5371a6f4459SKonstantin Ananyev /* 5381a6f4459SKonstantin Ananyev * Recalculate mmap_addr 5391a6f4459SKonstantin Ananyev */ 5401a6f4459SKonstantin Ananyev mbi->mmap_addr = start_addr_pa + offs; 5411a6f4459SKonstantin Ananyev bcopy((void *)(uintptr_t)saved_mmap, (void *)(start_addr_va + offs), 54219397407SSherry Moore saved_mbi.mmap_length); 5431a6f4459SKonstantin Ananyev offs += saved_mbi.mmap_length; 54419397407SSherry Moore 5451a6f4459SKonstantin Ananyev /* 5461a6f4459SKonstantin Ananyev * Recalculate drives_addr 5471a6f4459SKonstantin Ananyev */ 5481a6f4459SKonstantin Ananyev mbi->drives_addr = start_addr_pa + offs; 5491a6f4459SKonstantin Ananyev bcopy((void *)(uintptr_t)saved_drives, (void *)(start_addr_va + offs), 55019397407SSherry Moore saved_mbi.drives_length); 5511a6f4459SKonstantin Ananyev offs += saved_mbi.drives_length; 55219397407SSherry Moore 5531a6f4459SKonstantin Ananyev /* 5541a6f4459SKonstantin Ananyev * Recalculate the address of cmdline. Set cmdline to contain the 5551a6f4459SKonstantin Ananyev * new boot argument. 5561a6f4459SKonstantin Ananyev */ 5571a6f4459SKonstantin Ananyev mbi->cmdline = start_addr_pa + offs; 55819397407SSherry Moore 5596bc8bc6aSSherry Moore if (mdep != NULL && strlen(mdep) != 0) { 5601a6f4459SKonstantin Ananyev bcopy(mdep, (void *)(start_addr_va + offs), arglen); 56119397407SSherry Moore } else { 5621a6f4459SKonstantin Ananyev bcopy((void *)saved_cmdline, (void *)(start_addr_va + offs), 5631a6f4459SKonstantin Ananyev arglen); 56419397407SSherry Moore } 56519397407SSherry Moore 5666915124bSKonstantin Ananyev /* clear fields and flags that are not copied */ 5676915124bSKonstantin Ananyev bzero(&mbi->config_table, 5686915124bSKonstantin Ananyev sizeof (*mbi) - offsetof(multiboot_info_t, config_table)); 5696915124bSKonstantin Ananyev mbi->flags &= ~(MB_INFO_CONFIG_TABLE | MB_INFO_BOOT_LOADER_NAME | 5706915124bSKonstantin Ananyev MB_INFO_APM_TABLE | MB_INFO_VIDEO_INFO); 5716915124bSKonstantin Ananyev 57219397407SSherry Moore return (0); 57319397407SSherry Moore } 57419397407SSherry Moore 5756bc8bc6aSSherry Moore /* 5766bc8bc6aSSherry Moore * Initialize HAT related fields 5776bc8bc6aSSherry Moore */ 5786bc8bc6aSSherry Moore static void 5796bc8bc6aSSherry Moore fastboot_init_fields(fastboot_info_t *nk) 58019397407SSherry Moore { 58119397407SSherry Moore if (x86_feature & X86_PAE) { 5826bc8bc6aSSherry Moore nk->fi_has_pae = 1; 5836bc8bc6aSSherry Moore nk->fi_shift_amt = fastboot_shift_amt_pae; 5846bc8bc6aSSherry Moore nk->fi_ptes_per_table = 512; 5856bc8bc6aSSherry Moore nk->fi_lpagesize = (2 << 20); /* 2M */ 586877400d3SKonstantin Ananyev #ifdef __amd64 587877400d3SKonstantin Ananyev nk->fi_top_level = 3; 588877400d3SKonstantin Ananyev #else 5896bc8bc6aSSherry Moore nk->fi_top_level = 2; 590877400d3SKonstantin Ananyev #endif /* __amd64 */ 5916bc8bc6aSSherry Moore } 59219397407SSherry Moore } 59319397407SSherry Moore 5946bc8bc6aSSherry Moore /* 5956bc8bc6aSSherry Moore * Process boot argument 5966bc8bc6aSSherry Moore */ 5976bc8bc6aSSherry Moore static void 5986bc8bc6aSSherry Moore fastboot_parse_mdep(char *mdep, char *kern_bootpath, int *bootpath_len, 5996bc8bc6aSSherry Moore char *bootargs) 6006bc8bc6aSSherry Moore { 6016bc8bc6aSSherry Moore int i; 60219397407SSherry Moore 60319397407SSherry Moore /* 60419397407SSherry Moore * If mdep is not NULL, it comes in the format of 60519397407SSherry Moore * mountpoint unix args 60619397407SSherry Moore */ 6076bc8bc6aSSherry Moore if (mdep != NULL && strlen(mdep) != 0) { 60819397407SSherry Moore if (mdep[0] != '-') { 60919397407SSherry Moore /* First get the root argument */ 61019397407SSherry Moore i = 0; 61119397407SSherry Moore while (mdep[i] != '\0' && mdep[i] != ' ') { 61219397407SSherry Moore i++; 61319397407SSherry Moore } 61419397407SSherry Moore 61519397407SSherry Moore if (i < 4 || strncmp(&mdep[i-4], "unix", 4) != 0) { 61619397407SSherry Moore /* mount point */ 61719397407SSherry Moore bcopy(mdep, kern_bootpath, i); 61819397407SSherry Moore kern_bootpath[i] = '\0'; 6196bc8bc6aSSherry Moore *bootpath_len = i; 62019397407SSherry Moore 62119397407SSherry Moore /* 62219397407SSherry Moore * Get the next argument. It should be unix as 62319397407SSherry Moore * we have validated in in halt.c. 62419397407SSherry Moore */ 62519397407SSherry Moore if (strlen(mdep) > i) { 62619397407SSherry Moore mdep += (i + 1); 62719397407SSherry Moore i = 0; 62819397407SSherry Moore while (mdep[i] != '\0' && 62919397407SSherry Moore mdep[i] != ' ') { 63019397407SSherry Moore i++; 63119397407SSherry Moore } 63219397407SSherry Moore } 63319397407SSherry Moore 63419397407SSherry Moore } 63519397407SSherry Moore bcopy(mdep, kern_bootfile, i); 63619397407SSherry Moore kern_bootfile[i] = '\0'; 6376bc8bc6aSSherry Moore bcopy(mdep, bootargs, strlen(mdep)); 63819397407SSherry Moore } else { 63919397407SSherry Moore int off = strlen(kern_bootfile); 64019397407SSherry Moore bcopy(kern_bootfile, bootargs, off); 64119397407SSherry Moore bcopy(" ", &bootargs[off++], 1); 64219397407SSherry Moore bcopy(mdep, &bootargs[off], strlen(mdep)); 64319397407SSherry Moore off += strlen(mdep); 64419397407SSherry Moore bootargs[off] = '\0'; 64519397407SSherry Moore } 64619397407SSherry Moore } 6476bc8bc6aSSherry Moore } 6486bc8bc6aSSherry Moore 6496bc8bc6aSSherry Moore /* 650753a6d45SSherry Moore * Reserve memory under PA 1G for mapping the new kernel and boot archive. 651753a6d45SSherry Moore * This function is only called if fastreboot_onpanic is *not* set. 652753a6d45SSherry Moore */ 653753a6d45SSherry Moore static void 654753a6d45SSherry Moore fastboot_reserve_mem(fastboot_info_t *nk) 655753a6d45SSherry Moore { 656753a6d45SSherry Moore int i; 657753a6d45SSherry Moore 658753a6d45SSherry Moore /* 659753a6d45SSherry Moore * A valid kernel is in place. No need to reserve any memory. 660753a6d45SSherry Moore */ 661753a6d45SSherry Moore if (nk->fi_valid) 662753a6d45SSherry Moore return; 663753a6d45SSherry Moore 664753a6d45SSherry Moore /* 665753a6d45SSherry Moore * Reserve memory under PA 1G for PTE lists. 666753a6d45SSherry Moore */ 667753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 668753a6d45SSherry Moore fastboot_file_t *fb = &nk->fi_files[i]; 669753a6d45SSherry Moore size_t fsize_roundup, size; 670753a6d45SSherry Moore 671753a6d45SSherry Moore fsize_roundup = P2ROUNDUP_TYPED(saved_file_size[i], 672753a6d45SSherry Moore PAGESIZE, size_t); 673753a6d45SSherry Moore size = FASTBOOT_PTE_LIST_SIZE(fsize_roundup); 674753a6d45SSherry Moore if ((fb->fb_pte_list_va = contig_alloc(size, 675753a6d45SSherry Moore &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) { 676753a6d45SSherry Moore return; 677753a6d45SSherry Moore } 678753a6d45SSherry Moore fb->fb_pte_list_size = size; 679753a6d45SSherry Moore } 680753a6d45SSherry Moore 681753a6d45SSherry Moore /* 682753a6d45SSherry Moore * Reserve memory under PA 1G for page tables. 683753a6d45SSherry Moore */ 684753a6d45SSherry Moore if ((nk->fi_pagetable_va = 685753a6d45SSherry Moore (uintptr_t)contig_alloc(fastboot_pagetable_size, 686753a6d45SSherry Moore &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) { 687753a6d45SSherry Moore return; 688753a6d45SSherry Moore } 689753a6d45SSherry Moore nk->fi_pagetable_size = fastboot_pagetable_size; 690753a6d45SSherry Moore 691753a6d45SSherry Moore /* 692753a6d45SSherry Moore * Reserve memory under PA 1G for multiboot structure. 693753a6d45SSherry Moore */ 694753a6d45SSherry Moore if ((nk->fi_new_mbi_va = (uintptr_t)contig_alloc(fastboot_mbi_size, 695753a6d45SSherry Moore &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) { 696753a6d45SSherry Moore return; 697753a6d45SSherry Moore } 698753a6d45SSherry Moore nk->fi_mbi_size = fastboot_mbi_size; 699753a6d45SSherry Moore } 700753a6d45SSherry Moore 701753a6d45SSherry Moore /* 702753a6d45SSherry Moore * Calculate MD5 digest for the given fastboot_file. 703753a6d45SSherry Moore * Assumes that the file is allready loaded properly. 704753a6d45SSherry Moore */ 705753a6d45SSherry Moore static void 706753a6d45SSherry Moore fastboot_cksum_file(fastboot_file_t *fb, uchar_t *md5_hash) 707753a6d45SSherry Moore { 708753a6d45SSherry Moore MD5_CTX md5_ctx; 709753a6d45SSherry Moore 710753a6d45SSherry Moore MD5Init(&md5_ctx); 711753a6d45SSherry Moore MD5Update(&md5_ctx, (void *)fb->fb_va, fb->fb_size); 712753a6d45SSherry Moore MD5Final(md5_hash, &md5_ctx); 713753a6d45SSherry Moore } 714753a6d45SSherry Moore 715753a6d45SSherry Moore /* 716753a6d45SSherry Moore * Free up the memory we have allocated for a file 7176bc8bc6aSSherry Moore */ 7186bc8bc6aSSherry Moore static void 7196bc8bc6aSSherry Moore fastboot_free_file(fastboot_file_t *fb) 7206bc8bc6aSSherry Moore { 721753a6d45SSherry Moore size_t fsize_roundup; 7226bc8bc6aSSherry Moore 7236bc8bc6aSSherry Moore fsize_roundup = P2ROUNDUP_TYPED(fb->fb_size, PAGESIZE, size_t); 724753a6d45SSherry Moore if (fsize_roundup) { 7256bc8bc6aSSherry Moore contig_free((void *)fb->fb_va, fsize_roundup); 726753a6d45SSherry Moore fb->fb_va = NULL; 727753a6d45SSherry Moore fb->fb_size = 0; 728753a6d45SSherry Moore } 729753a6d45SSherry Moore } 7306bc8bc6aSSherry Moore 731753a6d45SSherry Moore /* 732753a6d45SSherry Moore * Free up memory used by the PTEs for a file. 733753a6d45SSherry Moore */ 734753a6d45SSherry Moore static void 735753a6d45SSherry Moore fastboot_free_file_pte(fastboot_file_t *fb, uint64_t endaddr) 736753a6d45SSherry Moore { 737753a6d45SSherry Moore if (fb->fb_pte_list_size && fb->fb_pte_list_pa < endaddr) { 738753a6d45SSherry Moore contig_free((void *)fb->fb_pte_list_va, fb->fb_pte_list_size); 739753a6d45SSherry Moore fb->fb_pte_list_va = 0; 740753a6d45SSherry Moore fb->fb_pte_list_pa = 0; 741753a6d45SSherry Moore fb->fb_pte_list_size = 0; 742753a6d45SSherry Moore } 743753a6d45SSherry Moore } 744753a6d45SSherry Moore 745753a6d45SSherry Moore /* 746753a6d45SSherry Moore * Free up all the memory used for representing a kernel with 747753a6d45SSherry Moore * fastboot_info_t. 748753a6d45SSherry Moore */ 749753a6d45SSherry Moore static void 750753a6d45SSherry Moore fastboot_free_mem(fastboot_info_t *nk, uint64_t endaddr) 751753a6d45SSherry Moore { 752753a6d45SSherry Moore int i; 753753a6d45SSherry Moore 754753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 755753a6d45SSherry Moore fastboot_free_file(nk->fi_files + i); 756753a6d45SSherry Moore fastboot_free_file_pte(nk->fi_files + i, endaddr); 757753a6d45SSherry Moore } 758753a6d45SSherry Moore 759753a6d45SSherry Moore if (nk->fi_pagetable_size && nk->fi_pagetable_pa < endaddr) { 760753a6d45SSherry Moore contig_free((void *)nk->fi_pagetable_va, nk->fi_pagetable_size); 761753a6d45SSherry Moore nk->fi_pagetable_va = 0; 762753a6d45SSherry Moore nk->fi_pagetable_pa = 0; 763753a6d45SSherry Moore nk->fi_pagetable_size = 0; 764753a6d45SSherry Moore } 765753a6d45SSherry Moore 766753a6d45SSherry Moore if (nk->fi_mbi_size && nk->fi_new_mbi_pa < endaddr) { 767753a6d45SSherry Moore contig_free((void *)nk->fi_new_mbi_va, nk->fi_mbi_size); 768753a6d45SSherry Moore nk->fi_new_mbi_va = 0; 769753a6d45SSherry Moore nk->fi_new_mbi_pa = 0; 770753a6d45SSherry Moore nk->fi_mbi_size = 0; 771753a6d45SSherry Moore } 772753a6d45SSherry Moore } 773753a6d45SSherry Moore 774753a6d45SSherry Moore /* 775753a6d45SSherry Moore * Only free up the memory allocated for the kernel and boot archive, 776753a6d45SSherry Moore * but not for the page tables. 777753a6d45SSherry Moore */ 778753a6d45SSherry Moore void 779753a6d45SSherry Moore fastboot_free_newkernel(fastboot_info_t *nk) 780753a6d45SSherry Moore { 781753a6d45SSherry Moore int i; 782753a6d45SSherry Moore 783753a6d45SSherry Moore nk->fi_valid = 0; 784753a6d45SSherry Moore /* 785753a6d45SSherry Moore * Free the memory we have allocated 786753a6d45SSherry Moore */ 787753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 788753a6d45SSherry Moore fastboot_free_file(&(nk->fi_files[i])); 789753a6d45SSherry Moore } 790753a6d45SSherry Moore } 791753a6d45SSherry Moore 792753a6d45SSherry Moore static void 793753a6d45SSherry Moore fastboot_cksum_cdata(fastboot_info_t *nk, uchar_t *md5_hash) 794753a6d45SSherry Moore { 795753a6d45SSherry Moore int i; 796753a6d45SSherry Moore MD5_CTX md5_ctx; 797753a6d45SSherry Moore 798753a6d45SSherry Moore MD5Init(&md5_ctx); 799753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 800753a6d45SSherry Moore MD5Update(&md5_ctx, nk->fi_files[i].fb_pte_list_va, 801753a6d45SSherry Moore nk->fi_files[i].fb_pte_list_size); 802753a6d45SSherry Moore } 803753a6d45SSherry Moore MD5Update(&md5_ctx, (void *)nk->fi_pagetable_va, nk->fi_pagetable_size); 804753a6d45SSherry Moore MD5Update(&md5_ctx, (void *)nk->fi_new_mbi_va, nk->fi_mbi_size); 805753a6d45SSherry Moore 806753a6d45SSherry Moore MD5Final(md5_hash, &md5_ctx); 807753a6d45SSherry Moore } 808753a6d45SSherry Moore 809753a6d45SSherry Moore /* 810753a6d45SSherry Moore * Generate MD5 checksum of the given kernel. 811753a6d45SSherry Moore */ 812753a6d45SSherry Moore static void 813753a6d45SSherry Moore fastboot_cksum_generate(fastboot_info_t *nk) 814753a6d45SSherry Moore { 815753a6d45SSherry Moore int i; 816753a6d45SSherry Moore 817753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 818753a6d45SSherry Moore fastboot_cksum_file(nk->fi_files + i, nk->fi_md5_hash[i]); 819753a6d45SSherry Moore } 820753a6d45SSherry Moore fastboot_cksum_cdata(nk, nk->fi_md5_hash[i]); 821753a6d45SSherry Moore } 822753a6d45SSherry Moore 823753a6d45SSherry Moore /* 824753a6d45SSherry Moore * Calculate MD5 checksum of the given kernel and verify that 825753a6d45SSherry Moore * it matches with what was calculated before. 826753a6d45SSherry Moore */ 827753a6d45SSherry Moore int 828753a6d45SSherry Moore fastboot_cksum_verify(fastboot_info_t *nk) 829753a6d45SSherry Moore { 830753a6d45SSherry Moore int i; 831753a6d45SSherry Moore uchar_t md5_hash[MD5_DIGEST_LENGTH]; 832753a6d45SSherry Moore 833753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 834753a6d45SSherry Moore fastboot_cksum_file(nk->fi_files + i, md5_hash); 835753a6d45SSherry Moore if (bcmp(nk->fi_md5_hash[i], md5_hash, 836753a6d45SSherry Moore sizeof (nk->fi_md5_hash[i])) != 0) 837753a6d45SSherry Moore return (i + 1); 838753a6d45SSherry Moore } 839753a6d45SSherry Moore 840753a6d45SSherry Moore fastboot_cksum_cdata(nk, md5_hash); 841753a6d45SSherry Moore if (bcmp(nk->fi_md5_hash[i], md5_hash, 842753a6d45SSherry Moore sizeof (nk->fi_md5_hash[i])) != 0) 843753a6d45SSherry Moore return (i + 1); 844753a6d45SSherry Moore 845753a6d45SSherry Moore return (0); 8466bc8bc6aSSherry Moore } 8476bc8bc6aSSherry Moore 8486bc8bc6aSSherry Moore /* 8496bc8bc6aSSherry Moore * This function performs the following tasks: 8506bc8bc6aSSherry Moore * - Read the sizes of the new kernel and boot archive. 8516bc8bc6aSSherry Moore * - Allocate memory for the new kernel and boot archive. 8526bc8bc6aSSherry Moore * - Allocate memory for page tables necessary for mapping the memory 8536bc8bc6aSSherry Moore * allocated for the files. 8546bc8bc6aSSherry Moore * - Read the new kernel and boot archive into memory. 8556bc8bc6aSSherry Moore * - Map in the fast reboot switcher. 8566bc8bc6aSSherry Moore * - Load the fast reboot switcher to FASTBOOT_SWTCH_PA. 8576bc8bc6aSSherry Moore * - Build the new multiboot_info structure 8586bc8bc6aSSherry Moore * - Build page tables for the low 1G of physical memory. 8596bc8bc6aSSherry Moore * - Mark the data structure as valid if all steps have succeeded. 8606bc8bc6aSSherry Moore */ 8616bc8bc6aSSherry Moore void 862753a6d45SSherry Moore fastboot_load_kernel(char *mdep) 8636bc8bc6aSSherry Moore { 8646bc8bc6aSSherry Moore void *buf = NULL; 8656bc8bc6aSSherry Moore int i; 8666bc8bc6aSSherry Moore fastboot_file_t *fb; 8676bc8bc6aSSherry Moore uint32_t dboot_start_offset; 8686bc8bc6aSSherry Moore char kern_bootpath[OBP_MAXPATHLEN]; 8696bc8bc6aSSherry Moore extern uintptr_t postbootkernelbase; 870753a6d45SSherry Moore uintptr_t saved_kernelbase; 8716bc8bc6aSSherry Moore int bootpath_len = 0; 8726bc8bc6aSSherry Moore int is_failsafe = 0; 8736bc8bc6aSSherry Moore int is_retry = 0; 8746bc8bc6aSSherry Moore uint64_t end_addr; 8756bc8bc6aSSherry Moore 876*c90a5fbeSSherry Moore if (!fastreboot_capable) 877*c90a5fbeSSherry Moore return; 8786bc8bc6aSSherry Moore 879753a6d45SSherry Moore if (newkernel.fi_valid) 880753a6d45SSherry Moore fastboot_free_newkernel(&newkernel); 881753a6d45SSherry Moore 882753a6d45SSherry Moore saved_kernelbase = postbootkernelbase; 883753a6d45SSherry Moore 8846bc8bc6aSSherry Moore postbootkernelbase = 0; 8856bc8bc6aSSherry Moore 8866bc8bc6aSSherry Moore /* 8876bc8bc6aSSherry Moore * Initialize various HAT related fields in the data structure 8886bc8bc6aSSherry Moore */ 8896bc8bc6aSSherry Moore fastboot_init_fields(&newkernel); 8906bc8bc6aSSherry Moore 8916bc8bc6aSSherry Moore bzero(kern_bootpath, OBP_MAXPATHLEN); 8926bc8bc6aSSherry Moore 8936bc8bc6aSSherry Moore /* 8946bc8bc6aSSherry Moore * Process the boot argument 8956bc8bc6aSSherry Moore */ 896753a6d45SSherry Moore bzero(fastboot_args, OBP_MAXPATHLEN); 897753a6d45SSherry Moore fastboot_parse_mdep(mdep, kern_bootpath, &bootpath_len, fastboot_args); 89819397407SSherry Moore 89919397407SSherry Moore /* 90019397407SSherry Moore * Make sure we get the null character 90119397407SSherry Moore */ 90219397407SSherry Moore bcopy(kern_bootpath, fastboot_filename[FASTBOOT_NAME_UNIX], 90319397407SSherry Moore bootpath_len); 90419397407SSherry Moore bcopy(kern_bootfile, 90519397407SSherry Moore &fastboot_filename[FASTBOOT_NAME_UNIX][bootpath_len], 90619397407SSherry Moore strlen(kern_bootfile) + 1); 90719397407SSherry Moore 90819397407SSherry Moore bcopy(kern_bootpath, fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE], 90919397407SSherry Moore bootpath_len); 91019397407SSherry Moore 911753a6d45SSherry Moore if (bcmp(kern_bootfile, FAILSAFE_BOOTFILE32, 912753a6d45SSherry Moore (sizeof (FAILSAFE_BOOTFILE32) - 1)) == 0 || 913753a6d45SSherry Moore bcmp(kern_bootfile, FAILSAFE_BOOTFILE64, 914753a6d45SSherry Moore (sizeof (FAILSAFE_BOOTFILE64) - 1)) == 0) { 91519397407SSherry Moore is_failsafe = 1; 91619397407SSherry Moore } 91719397407SSherry Moore 9186bc8bc6aSSherry Moore load_kernel_retry: 91919397407SSherry Moore /* 92019397407SSherry Moore * Read in unix and boot_archive 92119397407SSherry Moore */ 9226bc8bc6aSSherry Moore end_addr = DBOOT_ENTRY_ADDRESS; 92319397407SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 9246bc8bc6aSSherry Moore struct _buf *file; 9256bc8bc6aSSherry Moore uintptr_t va; 92619397407SSherry Moore uint64_t fsize; 92719397407SSherry Moore size_t fsize_roundup, pt_size; 92819397407SSherry Moore int page_index; 92919397407SSherry Moore uintptr_t offset; 93019397407SSherry Moore ddi_dma_attr_t dma_attr = fastboot_dma_attr; 93119397407SSherry Moore 9326bc8bc6aSSherry Moore 93319397407SSherry Moore dprintf("fastboot_filename[%d] = %s\n", 93419397407SSherry Moore i, fastboot_filename[i]); 93519397407SSherry Moore 93619397407SSherry Moore if ((file = kobj_open_file(fastboot_filename[i])) == 93719397407SSherry Moore (struct _buf *)-1) { 93819397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Couldn't open %s", 93919397407SSherry Moore fastboot_filename[i]); 94019397407SSherry Moore goto err_out; 94119397407SSherry Moore } 94219397407SSherry Moore 94319397407SSherry Moore if (kobj_get_filesize(file, &fsize) != 0) { 94419397407SSherry Moore cmn_err(CE_WARN, 94519397407SSherry Moore "Fastboot: Couldn't get filesize for %s", 94619397407SSherry Moore fastboot_filename[i]); 94719397407SSherry Moore goto err_out; 94819397407SSherry Moore } 94919397407SSherry Moore 9506bc8bc6aSSherry Moore fsize_roundup = P2ROUNDUP_TYPED(fsize, PAGESIZE, size_t); 9516bc8bc6aSSherry Moore 9526bc8bc6aSSherry Moore /* 9536bc8bc6aSSherry Moore * Where the files end in physical memory after being 9546bc8bc6aSSherry Moore * relocated by the fast boot switcher. 9556bc8bc6aSSherry Moore */ 9566bc8bc6aSSherry Moore end_addr += fsize_roundup; 9576bc8bc6aSSherry Moore if (end_addr > fastboot_below_1G_dma_attr.dma_attr_addr_hi) { 9586bc8bc6aSSherry Moore cmn_err(CE_WARN, "Fastboot: boot archive is too big"); 9596bc8bc6aSSherry Moore goto err_out; 96019397407SSherry Moore } 96119397407SSherry Moore 9626bc8bc6aSSherry Moore /* 9636bc8bc6aSSherry Moore * Adjust dma_attr_addr_lo so that the new kernel and boot 9646bc8bc6aSSherry Moore * archive will not be overridden during relocation. 9656bc8bc6aSSherry Moore */ 9666bc8bc6aSSherry Moore if (end_addr > fastboot_dma_attr.dma_attr_addr_lo || 9676bc8bc6aSSherry Moore end_addr > fastboot_below_1G_dma_attr.dma_attr_addr_lo) { 9686bc8bc6aSSherry Moore 9696bc8bc6aSSherry Moore if (is_retry) { 9706bc8bc6aSSherry Moore /* 9716bc8bc6aSSherry Moore * If we have already tried and didn't succeed, 9726bc8bc6aSSherry Moore * just give up. 9736bc8bc6aSSherry Moore */ 9746bc8bc6aSSherry Moore cmn_err(CE_WARN, 9756bc8bc6aSSherry Moore "Fastboot: boot archive is too big"); 9766bc8bc6aSSherry Moore goto err_out; 9776bc8bc6aSSherry Moore } else { 9786bc8bc6aSSherry Moore /* Set the flag so we don't keep retrying */ 9796bc8bc6aSSherry Moore is_retry++; 9806bc8bc6aSSherry Moore 9816bc8bc6aSSherry Moore /* Adjust dma_attr_addr_lo */ 9826bc8bc6aSSherry Moore fastboot_dma_attr.dma_attr_addr_lo = end_addr; 9836bc8bc6aSSherry Moore fastboot_below_1G_dma_attr.dma_attr_addr_lo = 9846bc8bc6aSSherry Moore end_addr; 9856bc8bc6aSSherry Moore 9866bc8bc6aSSherry Moore /* 9876bc8bc6aSSherry Moore * Free the memory we have already allocated 9886bc8bc6aSSherry Moore * whose physical addresses might not fit 9896bc8bc6aSSherry Moore * the new lo and hi constraints. 9906bc8bc6aSSherry Moore */ 991753a6d45SSherry Moore fastboot_free_mem(&newkernel, end_addr); 9926bc8bc6aSSherry Moore goto load_kernel_retry; 9936bc8bc6aSSherry Moore } 9946bc8bc6aSSherry Moore } 9956bc8bc6aSSherry Moore 9966bc8bc6aSSherry Moore 99719397407SSherry Moore if (!fastboot_contig) 99819397407SSherry Moore dma_attr.dma_attr_sgllen = (fsize / PAGESIZE) + 99919397407SSherry Moore (((fsize % PAGESIZE) == 0) ? 0 : 1); 100019397407SSherry Moore 100119397407SSherry Moore if ((buf = contig_alloc(fsize, &dma_attr, PAGESIZE, 0)) 100219397407SSherry Moore == NULL) { 10036bc8bc6aSSherry Moore cmn_err(CE_WARN, fastboot_enomem_msg, fsize, "64G"); 100419397407SSherry Moore goto err_out; 100519397407SSherry Moore } 100619397407SSherry Moore 100719397407SSherry Moore va = P2ROUNDUP_TYPED((uintptr_t)buf, PAGESIZE, uintptr_t); 100819397407SSherry Moore 100919397407SSherry Moore if (kobj_read_file(file, (char *)va, fsize, 0) < 0) { 101019397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Couldn't read %s", 101119397407SSherry Moore fastboot_filename[i]); 101219397407SSherry Moore goto err_out; 101319397407SSherry Moore } 101419397407SSherry Moore 101519397407SSherry Moore fb = &newkernel.fi_files[i]; 101619397407SSherry Moore fb->fb_va = va; 101719397407SSherry Moore fb->fb_size = fsize; 101819397407SSherry Moore fb->fb_sectcnt = 0; 101919397407SSherry Moore 1020753a6d45SSherry Moore pt_size = FASTBOOT_PTE_LIST_SIZE(fsize_roundup); 102119397407SSherry Moore 1022753a6d45SSherry Moore /* 1023753a6d45SSherry Moore * If we have reserved memory but it not enough, free it. 1024753a6d45SSherry Moore */ 1025753a6d45SSherry Moore if (fb->fb_pte_list_size && fb->fb_pte_list_size < pt_size) { 1026753a6d45SSherry Moore contig_free((void *)fb->fb_pte_list_va, 1027753a6d45SSherry Moore fb->fb_pte_list_size); 1028753a6d45SSherry Moore fb->fb_pte_list_size = 0; 1029753a6d45SSherry Moore } 1030753a6d45SSherry Moore 1031753a6d45SSherry Moore if (fb->fb_pte_list_size == 0) { 103219397407SSherry Moore if ((fb->fb_pte_list_va = 103319397407SSherry Moore (x86pte_t *)contig_alloc(pt_size, 1034753a6d45SSherry Moore &fastboot_below_1G_dma_attr, PAGESIZE, 0)) 1035753a6d45SSherry Moore == NULL) { 103619397407SSherry Moore cmn_err(CE_WARN, fastboot_enomem_msg, 103719397407SSherry Moore (uint64_t)pt_size, "1G"); 103819397407SSherry Moore goto err_out; 103919397407SSherry Moore } 1040753a6d45SSherry Moore /* 1041753a6d45SSherry Moore * fb_pte_list_size must be set after the allocation 1042753a6d45SSherry Moore * succeeds as it's used to determine how much memory to 1043753a6d45SSherry Moore * free. 1044753a6d45SSherry Moore */ 1045753a6d45SSherry Moore fb->fb_pte_list_size = pt_size; 1046753a6d45SSherry Moore } 104719397407SSherry Moore 1048753a6d45SSherry Moore bzero((void *)(fb->fb_pte_list_va), fb->fb_pte_list_size); 104919397407SSherry Moore 105019397407SSherry Moore fb->fb_pte_list_pa = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat, 105119397407SSherry Moore (caddr_t)fb->fb_pte_list_va)); 105219397407SSherry Moore 105319397407SSherry Moore for (page_index = 0, offset = 0; offset < fb->fb_size; 105419397407SSherry Moore offset += PAGESIZE) { 105519397407SSherry Moore uint64_t paddr; 105619397407SSherry Moore 105719397407SSherry Moore paddr = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat, 105819397407SSherry Moore (caddr_t)fb->fb_va + offset)); 105919397407SSherry Moore 106019397407SSherry Moore ASSERT(paddr >= fastboot_dma_attr.dma_attr_addr_lo); 106119397407SSherry Moore 106219397407SSherry Moore /* 106319397407SSherry Moore * Include the pte_bits so we don't have to make 106419397407SSherry Moore * it in assembly. 106519397407SSherry Moore */ 106619397407SSherry Moore fb->fb_pte_list_va[page_index++] = (x86pte_t) 106719397407SSherry Moore (paddr | pte_bits); 106819397407SSherry Moore } 106919397407SSherry Moore 107019397407SSherry Moore fb->fb_pte_list_va[page_index] = FASTBOOT_TERMINATE; 107119397407SSherry Moore 107219397407SSherry Moore if (i == FASTBOOT_UNIX) { 10736bc8bc6aSSherry Moore Ehdr *ehdr = (Ehdr *)va; 10746bc8bc6aSSherry Moore int j; 107519397407SSherry Moore 107619397407SSherry Moore /* 107719397407SSherry Moore * Sanity checks: 107819397407SSherry Moore */ 107919397407SSherry Moore for (j = 0; j < SELFMAG; j++) { 108019397407SSherry Moore if (ehdr->e_ident[j] != ELFMAG[j]) { 108119397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Bad ELF " 108219397407SSherry Moore "signature"); 108319397407SSherry Moore goto err_out; 108419397407SSherry Moore } 108519397407SSherry Moore } 108619397407SSherry Moore 108719397407SSherry Moore if (ehdr->e_ident[EI_CLASS] == ELFCLASS32 && 108819397407SSherry Moore ehdr->e_ident[EI_DATA] == ELFDATA2LSB && 108919397407SSherry Moore ehdr->e_machine == EM_386) { 109019397407SSherry Moore 1091877400d3SKonstantin Ananyev fb->fb_sectcnt = sizeof (fb->fb_sections) / 1092877400d3SKonstantin Ananyev sizeof (fb->fb_sections[0]); 1093877400d3SKonstantin Ananyev 109419397407SSherry Moore if (fastboot_elf32_find_loadables((void *)va, 109519397407SSherry Moore fsize, &fb->fb_sections[0], 109619397407SSherry Moore &fb->fb_sectcnt, &dboot_start_offset) < 0) { 109719397407SSherry Moore cmn_err(CE_WARN, "Fastboot: ELF32 " 109819397407SSherry Moore "program section failure"); 109919397407SSherry Moore goto err_out; 110019397407SSherry Moore } 110119397407SSherry Moore 110219397407SSherry Moore if (fb->fb_sectcnt == 0) { 110319397407SSherry Moore cmn_err(CE_WARN, "Fastboot: No ELF32 " 110419397407SSherry Moore "program sections found"); 110519397407SSherry Moore goto err_out; 110619397407SSherry Moore } 110719397407SSherry Moore 110819397407SSherry Moore if (is_failsafe) { 110919397407SSherry Moore /* Failsafe boot_archive */ 1110753a6d45SSherry Moore bcopy(BOOTARCHIVE32_FAILSAFE, 111119397407SSherry Moore &fastboot_filename 111219397407SSherry Moore [FASTBOOT_NAME_BOOTARCHIVE] 111319397407SSherry Moore [bootpath_len], 1114753a6d45SSherry Moore sizeof (BOOTARCHIVE32_FAILSAFE)); 111519397407SSherry Moore } else { 111619397407SSherry Moore bcopy(BOOTARCHIVE32, 111719397407SSherry Moore &fastboot_filename 111819397407SSherry Moore [FASTBOOT_NAME_BOOTARCHIVE] 111919397407SSherry Moore [bootpath_len], 112019397407SSherry Moore sizeof (BOOTARCHIVE32)); 112119397407SSherry Moore } 112219397407SSherry Moore 112319397407SSherry Moore } else if (ehdr->e_ident[EI_CLASS] == ELFCLASS64 && 112419397407SSherry Moore ehdr->e_ident[EI_DATA] == ELFDATA2LSB && 112519397407SSherry Moore ehdr->e_machine == EM_AMD64) { 112619397407SSherry Moore 112719397407SSherry Moore if (fastboot_elf64_find_dboot_load_offset( 112819397407SSherry Moore (void *)va, fsize, &dboot_start_offset) 112919397407SSherry Moore != 0) { 113019397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Couldn't " 113119397407SSherry Moore "find ELF64 dboot entry offset"); 113219397407SSherry Moore goto err_out; 113319397407SSherry Moore } 113419397407SSherry Moore 113519397407SSherry Moore if ((x86_feature & X86_64) == 0 || 1136877400d3SKonstantin Ananyev (x86_feature & X86_PAE) == 0) { 113719397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Cannot " 113819397407SSherry Moore "reboot to %s: " 113919397407SSherry Moore "not a 64-bit capable system", 114019397407SSherry Moore kern_bootfile); 114119397407SSherry Moore goto err_out; 114219397407SSherry Moore } 114319397407SSherry Moore 1144753a6d45SSherry Moore if (is_failsafe) { 1145753a6d45SSherry Moore /* Failsafe boot_archive */ 1146753a6d45SSherry Moore bcopy(BOOTARCHIVE64_FAILSAFE, 1147753a6d45SSherry Moore &fastboot_filename 1148753a6d45SSherry Moore [FASTBOOT_NAME_BOOTARCHIVE] 1149753a6d45SSherry Moore [bootpath_len], 1150753a6d45SSherry Moore sizeof (BOOTARCHIVE64_FAILSAFE)); 1151753a6d45SSherry Moore } else { 115219397407SSherry Moore bcopy(BOOTARCHIVE64, 115319397407SSherry Moore &fastboot_filename 1154753a6d45SSherry Moore [FASTBOOT_NAME_BOOTARCHIVE] 1155753a6d45SSherry Moore [bootpath_len], 115619397407SSherry Moore sizeof (BOOTARCHIVE64)); 1157753a6d45SSherry Moore } 115819397407SSherry Moore } else { 115919397407SSherry Moore cmn_err(CE_WARN, "Fastboot: Unknown ELF type"); 116019397407SSherry Moore goto err_out; 116119397407SSherry Moore } 116219397407SSherry Moore 116319397407SSherry Moore fb->fb_dest_pa = DBOOT_ENTRY_ADDRESS - 116419397407SSherry Moore dboot_start_offset; 116519397407SSherry Moore 116619397407SSherry Moore fb->fb_next_pa = DBOOT_ENTRY_ADDRESS + fsize_roundup; 116719397407SSherry Moore } else { 116819397407SSherry Moore fb->fb_dest_pa = newkernel.fi_files[i - 1].fb_next_pa; 116919397407SSherry Moore fb->fb_next_pa = fb->fb_dest_pa + fsize_roundup; 117019397407SSherry Moore } 117119397407SSherry Moore 117219397407SSherry Moore kobj_close_file(file); 117319397407SSherry Moore 11746bc8bc6aSSherry Moore } 11756bc8bc6aSSherry Moore 117619397407SSherry Moore /* 117719397407SSherry Moore * Add the function that will switch us to 32-bit protected mode 117819397407SSherry Moore */ 117919397407SSherry Moore fb = &newkernel.fi_files[FASTBOOT_SWTCH]; 118019397407SSherry Moore fb->fb_va = fb->fb_dest_pa = FASTBOOT_SWTCH_PA; 1181877400d3SKonstantin Ananyev fb->fb_size = MMU_PAGESIZE; 118219397407SSherry Moore 1183753a6d45SSherry Moore hat_devload(kas.a_hat, (caddr_t)fb->fb_va, 1184753a6d45SSherry Moore MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa), 1185753a6d45SSherry Moore PROT_READ | PROT_WRITE | PROT_EXEC, 1186753a6d45SSherry Moore HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK); 118719397407SSherry Moore 118819397407SSherry Moore /* 118919397407SSherry Moore * Build the new multiboot_info structure 119019397407SSherry Moore */ 1191753a6d45SSherry Moore if (fastboot_build_mbi(fastboot_args, &newkernel) != 0) { 119219397407SSherry Moore goto err_out; 119319397407SSherry Moore } 119419397407SSherry Moore 119519397407SSherry Moore /* 119619397407SSherry Moore * Build page table for low 1G physical memory. Use big pages. 1197877400d3SKonstantin Ananyev * Allocate 4 (5 for amd64) pages for the page tables. 1198877400d3SKonstantin Ananyev * 1 page for PML4 (amd64) 119919397407SSherry Moore * 1 page for Page-Directory-Pointer Table 1200877400d3SKonstantin Ananyev * 2 pages for Page Directory 120119397407SSherry Moore * 1 page for Page Table. 120219397407SSherry Moore * The page table entry will be rewritten to map the physical 120319397407SSherry Moore * address as we do the copying. 120419397407SSherry Moore */ 120519397407SSherry Moore if (newkernel.fi_has_pae) { 1206877400d3SKonstantin Ananyev #ifdef __amd64 1207877400d3SKonstantin Ananyev size_t size = MMU_PAGESIZE * 5; 1208877400d3SKonstantin Ananyev #else 120919397407SSherry Moore size_t size = MMU_PAGESIZE * 4; 1210877400d3SKonstantin Ananyev #endif /* __amd64 */ 121119397407SSherry Moore 1212753a6d45SSherry Moore if (newkernel.fi_pagetable_size && newkernel.fi_pagetable_size 1213753a6d45SSherry Moore < size) { 1214753a6d45SSherry Moore contig_free((void *)newkernel.fi_pagetable_va, 1215753a6d45SSherry Moore newkernel.fi_pagetable_size); 1216753a6d45SSherry Moore newkernel.fi_pagetable_size = 0; 1217753a6d45SSherry Moore } 1218753a6d45SSherry Moore 1219753a6d45SSherry Moore if (newkernel.fi_pagetable_size == 0) { 122019397407SSherry Moore if ((newkernel.fi_pagetable_va = (uintptr_t) 122119397407SSherry Moore contig_alloc(size, &fastboot_below_1G_dma_attr, 1222877400d3SKonstantin Ananyev MMU_PAGESIZE, 0)) == NULL) { 122319397407SSherry Moore cmn_err(CE_WARN, fastboot_enomem_msg, 122419397407SSherry Moore (uint64_t)size, "1G"); 122519397407SSherry Moore goto err_out; 122619397407SSherry Moore } 1227753a6d45SSherry Moore /* 1228753a6d45SSherry Moore * fi_pagetable_size must be set after the allocation 1229753a6d45SSherry Moore * succeeds as it's used to determine how much memory to 1230753a6d45SSherry Moore * free. 1231753a6d45SSherry Moore */ 1232753a6d45SSherry Moore newkernel.fi_pagetable_size = size; 1233753a6d45SSherry Moore } 123419397407SSherry Moore 123519397407SSherry Moore bzero((void *)(newkernel.fi_pagetable_va), size); 123619397407SSherry Moore 123719397407SSherry Moore newkernel.fi_pagetable_pa = 123819397407SSherry Moore mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat, 123919397407SSherry Moore (caddr_t)newkernel.fi_pagetable_va)); 124019397407SSherry Moore 124119397407SSherry Moore newkernel.fi_last_table_pa = newkernel.fi_pagetable_pa + 1242877400d3SKonstantin Ananyev size - MMU_PAGESIZE; 124319397407SSherry Moore 124419397407SSherry Moore newkernel.fi_next_table_va = newkernel.fi_pagetable_va + 124519397407SSherry Moore MMU_PAGESIZE; 124619397407SSherry Moore newkernel.fi_next_table_pa = newkernel.fi_pagetable_pa + 124719397407SSherry Moore MMU_PAGESIZE; 124819397407SSherry Moore 124919397407SSherry Moore fastboot_build_pagetables(&newkernel); 125019397407SSherry Moore } 125119397407SSherry Moore 125219397407SSherry Moore 1253753a6d45SSherry Moore /* Generate MD5 checksums */ 1254753a6d45SSherry Moore fastboot_cksum_generate(&newkernel); 1255753a6d45SSherry Moore 125619397407SSherry Moore /* Mark it as valid */ 125719397407SSherry Moore newkernel.fi_valid = 1; 125819397407SSherry Moore newkernel.fi_magic = FASTBOOT_MAGIC; 125919397407SSherry Moore 1260753a6d45SSherry Moore postbootkernelbase = saved_kernelbase; 126119397407SSherry Moore return; 126219397407SSherry Moore 126319397407SSherry Moore err_out: 1264753a6d45SSherry Moore postbootkernelbase = saved_kernelbase; 126519397407SSherry Moore newkernel.fi_valid = 0; 1266753a6d45SSherry Moore fastboot_free_newkernel(&newkernel); 1267753a6d45SSherry Moore } 1268753a6d45SSherry Moore 1269753a6d45SSherry Moore 1270753a6d45SSherry Moore /* ARGSUSED */ 1271753a6d45SSherry Moore static int 1272753a6d45SSherry Moore fastboot_xc_func(fastboot_info_t *nk, xc_arg_t unused2, xc_arg_t unused3) 1273753a6d45SSherry Moore { 1274753a6d45SSherry Moore void (*fastboot_func)(fastboot_info_t *); 1275753a6d45SSherry Moore fastboot_file_t *fb = &nk->fi_files[FASTBOOT_SWTCH]; 1276753a6d45SSherry Moore fastboot_func = (void (*)())(fb->fb_va); 1277753a6d45SSherry Moore kthread_t *t_intr = curthread->t_intr; 1278753a6d45SSherry Moore 1279753a6d45SSherry Moore if (&kas != curproc->p_as) { 1280753a6d45SSherry Moore hat_devload(curproc->p_as->a_hat, (caddr_t)fb->fb_va, 1281753a6d45SSherry Moore MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa), 1282753a6d45SSherry Moore PROT_READ | PROT_WRITE | PROT_EXEC, 1283753a6d45SSherry Moore HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK); 1284753a6d45SSherry Moore } 1285753a6d45SSherry Moore 1286753a6d45SSherry Moore /* 1287753a6d45SSherry Moore * If we have pinned a thread, make sure the address is mapped 1288753a6d45SSherry Moore * in the address space of the pinned thread. 1289753a6d45SSherry Moore */ 1290753a6d45SSherry Moore if (t_intr && t_intr->t_procp->p_as->a_hat != curproc->p_as->a_hat && 1291753a6d45SSherry Moore t_intr->t_procp->p_as != &kas) 1292753a6d45SSherry Moore hat_devload(t_intr->t_procp->p_as->a_hat, (caddr_t)fb->fb_va, 1293753a6d45SSherry Moore MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa), 1294753a6d45SSherry Moore PROT_READ | PROT_WRITE | PROT_EXEC, 1295753a6d45SSherry Moore HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK); 1296753a6d45SSherry Moore 1297753a6d45SSherry Moore (*psm_shutdownf)(A_SHUTDOWN, AD_FASTREBOOT); 1298753a6d45SSherry Moore (*fastboot_func)(nk); 1299753a6d45SSherry Moore 1300753a6d45SSherry Moore /*NOTREACHED*/ 1301753a6d45SSherry Moore return (0); 130219397407SSherry Moore } 130319397407SSherry Moore 13046bc8bc6aSSherry Moore /* 13056bc8bc6aSSherry Moore * Jump to the fast reboot switcher. This function never returns. 13066bc8bc6aSSherry Moore */ 130719397407SSherry Moore void 130819397407SSherry Moore fast_reboot() 130919397407SSherry Moore { 1310753a6d45SSherry Moore processorid_t bootcpuid = 0; 1311753a6d45SSherry Moore extern uintptr_t postbootkernelbase; 1312753a6d45SSherry Moore extern char fb_swtch_image[]; 1313753a6d45SSherry Moore fastboot_file_t *fb; 1314753a6d45SSherry Moore int i; 131519397407SSherry Moore 1316753a6d45SSherry Moore postbootkernelbase = 0; 1317753a6d45SSherry Moore 1318753a6d45SSherry Moore fb = &newkernel.fi_files[FASTBOOT_SWTCH]; 1319753a6d45SSherry Moore 1320753a6d45SSherry Moore /* 1321753a6d45SSherry Moore * Map the address into both the current proc's address 1322753a6d45SSherry Moore * space and the kernel's address space in case the panic 1323753a6d45SSherry Moore * is forced by kmdb. 1324753a6d45SSherry Moore */ 1325753a6d45SSherry Moore if (&kas != curproc->p_as) { 1326753a6d45SSherry Moore hat_devload(curproc->p_as->a_hat, (caddr_t)fb->fb_va, 1327753a6d45SSherry Moore MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa), 1328753a6d45SSherry Moore PROT_READ | PROT_WRITE | PROT_EXEC, 1329753a6d45SSherry Moore HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK); 1330753a6d45SSherry Moore } 1331753a6d45SSherry Moore 1332753a6d45SSherry Moore bcopy((void *)fb_swtch_image, (void *)fb->fb_va, fb->fb_size); 1333753a6d45SSherry Moore 1334753a6d45SSherry Moore 1335753a6d45SSherry Moore /* 1336753a6d45SSherry Moore * Set fb_va to fake_va 1337753a6d45SSherry Moore */ 1338753a6d45SSherry Moore for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) { 1339753a6d45SSherry Moore newkernel.fi_files[i].fb_va = fake_va; 1340753a6d45SSherry Moore 1341753a6d45SSherry Moore } 1342753a6d45SSherry Moore 1343753a6d45SSherry Moore if (panicstr && CPU->cpu_id != bootcpuid && 1344753a6d45SSherry Moore CPU_ACTIVE(cpu_get(bootcpuid))) { 1345f34a7178SJoe Bonasera extern void panic_idle(void); 1346753a6d45SSherry Moore cpuset_t cpuset; 1347753a6d45SSherry Moore 1348753a6d45SSherry Moore CPUSET_ZERO(cpuset); 1349753a6d45SSherry Moore CPUSET_ADD(cpuset, bootcpuid); 1350f34a7178SJoe Bonasera xc_priority((xc_arg_t)&newkernel, 0, 0, CPUSET2BV(cpuset), 1351753a6d45SSherry Moore (xc_func_t)fastboot_xc_func); 1352753a6d45SSherry Moore 1353f34a7178SJoe Bonasera panic_idle(); 1354753a6d45SSherry Moore } else 1355753a6d45SSherry Moore (void) fastboot_xc_func(&newkernel, 0, 0); 1356753a6d45SSherry Moore } 1357753a6d45SSherry Moore 1358753a6d45SSherry Moore 1359753a6d45SSherry Moore /* 1360753a6d45SSherry Moore * Get boot property value for fastreboot_onpanic. 1361753a6d45SSherry Moore * 1362753a6d45SSherry Moore * NOTE: If fastreboot_onpanic is set to non-zero in /etc/system, 1363753a6d45SSherry Moore * new setting passed in via "-B fastreboot_onpanic" is ignored. 1364753a6d45SSherry Moore * This order of precedence is to enable developers debugging panics 1365753a6d45SSherry Moore * that occur early in boot to utilize Fast Reboot on panic. 1366753a6d45SSherry Moore */ 1367753a6d45SSherry Moore static void 1368753a6d45SSherry Moore fastboot_get_bootprop(void) 1369753a6d45SSherry Moore { 1370753a6d45SSherry Moore int val = 0xaa, len, ret; 1371753a6d45SSherry Moore dev_info_t *devi; 1372753a6d45SSherry Moore char *propstr = NULL; 1373753a6d45SSherry Moore 1374753a6d45SSherry Moore devi = ddi_root_node(); 1375753a6d45SSherry Moore 1376753a6d45SSherry Moore ret = ddi_prop_lookup_string(DDI_DEV_T_ANY, devi, DDI_PROP_DONTPASS, 1377753a6d45SSherry Moore FASTREBOOT_ONPANIC, &propstr); 1378753a6d45SSherry Moore 1379753a6d45SSherry Moore if (ret == DDI_PROP_SUCCESS) { 1380753a6d45SSherry Moore if (FASTREBOOT_ONPANIC_NOTSET(propstr)) 1381753a6d45SSherry Moore val = 0; 1382753a6d45SSherry Moore else if (FASTREBOOT_ONPANIC_ISSET(propstr)) 1383753a6d45SSherry Moore val = UA_FASTREBOOT_ONPANIC; 1384753a6d45SSherry Moore 1385753a6d45SSherry Moore /* 1386753a6d45SSherry Moore * Only set fastreboot_onpanic to the value passed in 1387753a6d45SSherry Moore * if it's not already set to non-zero, and the value 1388753a6d45SSherry Moore * has indeed been passed in via command line. 1389753a6d45SSherry Moore */ 1390753a6d45SSherry Moore if (!fastreboot_onpanic && val != 0xaa) 1391753a6d45SSherry Moore fastreboot_onpanic = val; 1392753a6d45SSherry Moore ddi_prop_free(propstr); 1393753a6d45SSherry Moore } else if (ret != DDI_PROP_NOT_FOUND && ret != DDI_PROP_UNDEFINED) { 1394753a6d45SSherry Moore cmn_err(CE_WARN, "%s value is invalid, will be ignored", 1395753a6d45SSherry Moore FASTREBOOT_ONPANIC); 1396753a6d45SSherry Moore } 1397753a6d45SSherry Moore 1398753a6d45SSherry Moore len = sizeof (fastreboot_onpanic_cmdline); 1399753a6d45SSherry Moore ret = ddi_getlongprop_buf(DDI_DEV_T_ANY, devi, DDI_PROP_DONTPASS, 1400753a6d45SSherry Moore FASTREBOOT_ONPANIC_CMDLINE, fastreboot_onpanic_cmdline, &len); 1401753a6d45SSherry Moore 1402753a6d45SSherry Moore if (ret == DDI_PROP_BUF_TOO_SMALL) 1403753a6d45SSherry Moore cmn_err(CE_WARN, "%s value is too long, will be ignored", 1404753a6d45SSherry Moore FASTREBOOT_ONPANIC_CMDLINE); 1405753a6d45SSherry Moore } 1406753a6d45SSherry Moore 1407753a6d45SSherry Moore /* 1408753a6d45SSherry Moore * This function is called by main() to either load the backup kernel for panic 1409753a6d45SSherry Moore * fast reboot, or to reserve low physical memory for fast reboot. 1410753a6d45SSherry Moore */ 1411753a6d45SSherry Moore void 1412753a6d45SSherry Moore fastboot_post_startup() 1413753a6d45SSherry Moore { 1414753a6d45SSherry Moore if (!fastreboot_capable) 1415753a6d45SSherry Moore return; 1416753a6d45SSherry Moore 1417*c90a5fbeSSherry Moore mutex_enter(&fastreboot_config_mutex); 1418*c90a5fbeSSherry Moore 1419753a6d45SSherry Moore fastboot_get_bootprop(); 1420753a6d45SSherry Moore 1421753a6d45SSherry Moore if (fastreboot_onpanic) 1422753a6d45SSherry Moore fastboot_load_kernel(fastreboot_onpanic_cmdline); 1423753a6d45SSherry Moore else if (reserve_mem_enabled) 1424753a6d45SSherry Moore fastboot_reserve_mem(&newkernel); 1425*c90a5fbeSSherry Moore 1426*c90a5fbeSSherry Moore mutex_exit(&fastreboot_config_mutex); 1427753a6d45SSherry Moore } 1428753a6d45SSherry Moore 1429753a6d45SSherry Moore /* 1430753a6d45SSherry Moore * Update boot configuration settings. 1431753a6d45SSherry Moore * If the new fastreboot_onpanic setting is false, and a kernel has 1432753a6d45SSherry Moore * been preloaded, free the memory; 1433753a6d45SSherry Moore * if the new fastreboot_onpanic setting is true and newkernel is 1434753a6d45SSherry Moore * not valid, load the new kernel. 1435753a6d45SSherry Moore */ 1436753a6d45SSherry Moore void 1437753a6d45SSherry Moore fastboot_update_config(const char *mdep) 1438753a6d45SSherry Moore { 1439753a6d45SSherry Moore uint8_t boot_config = (uint8_t)*mdep; 1440*c90a5fbeSSherry Moore int cur_fastreboot_onpanic; 1441753a6d45SSherry Moore 1442753a6d45SSherry Moore if (!fastreboot_capable) 1443753a6d45SSherry Moore return; 1444753a6d45SSherry Moore 1445*c90a5fbeSSherry Moore mutex_enter(&fastreboot_config_mutex); 1446*c90a5fbeSSherry Moore 1447*c90a5fbeSSherry Moore cur_fastreboot_onpanic = fastreboot_onpanic; 1448753a6d45SSherry Moore fastreboot_onpanic = boot_config & UA_FASTREBOOT_ONPANIC; 1449*c90a5fbeSSherry Moore 1450753a6d45SSherry Moore if (fastreboot_onpanic && (!cur_fastreboot_onpanic || 1451753a6d45SSherry Moore !newkernel.fi_valid)) 1452753a6d45SSherry Moore fastboot_load_kernel(fastreboot_onpanic_cmdline); 1453753a6d45SSherry Moore if (cur_fastreboot_onpanic && !fastreboot_onpanic) 1454753a6d45SSherry Moore fastboot_free_newkernel(&newkernel); 1455*c90a5fbeSSherry Moore 1456*c90a5fbeSSherry Moore mutex_exit(&fastreboot_config_mutex); 1457*c90a5fbeSSherry Moore } 1458*c90a5fbeSSherry Moore 1459*c90a5fbeSSherry Moore /* 1460*c90a5fbeSSherry Moore * This is the interface to be called by other kernel components to 1461*c90a5fbeSSherry Moore * disable fastreboot_onpanic. 1462*c90a5fbeSSherry Moore */ 1463*c90a5fbeSSherry Moore void 1464*c90a5fbeSSherry Moore fastreboot_disable() 1465*c90a5fbeSSherry Moore { 1466*c90a5fbeSSherry Moore uint8_t boot_config = (uint8_t)(~UA_FASTREBOOT_ONPANIC); 1467*c90a5fbeSSherry Moore fastboot_update_config((const char *)&boot_config); 1468*c90a5fbeSSherry Moore } 1469*c90a5fbeSSherry Moore 1470*c90a5fbeSSherry Moore /* 1471*c90a5fbeSSherry Moore * This is the interface to be called by fm_panic() in case FMA has diagnosed 1472*c90a5fbeSSherry Moore * a terminal machine check exception. It does not free up memory allocated 1473*c90a5fbeSSherry Moore * for the backup kernel. General disabling fastreboot_onpanic in a 1474*c90a5fbeSSherry Moore * non-panicking situation must go through fastboot_update_config(). 1475*c90a5fbeSSherry Moore */ 1476*c90a5fbeSSherry Moore void 1477*c90a5fbeSSherry Moore fastreboot_disable_highpil() 1478*c90a5fbeSSherry Moore { 1479*c90a5fbeSSherry Moore fastreboot_onpanic = 0; 1480*c90a5fbeSSherry Moore } 1481*c90a5fbeSSherry Moore 1482*c90a5fbeSSherry Moore 1483*c90a5fbeSSherry Moore /* 1484*c90a5fbeSSherry Moore * A simplified interface for uadmin to call to update the configuration 1485*c90a5fbeSSherry Moore * setting and load a new kernel if necessary. 1486*c90a5fbeSSherry Moore */ 1487*c90a5fbeSSherry Moore void 1488*c90a5fbeSSherry Moore fastboot_update_and_load(int fcn, char *mdep) 1489*c90a5fbeSSherry Moore { 1490*c90a5fbeSSherry Moore if (fcn != AD_FASTREBOOT) { 1491*c90a5fbeSSherry Moore /* 1492*c90a5fbeSSherry Moore * If user has explicitly requested reboot to prom, 1493*c90a5fbeSSherry Moore * or uadmin(1M) was invoked with other functions, 1494*c90a5fbeSSherry Moore * don't try to fast reboot after dumping. 1495*c90a5fbeSSherry Moore */ 1496*c90a5fbeSSherry Moore fastreboot_disable(); 1497*c90a5fbeSSherry Moore } 1498*c90a5fbeSSherry Moore 1499*c90a5fbeSSherry Moore mutex_enter(&fastreboot_config_mutex); 1500*c90a5fbeSSherry Moore 1501*c90a5fbeSSherry Moore if (fastreboot_onpanic) 1502*c90a5fbeSSherry Moore fastboot_load_kernel(mdep); 1503*c90a5fbeSSherry Moore 1504*c90a5fbeSSherry Moore mutex_exit(&fastreboot_config_mutex); 150519397407SSherry Moore } 1506