xref: /titanic_44/usr/src/uts/i86pc/os/fastboot.c (revision 67dbe2be0c0f1e2eb428b89088bb5667e8f0b9f6)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 
22 /*
23  * Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
24  * Use is subject to license terms.
25  */
26 
27 /*
28  * This file contains the functions for performing Fast Reboot -- a
29  * reboot which bypasses the firmware and bootloader, considerably
30  * reducing downtime.
31  *
32  * fastboot_load_kernel(): This function is invoked by mdpreboot() in the
33  * reboot path.  It loads the new kernel and boot archive into memory, builds
34  * the data structure containing sufficient information about the new
35  * kernel and boot archive to be passed to the fast reboot switcher
36  * (see fb_swtch_src.s for details).  When invoked the switcher relocates
37  * the new kernel and boot archive to physically contiguous low memory,
38  * similar to where the boot loader would have loaded them, and jumps to
39  * the new kernel.
40  *
41  * If fastreboot_onpanic is enabled, fastboot_load_kernel() is called
42  * by fastreboot_post_startup() to load the back up kernel in case of
43  * panic.
44  *
45  * The physical addresses of the memory allocated for the new kernel, boot
46  * archive and their page tables must be above where the boot archive ends
47  * after it has been relocated by the switcher, otherwise the new files
48  * and their page tables could be overridden during relocation.
49  *
50  * fast_reboot(): This function is invoked by mdboot() once it's determined
51  * that the system is capable of fast reboot.  It jumps to the fast reboot
52  * switcher with the data structure built by fastboot_load_kernel() as the
53  * argument.
54  */
55 
56 #include <sys/types.h>
57 #include <sys/param.h>
58 #include <sys/segments.h>
59 #include <sys/sysmacros.h>
60 #include <sys/vm.h>
61 
62 #include <sys/proc.h>
63 #include <sys/buf.h>
64 #include <sys/kmem.h>
65 
66 #include <sys/reboot.h>
67 #include <sys/uadmin.h>
68 
69 #include <sys/cred.h>
70 #include <sys/vnode.h>
71 #include <sys/file.h>
72 
73 #include <sys/cmn_err.h>
74 #include <sys/dumphdr.h>
75 #include <sys/bootconf.h>
76 #include <sys/ddidmareq.h>
77 #include <sys/varargs.h>
78 #include <sys/promif.h>
79 #include <sys/modctl.h>
80 
81 #include <vm/hat.h>
82 #include <vm/as.h>
83 #include <vm/page.h>
84 #include <vm/seg.h>
85 #include <vm/hat_i86.h>
86 #include <sys/vm_machparam.h>
87 #include <sys/archsystm.h>
88 #include <sys/machsystm.h>
89 #include <sys/mman.h>
90 #include <sys/x86_archext.h>
91 #include <sys/smp_impldefs.h>
92 #include <sys/spl.h>
93 
94 #include <sys/fastboot.h>
95 #include <sys/machelf.h>
96 #include <sys/kobj.h>
97 #include <sys/multiboot.h>
98 #include <sys/kobj_lex.h>
99 
100 /*
101  * Macro to determine how many pages are needed for PTEs to map a particular
102  * file.  Allocate one extra page table entry for terminating the list.
103  */
104 #define	FASTBOOT_PTE_LIST_SIZE(fsize)	\
105 	P2ROUNDUP((((fsize) >> PAGESHIFT) + 1) * sizeof (x86pte_t), PAGESIZE)
106 
107 /*
108  * Data structure containing necessary information for the fast reboot
109  * switcher to jump to the new kernel.
110  */
111 fastboot_info_t newkernel = { 0 };
112 char		fastboot_args[OBP_MAXPATHLEN];
113 
114 static char fastboot_filename[2][OBP_MAXPATHLEN] = { { 0 }, { 0 }};
115 static x86pte_t ptp_bits = PT_VALID | PT_REF | PT_USER | PT_WRITABLE;
116 static x86pte_t pte_bits =
117     PT_VALID | PT_REF | PT_MOD | PT_NOCONSIST | PT_WRITABLE;
118 static uint_t fastboot_shift_amt_pae[] = {12, 21, 30, 39};
119 
120 int fastboot_debug = 0;
121 int fastboot_contig = 0;
122 
123 /*
124  * Fake starting va for new kernel and boot archive.
125  */
126 static uintptr_t fake_va = FASTBOOT_FAKE_VA;
127 
128 /*
129  * Reserve memory below PA 1G in preparation of fast reboot.
130  *
131  * This variable is only checked when fastreboot_capable is set, but
132  * fastreboot_onpanic is not set.  The amount of memory reserved
133  * is negligible, but just in case we are really short of low memory,
134  * this variable will give us a backdoor to not consume memory at all.
135  */
136 int reserve_mem_enabled = 1;
137 
138 /*
139  * Mutex to protect fastreboot_onpanic.
140  */
141 kmutex_t fastreboot_config_mutex;
142 
143 /*
144  * Amount of memory below PA 1G to reserve for constructing the multiboot
145  * data structure and the page tables as we tend to run out of those
146  * when more drivers are loaded.
147  */
148 static size_t fastboot_mbi_size = 0x2000;	/* 8K */
149 static size_t fastboot_pagetable_size = 0x5000;	/* 20K */
150 
151 /*
152  * Minimum system uptime in clock_t before Fast Reboot should be used
153  * on panic.  Will be initialized in fastboot_post_startup().
154  */
155 clock_t fastreboot_onpanic_uptime = LONG_MAX;
156 
157 /*
158  * lbolt value when the system booted.  This value will be used if the system
159  * panics to calculate how long the system has been up.  If the uptime is less
160  * than fastreboot_onpanic_uptime, a reboot through BIOS will be performed to
161  * avoid a potential panic/reboot loop.
162  */
163 clock_t lbolt_at_boot = LONG_MAX;
164 
165 /*
166  * Use below 1G for page tables as
167  *	1. we are only doing 1:1 mapping of the bottom 1G of physical memory.
168  *	2. we are using 2G as the fake virtual address for the new kernel and
169  *	boot archive.
170  */
171 static ddi_dma_attr_t fastboot_below_1G_dma_attr = {
172 	DMA_ATTR_V0,
173 	0x0000000008000000ULL,	/* dma_attr_addr_lo: 128MB */
174 	0x000000003FFFFFFFULL,	/* dma_attr_addr_hi: 1G */
175 	0x00000000FFFFFFFFULL,	/* dma_attr_count_max */
176 	0x0000000000001000ULL,	/* dma_attr_align: 4KB */
177 	1,			/* dma_attr_burstsize */
178 	1,			/* dma_attr_minxfer */
179 	0x00000000FFFFFFFFULL,	/* dma_attr_maxxfer */
180 	0x00000000FFFFFFFFULL,	/* dma_attr_seg */
181 	1,			/* dma_attr_sgllen */
182 	0x1000ULL,		/* dma_attr_granular */
183 	0,			/* dma_attr_flags */
184 };
185 
186 static ddi_dma_attr_t fastboot_dma_attr = {
187 	DMA_ATTR_V0,
188 	0x0000000008000000ULL,	/* dma_attr_addr_lo: 128MB */
189 #ifdef	__amd64
190 	0xFFFFFFFFFFFFFFFFULL,	/* dma_attr_addr_hi: 2^64B */
191 #else
192 	0x0000000FFFFFFFFFULL,	/* dma_attr_addr_hi: 64GB */
193 #endif	/* __amd64 */
194 	0x00000000FFFFFFFFULL,	/* dma_attr_count_max */
195 	0x0000000000001000ULL,	/* dma_attr_align: 4KB */
196 	1,			/* dma_attr_burstsize */
197 	1,			/* dma_attr_minxfer */
198 	0x00000000FFFFFFFFULL,	/* dma_attr_maxxfer */
199 	0x00000000FFFFFFFFULL,	/* dma_attr_seg */
200 	1,			/* dma_attr_sgllen */
201 	0x1000ULL,		/* dma_attr_granular */
202 	0,			/* dma_attr_flags */
203 };
204 
205 /*
206  * Various information saved from the previous boot to reconstruct
207  * multiboot_info.
208  */
209 extern multiboot_info_t saved_mbi;
210 extern mb_memory_map_t saved_mmap[FASTBOOT_SAVED_MMAP_COUNT];
211 extern uint8_t saved_drives[FASTBOOT_SAVED_DRIVES_SIZE];
212 extern char saved_cmdline[FASTBOOT_SAVED_CMDLINE_LEN];
213 extern int saved_cmdline_len;
214 extern size_t saved_file_size[];
215 
216 extern void* contig_alloc(size_t size, ddi_dma_attr_t *attr,
217     uintptr_t align, int cansleep);
218 extern void contig_free(void *addr, size_t size);
219 
220 
221 /* PRINTLIKE */
222 extern void vprintf(const char *, va_list);
223 
224 
225 /*
226  * Need to be able to get boot_archives from other places
227  */
228 #define	BOOTARCHIVE64	"/platform/i86pc/amd64/boot_archive"
229 #define	BOOTARCHIVE32	"/platform/i86pc/boot_archive"
230 #define	BOOTARCHIVE32_FAILSAFE	"/boot/x86.miniroot-safe"
231 #define	BOOTARCHIVE64_FAILSAFE	"/boot/amd64/x86.miniroot-safe"
232 #define	FAILSAFE_BOOTFILE32	"/boot/platform/i86pc/kernel/unix"
233 #define	FAILSAFE_BOOTFILE64	"/boot/platform/i86pc/kernel/amd64/unix"
234 
235 static uint_t fastboot_vatoindex(fastboot_info_t *, uintptr_t, int);
236 static void fastboot_map_with_size(fastboot_info_t *, uintptr_t,
237     paddr_t, size_t, int);
238 static void fastboot_build_pagetables(fastboot_info_t *);
239 static int fastboot_build_mbi(char *, fastboot_info_t *);
240 static void fastboot_free_file(fastboot_file_t *);
241 
242 static const char fastboot_enomem_msg[] = "!Fastboot: Couldn't allocate 0x%"
243 	PRIx64" bytes below %s to do fast reboot";
244 
245 static void
246 dprintf(char *fmt, ...)
247 {
248 	va_list adx;
249 
250 	if (!fastboot_debug)
251 		return;
252 
253 	va_start(adx, fmt);
254 	vprintf(fmt, adx);
255 	va_end(adx);
256 }
257 
258 
259 /*
260  * Return the index corresponding to a virt address at a given page table level.
261  */
262 static uint_t
263 fastboot_vatoindex(fastboot_info_t *nk, uintptr_t va, int level)
264 {
265 	return ((va >> nk->fi_shift_amt[level]) & (nk->fi_ptes_per_table - 1));
266 }
267 
268 
269 /*
270  * Add mapping from vstart to pstart for the specified size.
271  * vstart, pstart and size should all have been aligned at 2M boundaries.
272  */
273 static void
274 fastboot_map_with_size(fastboot_info_t *nk, uintptr_t vstart, paddr_t pstart,
275     size_t size, int level)
276 {
277 	x86pte_t	pteval, *table;
278 	uintptr_t	vaddr;
279 	paddr_t		paddr;
280 	int		index, l;
281 
282 	table = (x86pte_t *)(nk->fi_pagetable_va);
283 
284 	for (l = nk->fi_top_level; l >= level; l--) {
285 
286 		index = fastboot_vatoindex(nk, vstart, l);
287 
288 		if (l == level) {
289 			/*
290 			 * Last level.  Program the page table entries.
291 			 */
292 			for (vaddr = vstart, paddr = pstart;
293 			    vaddr < vstart + size;
294 			    vaddr += (1ULL << nk->fi_shift_amt[l]),
295 			    paddr += (1ULL << nk->fi_shift_amt[l])) {
296 
297 				uint_t index = fastboot_vatoindex(nk, vaddr, l);
298 
299 				if (l > 0)
300 					pteval = paddr | pte_bits | PT_PAGESIZE;
301 				else
302 					pteval = paddr | pte_bits;
303 
304 				table[index] = pteval;
305 			}
306 		} else if (table[index] & PT_VALID) {
307 
308 			table = (x86pte_t *)
309 			    ((uintptr_t)(((paddr_t)table[index] & MMU_PAGEMASK)
310 			    - nk->fi_pagetable_pa) + nk->fi_pagetable_va);
311 		} else {
312 			/*
313 			 * Intermediate levels.
314 			 * Program with either valid bit or PTP bits.
315 			 */
316 			if (l == nk->fi_top_level) {
317 #ifdef	__amd64
318 				ASSERT(nk->fi_top_level == 3);
319 				table[index] = nk->fi_next_table_pa | ptp_bits;
320 #else
321 				table[index] = nk->fi_next_table_pa | PT_VALID;
322 #endif	/* __amd64 */
323 			} else {
324 				table[index] = nk->fi_next_table_pa | ptp_bits;
325 			}
326 			table = (x86pte_t *)(nk->fi_next_table_va);
327 			nk->fi_next_table_va += MMU_PAGESIZE;
328 			nk->fi_next_table_pa += MMU_PAGESIZE;
329 		}
330 	}
331 }
332 
333 /*
334  * Build page tables for the lower 1G of physical memory using 2M
335  * pages, and prepare page tables for mapping new kernel and boot
336  * archive pages using 4K pages.
337  */
338 static void
339 fastboot_build_pagetables(fastboot_info_t *nk)
340 {
341 	/*
342 	 * Map lower 1G physical memory.  Use large pages.
343 	 */
344 	fastboot_map_with_size(nk, 0, 0, ONE_GIG, 1);
345 
346 	/*
347 	 * Map one 4K page to get the middle page tables set up.
348 	 */
349 	fake_va = P2ALIGN_TYPED(fake_va, nk->fi_lpagesize, uintptr_t);
350 	fastboot_map_with_size(nk, fake_va,
351 	    nk->fi_files[0].fb_pte_list_va[0] & MMU_PAGEMASK, PAGESIZE, 0);
352 }
353 
354 
355 /*
356  * Sanity check.  Look for dboot offset.
357  */
358 static int
359 fastboot_elf64_find_dboot_load_offset(void *img, off_t imgsz, uint32_t *offp)
360 {
361 	Elf64_Ehdr	*ehdr = (Elf64_Ehdr *)img;
362 	Elf64_Phdr	*phdr;
363 	uint8_t		*phdrbase;
364 	int		i;
365 
366 	if ((ehdr->e_phoff + ehdr->e_phnum * ehdr->e_phentsize) >= imgsz)
367 		return (-1);
368 
369 	phdrbase = (uint8_t *)img + ehdr->e_phoff;
370 
371 	for (i = 0; i < ehdr->e_phnum; i++) {
372 		phdr = (Elf64_Phdr *)(phdrbase + ehdr->e_phentsize * i);
373 
374 		if (phdr->p_type == PT_LOAD) {
375 			if (phdr->p_vaddr == phdr->p_paddr &&
376 			    phdr->p_vaddr == DBOOT_ENTRY_ADDRESS) {
377 				ASSERT(phdr->p_offset <= UINT32_MAX);
378 				*offp = (uint32_t)phdr->p_offset;
379 				return (0);
380 			}
381 		}
382 	}
383 
384 	return (-1);
385 }
386 
387 
388 /*
389  * Initialize text and data section information for 32-bit kernel.
390  * sectcntp - is both input/output parameter.
391  * On entry, *sectcntp contains maximum allowable number of sections;
392  * on return, it contains the actual number of sections filled.
393  */
394 static int
395 fastboot_elf32_find_loadables(void *img, off_t imgsz, fastboot_section_t *sectp,
396     int *sectcntp, uint32_t *offp)
397 {
398 	Elf32_Ehdr	*ehdr = (Elf32_Ehdr *)img;
399 	Elf32_Phdr	*phdr;
400 	uint8_t		*phdrbase;
401 	int		i;
402 	int		used_sections = 0;
403 	const int	max_sectcnt = *sectcntp;
404 
405 	if ((ehdr->e_phoff + ehdr->e_phnum * ehdr->e_phentsize) >= imgsz)
406 		return (-1);
407 
408 	phdrbase = (uint8_t *)img + ehdr->e_phoff;
409 
410 	for (i = 0; i < ehdr->e_phnum; i++) {
411 		phdr = (Elf32_Phdr *)(phdrbase + ehdr->e_phentsize * i);
412 
413 		if (phdr->p_type == PT_INTERP)
414 			return (-1);
415 
416 		if (phdr->p_type != PT_LOAD)
417 			continue;
418 
419 		if (phdr->p_vaddr == phdr->p_paddr &&
420 		    phdr->p_paddr == DBOOT_ENTRY_ADDRESS) {
421 			*offp = (uint32_t)phdr->p_offset;
422 		} else {
423 			if (max_sectcnt <= used_sections)
424 				return (-1);
425 
426 			sectp[used_sections].fb_sec_offset = phdr->p_offset;
427 			sectp[used_sections].fb_sec_paddr = phdr->p_paddr;
428 			sectp[used_sections].fb_sec_size = phdr->p_filesz;
429 			sectp[used_sections].fb_sec_bss_size =
430 			    (phdr->p_filesz < phdr->p_memsz) ?
431 			    (phdr->p_memsz - phdr->p_filesz) : 0;
432 
433 			/* Extra sanity check for the input object file */
434 			if (sectp[used_sections].fb_sec_paddr +
435 			    sectp[used_sections].fb_sec_size +
436 			    sectp[used_sections].fb_sec_bss_size >=
437 			    DBOOT_ENTRY_ADDRESS)
438 				return (-1);
439 
440 			used_sections++;
441 		}
442 	}
443 
444 	*sectcntp = used_sections;
445 	return (0);
446 }
447 
448 /*
449  * Create multiboot info structure (mbi) base on the saved mbi.
450  * Recalculate values of the pointer type fields in the data
451  * structure based on the new starting physical address of the
452  * data structure.
453  */
454 static int
455 fastboot_build_mbi(char *mdep, fastboot_info_t *nk)
456 {
457 	mb_module_t	*mbp;
458 	multiboot_info_t	*mbi;	/* pointer to multiboot structure */
459 	uintptr_t	start_addr_va;	/* starting VA of mbi */
460 	uintptr_t	start_addr_pa;	/* starting PA of mbi */
461 	size_t		offs = 0;	/* offset from the starting address */
462 	size_t		arglen;		/* length of the command line arg */
463 	size_t		size;	/* size of the memory reserved for mbi */
464 	size_t		mdnsz;	/* length of the boot archive name */
465 
466 	/*
467 	 * If mdep is not NULL or empty, use the length of mdep + 1
468 	 * (for NULL terminating) as the length of the new command
469 	 * line; else use the saved command line length as the
470 	 * length for the new command line.
471 	 */
472 	if (mdep != NULL && strlen(mdep) != 0) {
473 		arglen = strlen(mdep) + 1;
474 	} else {
475 		arglen = saved_cmdline_len;
476 	}
477 
478 	/*
479 	 * Allocate memory for the new multiboot info structure (mbi).
480 	 * If we have reserved memory for mbi but it's not enough,
481 	 * free it and reallocate.
482 	 */
483 	size = PAGESIZE + P2ROUNDUP(arglen, PAGESIZE);
484 	if (nk->fi_mbi_size && nk->fi_mbi_size < size) {
485 		contig_free((void *)nk->fi_new_mbi_va, nk->fi_mbi_size);
486 		nk->fi_mbi_size = 0;
487 	}
488 
489 	if (nk->fi_mbi_size == 0) {
490 		if ((nk->fi_new_mbi_va =
491 		    (uintptr_t)contig_alloc(size, &fastboot_below_1G_dma_attr,
492 		    PAGESIZE, 0)) == NULL) {
493 			cmn_err(CE_NOTE, fastboot_enomem_msg,
494 			    (uint64_t)size, "1G");
495 			return (-1);
496 		}
497 		/*
498 		 * fi_mbi_size must be set after the allocation succeeds
499 		 * as it's used to determine how much memory to free.
500 		 */
501 		nk->fi_mbi_size = size;
502 	}
503 
504 	/*
505 	 * Initalize memory
506 	 */
507 	bzero((void *)nk->fi_new_mbi_va, nk->fi_mbi_size);
508 
509 	/*
510 	 * Get PA for the new mbi
511 	 */
512 	start_addr_va = nk->fi_new_mbi_va;
513 	start_addr_pa = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat,
514 	    (caddr_t)start_addr_va));
515 	nk->fi_new_mbi_pa = (paddr_t)start_addr_pa;
516 
517 	/*
518 	 * Populate the rest of the fields in the data structure
519 	 */
520 
521 	/*
522 	 * Copy from the saved mbi to preserve all non-pointer type fields.
523 	 */
524 	mbi = (multiboot_info_t *)start_addr_va;
525 	bcopy(&saved_mbi, mbi, sizeof (*mbi));
526 
527 	/*
528 	 * Recalculate mods_addr.  Set mod_start and mod_end based on
529 	 * the physical address of the new boot archive.  Set mod_name
530 	 * to the name of the new boto archive.
531 	 */
532 	offs += sizeof (multiboot_info_t);
533 	mbi->mods_addr = start_addr_pa + offs;
534 	mbp = (mb_module_t *)(start_addr_va + offs);
535 	mbp->mod_start = nk->fi_files[FASTBOOT_BOOTARCHIVE].fb_dest_pa;
536 	mbp->mod_end = nk->fi_files[FASTBOOT_BOOTARCHIVE].fb_next_pa;
537 
538 	offs += sizeof (mb_module_t);
539 	mdnsz = strlen(fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE]) + 1;
540 	bcopy(fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE],
541 	    (void *)(start_addr_va + offs), mdnsz);
542 	mbp->mod_name = start_addr_pa + offs;
543 	mbp->reserved = 0;
544 
545 	/*
546 	 * Make sure the offset is 16-byte aligned to avoid unaligned access.
547 	 */
548 	offs += mdnsz;
549 	offs = P2ROUNDUP_TYPED(offs, 16, size_t);
550 
551 	/*
552 	 * Recalculate mmap_addr
553 	 */
554 	mbi->mmap_addr = start_addr_pa + offs;
555 	bcopy((void *)(uintptr_t)saved_mmap, (void *)(start_addr_va + offs),
556 	    saved_mbi.mmap_length);
557 	offs += saved_mbi.mmap_length;
558 
559 	/*
560 	 * Recalculate drives_addr
561 	 */
562 	mbi->drives_addr = start_addr_pa + offs;
563 	bcopy((void *)(uintptr_t)saved_drives, (void *)(start_addr_va + offs),
564 	    saved_mbi.drives_length);
565 	offs += saved_mbi.drives_length;
566 
567 	/*
568 	 * Recalculate the address of cmdline.  Set cmdline to contain the
569 	 * new boot argument.
570 	 */
571 	mbi->cmdline = start_addr_pa + offs;
572 
573 	if (mdep != NULL && strlen(mdep) != 0) {
574 		bcopy(mdep, (void *)(start_addr_va + offs), arglen);
575 	} else {
576 		bcopy((void *)saved_cmdline, (void *)(start_addr_va + offs),
577 		    arglen);
578 	}
579 
580 	/* clear fields and flags that are not copied */
581 	bzero(&mbi->config_table,
582 	    sizeof (*mbi) - offsetof(multiboot_info_t, config_table));
583 	mbi->flags &= ~(MB_INFO_CONFIG_TABLE | MB_INFO_BOOT_LOADER_NAME |
584 	    MB_INFO_APM_TABLE | MB_INFO_VIDEO_INFO);
585 
586 	return (0);
587 }
588 
589 /*
590  * Initialize HAT related fields
591  */
592 static void
593 fastboot_init_fields(fastboot_info_t *nk)
594 {
595 	if (x86_feature & X86_PAE) {
596 		nk->fi_has_pae = 1;
597 		nk->fi_shift_amt = fastboot_shift_amt_pae;
598 		nk->fi_ptes_per_table = 512;
599 		nk->fi_lpagesize = (2 << 20);	/* 2M */
600 #ifdef	__amd64
601 		nk->fi_top_level = 3;
602 #else
603 		nk->fi_top_level = 2;
604 #endif	/* __amd64 */
605 	}
606 }
607 
608 /*
609  * Process boot argument
610  */
611 static void
612 fastboot_parse_mdep(char *mdep, char *kern_bootpath, int *bootpath_len,
613     char *bootargs)
614 {
615 	int	i;
616 
617 	/*
618 	 * If mdep is not NULL, it comes in the format of
619 	 *	mountpoint unix args
620 	 */
621 	if (mdep != NULL && strlen(mdep) != 0) {
622 		if (mdep[0] != '-') {
623 			/* First get the root argument */
624 			i = 0;
625 			while (mdep[i] != '\0' && mdep[i] != ' ') {
626 				i++;
627 			}
628 
629 			if (i < 4 || strncmp(&mdep[i-4], "unix", 4) != 0) {
630 				/* mount point */
631 				bcopy(mdep, kern_bootpath, i);
632 				kern_bootpath[i] = '\0';
633 				*bootpath_len = i;
634 
635 				/*
636 				 * Get the next argument. It should be unix as
637 				 * we have validated in in halt.c.
638 				 */
639 				if (strlen(mdep) > i) {
640 					mdep += (i + 1);
641 					i = 0;
642 					while (mdep[i] != '\0' &&
643 					    mdep[i] != ' ') {
644 						i++;
645 					}
646 				}
647 
648 			}
649 			bcopy(mdep, kern_bootfile, i);
650 			kern_bootfile[i] = '\0';
651 			bcopy(mdep, bootargs, strlen(mdep));
652 		} else {
653 			int off = strlen(kern_bootfile);
654 			bcopy(kern_bootfile, bootargs, off);
655 			bcopy(" ", &bootargs[off++], 1);
656 			bcopy(mdep, &bootargs[off], strlen(mdep));
657 			off += strlen(mdep);
658 			bootargs[off] = '\0';
659 		}
660 	}
661 }
662 
663 /*
664  * Reserve memory under PA 1G for mapping the new kernel and boot archive.
665  * This function is only called if fastreboot_onpanic is *not* set.
666  */
667 static void
668 fastboot_reserve_mem(fastboot_info_t *nk)
669 {
670 	int i;
671 
672 	/*
673 	 * A valid kernel is in place.  No need to reserve any memory.
674 	 */
675 	if (nk->fi_valid)
676 		return;
677 
678 	/*
679 	 * Reserve memory under PA 1G for PTE lists.
680 	 */
681 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
682 		fastboot_file_t *fb = &nk->fi_files[i];
683 		size_t fsize_roundup, size;
684 
685 		fsize_roundup = P2ROUNDUP_TYPED(saved_file_size[i],
686 		    PAGESIZE, size_t);
687 		size = FASTBOOT_PTE_LIST_SIZE(fsize_roundup);
688 		if ((fb->fb_pte_list_va = contig_alloc(size,
689 		    &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) {
690 			return;
691 		}
692 		fb->fb_pte_list_size = size;
693 	}
694 
695 	/*
696 	 * Reserve memory under PA 1G for page tables.
697 	 */
698 	if ((nk->fi_pagetable_va =
699 	    (uintptr_t)contig_alloc(fastboot_pagetable_size,
700 	    &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) {
701 		return;
702 	}
703 	nk->fi_pagetable_size = fastboot_pagetable_size;
704 
705 	/*
706 	 * Reserve memory under PA 1G for multiboot structure.
707 	 */
708 	if ((nk->fi_new_mbi_va = (uintptr_t)contig_alloc(fastboot_mbi_size,
709 	    &fastboot_below_1G_dma_attr, PAGESIZE, 0)) == NULL) {
710 		return;
711 	}
712 	nk->fi_mbi_size = fastboot_mbi_size;
713 }
714 
715 /*
716  * Calculate MD5 digest for the given fastboot_file.
717  * Assumes that the file is allready loaded properly.
718  */
719 static void
720 fastboot_cksum_file(fastboot_file_t *fb, uchar_t *md5_hash)
721 {
722 	MD5_CTX md5_ctx;
723 
724 	MD5Init(&md5_ctx);
725 	MD5Update(&md5_ctx, (void *)fb->fb_va, fb->fb_size);
726 	MD5Final(md5_hash, &md5_ctx);
727 }
728 
729 /*
730  * Free up the memory we have allocated for a file
731  */
732 static void
733 fastboot_free_file(fastboot_file_t *fb)
734 {
735 	size_t	fsize_roundup;
736 
737 	fsize_roundup = P2ROUNDUP_TYPED(fb->fb_size, PAGESIZE, size_t);
738 	if (fsize_roundup) {
739 		contig_free((void *)fb->fb_va, fsize_roundup);
740 		fb->fb_va = NULL;
741 		fb->fb_size = 0;
742 	}
743 }
744 
745 /*
746  * Free up memory used by the PTEs for a file.
747  */
748 static void
749 fastboot_free_file_pte(fastboot_file_t *fb, uint64_t endaddr)
750 {
751 	if (fb->fb_pte_list_size && fb->fb_pte_list_pa < endaddr) {
752 		contig_free((void *)fb->fb_pte_list_va, fb->fb_pte_list_size);
753 		fb->fb_pte_list_va = 0;
754 		fb->fb_pte_list_pa = 0;
755 		fb->fb_pte_list_size = 0;
756 	}
757 }
758 
759 /*
760  * Free up all the memory used for representing a kernel with
761  * fastboot_info_t.
762  */
763 static void
764 fastboot_free_mem(fastboot_info_t *nk, uint64_t endaddr)
765 {
766 	int i;
767 
768 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
769 		fastboot_free_file(nk->fi_files + i);
770 		fastboot_free_file_pte(nk->fi_files + i, endaddr);
771 	}
772 
773 	if (nk->fi_pagetable_size && nk->fi_pagetable_pa < endaddr) {
774 		contig_free((void *)nk->fi_pagetable_va, nk->fi_pagetable_size);
775 		nk->fi_pagetable_va = 0;
776 		nk->fi_pagetable_pa = 0;
777 		nk->fi_pagetable_size = 0;
778 	}
779 
780 	if (nk->fi_mbi_size && nk->fi_new_mbi_pa < endaddr) {
781 		contig_free((void *)nk->fi_new_mbi_va, nk->fi_mbi_size);
782 		nk->fi_new_mbi_va = 0;
783 		nk->fi_new_mbi_pa = 0;
784 		nk->fi_mbi_size = 0;
785 	}
786 }
787 
788 /*
789  * Only free up the memory allocated for the kernel and boot archive,
790  * but not for the page tables.
791  */
792 void
793 fastboot_free_newkernel(fastboot_info_t *nk)
794 {
795 	int i;
796 
797 	nk->fi_valid = 0;
798 	/*
799 	 * Free the memory we have allocated
800 	 */
801 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
802 		fastboot_free_file(&(nk->fi_files[i]));
803 	}
804 }
805 
806 static void
807 fastboot_cksum_cdata(fastboot_info_t *nk, uchar_t *md5_hash)
808 {
809 	int i;
810 	MD5_CTX md5_ctx;
811 
812 	MD5Init(&md5_ctx);
813 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
814 		MD5Update(&md5_ctx, nk->fi_files[i].fb_pte_list_va,
815 		    nk->fi_files[i].fb_pte_list_size);
816 	}
817 	MD5Update(&md5_ctx, (void *)nk->fi_pagetable_va, nk->fi_pagetable_size);
818 	MD5Update(&md5_ctx, (void *)nk->fi_new_mbi_va, nk->fi_mbi_size);
819 
820 	MD5Final(md5_hash, &md5_ctx);
821 }
822 
823 /*
824  * Generate MD5 checksum of the given kernel.
825  */
826 static void
827 fastboot_cksum_generate(fastboot_info_t *nk)
828 {
829 	int i;
830 
831 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
832 		fastboot_cksum_file(nk->fi_files + i, nk->fi_md5_hash[i]);
833 	}
834 	fastboot_cksum_cdata(nk, nk->fi_md5_hash[i]);
835 }
836 
837 /*
838  * Calculate MD5 checksum of the given kernel and verify that
839  * it matches with what was calculated before.
840  */
841 int
842 fastboot_cksum_verify(fastboot_info_t *nk)
843 {
844 	int i;
845 	uchar_t md5_hash[MD5_DIGEST_LENGTH];
846 
847 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
848 		fastboot_cksum_file(nk->fi_files + i, md5_hash);
849 		if (bcmp(nk->fi_md5_hash[i], md5_hash,
850 		    sizeof (nk->fi_md5_hash[i])) != 0)
851 			return (i + 1);
852 	}
853 
854 	fastboot_cksum_cdata(nk, md5_hash);
855 	if (bcmp(nk->fi_md5_hash[i], md5_hash,
856 	    sizeof (nk->fi_md5_hash[i])) != 0)
857 		return (i + 1);
858 
859 	return (0);
860 }
861 
862 /*
863  * This function performs the following tasks:
864  * - Read the sizes of the new kernel and boot archive.
865  * - Allocate memory for the new kernel and boot archive.
866  * - Allocate memory for page tables necessary for mapping the memory
867  *   allocated for the files.
868  * - Read the new kernel and boot archive into memory.
869  * - Map in the fast reboot switcher.
870  * - Load the fast reboot switcher to FASTBOOT_SWTCH_PA.
871  * - Build the new multiboot_info structure
872  * - Build page tables for the low 1G of physical memory.
873  * - Mark the data structure as valid if all steps have succeeded.
874  */
875 void
876 fastboot_load_kernel(char *mdep)
877 {
878 	void		*buf = NULL;
879 	int		i;
880 	fastboot_file_t	*fb;
881 	uint32_t	dboot_start_offset;
882 	char		kern_bootpath[OBP_MAXPATHLEN];
883 	extern uintptr_t postbootkernelbase;
884 	uintptr_t	saved_kernelbase;
885 	int		bootpath_len = 0;
886 	int		is_failsafe = 0;
887 	int		is_retry = 0;
888 	uint64_t	end_addr;
889 
890 	if (!fastreboot_capable)
891 		return;
892 
893 	if (newkernel.fi_valid)
894 		fastboot_free_newkernel(&newkernel);
895 
896 	saved_kernelbase = postbootkernelbase;
897 
898 	postbootkernelbase = 0;
899 
900 	/*
901 	 * Initialize various HAT related fields in the data structure
902 	 */
903 	fastboot_init_fields(&newkernel);
904 
905 	bzero(kern_bootpath, OBP_MAXPATHLEN);
906 
907 	/*
908 	 * Process the boot argument
909 	 */
910 	bzero(fastboot_args, OBP_MAXPATHLEN);
911 	fastboot_parse_mdep(mdep, kern_bootpath, &bootpath_len, fastboot_args);
912 
913 	/*
914 	 * Make sure we get the null character
915 	 */
916 	bcopy(kern_bootpath, fastboot_filename[FASTBOOT_NAME_UNIX],
917 	    bootpath_len);
918 	bcopy(kern_bootfile,
919 	    &fastboot_filename[FASTBOOT_NAME_UNIX][bootpath_len],
920 	    strlen(kern_bootfile) + 1);
921 
922 	bcopy(kern_bootpath, fastboot_filename[FASTBOOT_NAME_BOOTARCHIVE],
923 	    bootpath_len);
924 
925 	if (bcmp(kern_bootfile, FAILSAFE_BOOTFILE32,
926 	    (sizeof (FAILSAFE_BOOTFILE32) - 1)) == 0 ||
927 	    bcmp(kern_bootfile, FAILSAFE_BOOTFILE64,
928 	    (sizeof (FAILSAFE_BOOTFILE64) - 1)) == 0) {
929 		is_failsafe = 1;
930 	}
931 
932 load_kernel_retry:
933 	/*
934 	 * Read in unix and boot_archive
935 	 */
936 	end_addr = DBOOT_ENTRY_ADDRESS;
937 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
938 		struct _buf	*file;
939 		uintptr_t	va;
940 		uint64_t	fsize;
941 		size_t		fsize_roundup, pt_size;
942 		int		page_index;
943 		uintptr_t	offset;
944 		ddi_dma_attr_t dma_attr = fastboot_dma_attr;
945 
946 
947 		dprintf("fastboot_filename[%d] = %s\n",
948 		    i, fastboot_filename[i]);
949 
950 		if ((file = kobj_open_file(fastboot_filename[i])) ==
951 		    (struct _buf *)-1) {
952 			cmn_err(CE_NOTE, "!Fastboot: Couldn't open %s",
953 			    fastboot_filename[i]);
954 			goto err_out;
955 		}
956 
957 		if (kobj_get_filesize(file, &fsize) != 0) {
958 			cmn_err(CE_NOTE,
959 			    "!Fastboot: Couldn't get filesize for %s",
960 			    fastboot_filename[i]);
961 			goto err_out;
962 		}
963 
964 		fsize_roundup = P2ROUNDUP_TYPED(fsize, PAGESIZE, size_t);
965 
966 		/*
967 		 * Where the files end in physical memory after being
968 		 * relocated by the fast boot switcher.
969 		 */
970 		end_addr += fsize_roundup;
971 		if (end_addr > fastboot_below_1G_dma_attr.dma_attr_addr_hi) {
972 			cmn_err(CE_NOTE, "!Fastboot: boot archive is too big");
973 			goto err_out;
974 		}
975 
976 		/*
977 		 * Adjust dma_attr_addr_lo so that the new kernel and boot
978 		 * archive will not be overridden during relocation.
979 		 */
980 		if (end_addr > fastboot_dma_attr.dma_attr_addr_lo ||
981 		    end_addr > fastboot_below_1G_dma_attr.dma_attr_addr_lo) {
982 
983 			if (is_retry) {
984 				/*
985 				 * If we have already tried and didn't succeed,
986 				 * just give up.
987 				 */
988 				cmn_err(CE_NOTE,
989 				    "!Fastboot: boot archive is too big");
990 				goto err_out;
991 			} else {
992 				/* Set the flag so we don't keep retrying */
993 				is_retry++;
994 
995 				/* Adjust dma_attr_addr_lo */
996 				fastboot_dma_attr.dma_attr_addr_lo = end_addr;
997 				fastboot_below_1G_dma_attr.dma_attr_addr_lo =
998 				    end_addr;
999 
1000 				/*
1001 				 * Free the memory we have already allocated
1002 				 * whose physical addresses might not fit
1003 				 * the new lo and hi constraints.
1004 				 */
1005 				fastboot_free_mem(&newkernel, end_addr);
1006 				goto load_kernel_retry;
1007 			}
1008 		}
1009 
1010 
1011 		if (!fastboot_contig)
1012 			dma_attr.dma_attr_sgllen = (fsize / PAGESIZE) +
1013 			    (((fsize % PAGESIZE) == 0) ? 0 : 1);
1014 
1015 		if ((buf = contig_alloc(fsize, &dma_attr, PAGESIZE, 0))
1016 		    == NULL) {
1017 			cmn_err(CE_NOTE, fastboot_enomem_msg, fsize, "64G");
1018 			goto err_out;
1019 		}
1020 
1021 		va = P2ROUNDUP_TYPED((uintptr_t)buf, PAGESIZE, uintptr_t);
1022 
1023 		if (kobj_read_file(file, (char *)va, fsize, 0) < 0) {
1024 			cmn_err(CE_NOTE, "!Fastboot: Couldn't read %s",
1025 			    fastboot_filename[i]);
1026 			goto err_out;
1027 		}
1028 
1029 		fb = &newkernel.fi_files[i];
1030 		fb->fb_va = va;
1031 		fb->fb_size = fsize;
1032 		fb->fb_sectcnt = 0;
1033 
1034 		pt_size = FASTBOOT_PTE_LIST_SIZE(fsize_roundup);
1035 
1036 		/*
1037 		 * If we have reserved memory but it not enough, free it.
1038 		 */
1039 		if (fb->fb_pte_list_size && fb->fb_pte_list_size < pt_size) {
1040 			contig_free((void *)fb->fb_pte_list_va,
1041 			    fb->fb_pte_list_size);
1042 			fb->fb_pte_list_size = 0;
1043 		}
1044 
1045 		if (fb->fb_pte_list_size == 0) {
1046 			if ((fb->fb_pte_list_va =
1047 			    (x86pte_t *)contig_alloc(pt_size,
1048 			    &fastboot_below_1G_dma_attr, PAGESIZE, 0))
1049 			    == NULL) {
1050 				cmn_err(CE_NOTE, fastboot_enomem_msg,
1051 				    (uint64_t)pt_size, "1G");
1052 				goto err_out;
1053 			}
1054 			/*
1055 			 * fb_pte_list_size must be set after the allocation
1056 			 * succeeds as it's used to determine how much memory to
1057 			 * free.
1058 			 */
1059 			fb->fb_pte_list_size = pt_size;
1060 		}
1061 
1062 		bzero((void *)(fb->fb_pte_list_va), fb->fb_pte_list_size);
1063 
1064 		fb->fb_pte_list_pa = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat,
1065 		    (caddr_t)fb->fb_pte_list_va));
1066 
1067 		for (page_index = 0, offset = 0; offset < fb->fb_size;
1068 		    offset += PAGESIZE) {
1069 			uint64_t paddr;
1070 
1071 			paddr = mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat,
1072 			    (caddr_t)fb->fb_va + offset));
1073 
1074 			ASSERT(paddr >= fastboot_dma_attr.dma_attr_addr_lo);
1075 
1076 			/*
1077 			 * Include the pte_bits so we don't have to make
1078 			 * it in assembly.
1079 			 */
1080 			fb->fb_pte_list_va[page_index++] = (x86pte_t)
1081 			    (paddr | pte_bits);
1082 		}
1083 
1084 		fb->fb_pte_list_va[page_index] = FASTBOOT_TERMINATE;
1085 
1086 		if (i == FASTBOOT_UNIX) {
1087 			Ehdr	*ehdr = (Ehdr *)va;
1088 			int	j;
1089 
1090 			/*
1091 			 * Sanity checks:
1092 			 */
1093 			for (j = 0; j < SELFMAG; j++) {
1094 				if (ehdr->e_ident[j] != ELFMAG[j]) {
1095 					cmn_err(CE_NOTE, "!Fastboot: Bad ELF "
1096 					    "signature");
1097 					goto err_out;
1098 				}
1099 			}
1100 
1101 			if (ehdr->e_ident[EI_CLASS] == ELFCLASS32 &&
1102 			    ehdr->e_ident[EI_DATA] == ELFDATA2LSB &&
1103 			    ehdr->e_machine == EM_386) {
1104 
1105 				fb->fb_sectcnt = sizeof (fb->fb_sections) /
1106 				    sizeof (fb->fb_sections[0]);
1107 
1108 				if (fastboot_elf32_find_loadables((void *)va,
1109 				    fsize, &fb->fb_sections[0],
1110 				    &fb->fb_sectcnt, &dboot_start_offset) < 0) {
1111 					cmn_err(CE_NOTE, "!Fastboot: ELF32 "
1112 					    "program section failure");
1113 					goto err_out;
1114 				}
1115 
1116 				if (fb->fb_sectcnt == 0) {
1117 					cmn_err(CE_NOTE, "!Fastboot: No ELF32 "
1118 					    "program sections found");
1119 					goto err_out;
1120 				}
1121 
1122 				if (is_failsafe) {
1123 					/* Failsafe boot_archive */
1124 					bcopy(BOOTARCHIVE32_FAILSAFE,
1125 					    &fastboot_filename
1126 					    [FASTBOOT_NAME_BOOTARCHIVE]
1127 					    [bootpath_len],
1128 					    sizeof (BOOTARCHIVE32_FAILSAFE));
1129 				} else {
1130 					bcopy(BOOTARCHIVE32,
1131 					    &fastboot_filename
1132 					    [FASTBOOT_NAME_BOOTARCHIVE]
1133 					    [bootpath_len],
1134 					    sizeof (BOOTARCHIVE32));
1135 				}
1136 
1137 			} else if (ehdr->e_ident[EI_CLASS] == ELFCLASS64 &&
1138 			    ehdr->e_ident[EI_DATA] == ELFDATA2LSB &&
1139 			    ehdr->e_machine == EM_AMD64) {
1140 
1141 				if (fastboot_elf64_find_dboot_load_offset(
1142 				    (void *)va, fsize, &dboot_start_offset)
1143 				    != 0) {
1144 					cmn_err(CE_NOTE, "!Fastboot: Couldn't "
1145 					    "find ELF64 dboot entry offset");
1146 					goto err_out;
1147 				}
1148 
1149 				if ((x86_feature & X86_64) == 0 ||
1150 				    (x86_feature & X86_PAE) == 0) {
1151 					cmn_err(CE_NOTE, "!Fastboot: Cannot "
1152 					    "reboot to %s: "
1153 					    "not a 64-bit capable system",
1154 					    kern_bootfile);
1155 					goto err_out;
1156 				}
1157 
1158 				if (is_failsafe) {
1159 					/* Failsafe boot_archive */
1160 					bcopy(BOOTARCHIVE64_FAILSAFE,
1161 					    &fastboot_filename
1162 					    [FASTBOOT_NAME_BOOTARCHIVE]
1163 					    [bootpath_len],
1164 					    sizeof (BOOTARCHIVE64_FAILSAFE));
1165 				} else {
1166 					bcopy(BOOTARCHIVE64,
1167 					    &fastboot_filename
1168 					    [FASTBOOT_NAME_BOOTARCHIVE]
1169 					    [bootpath_len],
1170 					    sizeof (BOOTARCHIVE64));
1171 				}
1172 			} else {
1173 				cmn_err(CE_NOTE, "!Fastboot: Unknown ELF type");
1174 				goto err_out;
1175 			}
1176 
1177 			fb->fb_dest_pa = DBOOT_ENTRY_ADDRESS -
1178 			    dboot_start_offset;
1179 
1180 			fb->fb_next_pa = DBOOT_ENTRY_ADDRESS + fsize_roundup;
1181 		} else {
1182 			fb->fb_dest_pa = newkernel.fi_files[i - 1].fb_next_pa;
1183 			fb->fb_next_pa = fb->fb_dest_pa + fsize_roundup;
1184 		}
1185 
1186 		kobj_close_file(file);
1187 
1188 	}
1189 
1190 	/*
1191 	 * Add the function that will switch us to 32-bit protected mode
1192 	 */
1193 	fb = &newkernel.fi_files[FASTBOOT_SWTCH];
1194 	fb->fb_va = fb->fb_dest_pa = FASTBOOT_SWTCH_PA;
1195 	fb->fb_size = MMU_PAGESIZE;
1196 
1197 	hat_devload(kas.a_hat, (caddr_t)fb->fb_va,
1198 	    MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa),
1199 	    PROT_READ | PROT_WRITE | PROT_EXEC,
1200 	    HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK);
1201 
1202 	/*
1203 	 * Build the new multiboot_info structure
1204 	 */
1205 	if (fastboot_build_mbi(fastboot_args, &newkernel) != 0) {
1206 		goto err_out;
1207 	}
1208 
1209 	/*
1210 	 * Build page table for low 1G physical memory. Use big pages.
1211 	 * Allocate 4 (5 for amd64) pages for the page tables.
1212 	 *    1 page for PML4 (amd64)
1213 	 *    1 page for Page-Directory-Pointer Table
1214 	 *    2 pages for Page Directory
1215 	 *    1 page for Page Table.
1216 	 * The page table entry will be rewritten to map the physical
1217 	 * address as we do the copying.
1218 	 */
1219 	if (newkernel.fi_has_pae) {
1220 #ifdef	__amd64
1221 		size_t size = MMU_PAGESIZE * 5;
1222 #else
1223 		size_t size = MMU_PAGESIZE * 4;
1224 #endif	/* __amd64 */
1225 
1226 		if (newkernel.fi_pagetable_size && newkernel.fi_pagetable_size
1227 		    < size) {
1228 			contig_free((void *)newkernel.fi_pagetable_va,
1229 			    newkernel.fi_pagetable_size);
1230 			newkernel.fi_pagetable_size = 0;
1231 		}
1232 
1233 		if (newkernel.fi_pagetable_size == 0) {
1234 			if ((newkernel.fi_pagetable_va = (uintptr_t)
1235 			    contig_alloc(size, &fastboot_below_1G_dma_attr,
1236 			    MMU_PAGESIZE, 0)) == NULL) {
1237 				cmn_err(CE_NOTE, fastboot_enomem_msg,
1238 				    (uint64_t)size, "1G");
1239 				goto err_out;
1240 			}
1241 			/*
1242 			 * fi_pagetable_size must be set after the allocation
1243 			 * succeeds as it's used to determine how much memory to
1244 			 * free.
1245 			 */
1246 			newkernel.fi_pagetable_size = size;
1247 		}
1248 
1249 		bzero((void *)(newkernel.fi_pagetable_va), size);
1250 
1251 		newkernel.fi_pagetable_pa =
1252 		    mmu_ptob((uint64_t)hat_getpfnum(kas.a_hat,
1253 		    (caddr_t)newkernel.fi_pagetable_va));
1254 
1255 		newkernel.fi_last_table_pa = newkernel.fi_pagetable_pa +
1256 		    size - MMU_PAGESIZE;
1257 
1258 		newkernel.fi_next_table_va = newkernel.fi_pagetable_va +
1259 		    MMU_PAGESIZE;
1260 		newkernel.fi_next_table_pa = newkernel.fi_pagetable_pa +
1261 		    MMU_PAGESIZE;
1262 
1263 		fastboot_build_pagetables(&newkernel);
1264 	}
1265 
1266 
1267 	/* Generate MD5 checksums */
1268 	fastboot_cksum_generate(&newkernel);
1269 
1270 	/* Mark it as valid */
1271 	newkernel.fi_valid = 1;
1272 	newkernel.fi_magic = FASTBOOT_MAGIC;
1273 
1274 	postbootkernelbase = saved_kernelbase;
1275 	return;
1276 
1277 err_out:
1278 	postbootkernelbase = saved_kernelbase;
1279 	newkernel.fi_valid = 0;
1280 	fastboot_free_newkernel(&newkernel);
1281 }
1282 
1283 
1284 /* ARGSUSED */
1285 static int
1286 fastboot_xc_func(fastboot_info_t *nk, xc_arg_t unused2, xc_arg_t unused3)
1287 {
1288 	void (*fastboot_func)(fastboot_info_t *);
1289 	fastboot_file_t	*fb = &nk->fi_files[FASTBOOT_SWTCH];
1290 	fastboot_func = (void (*)())(fb->fb_va);
1291 	kthread_t *t_intr = curthread->t_intr;
1292 
1293 	if (&kas != curproc->p_as) {
1294 		hat_devload(curproc->p_as->a_hat, (caddr_t)fb->fb_va,
1295 		    MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa),
1296 		    PROT_READ | PROT_WRITE | PROT_EXEC,
1297 		    HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK);
1298 	}
1299 
1300 	/*
1301 	 * If we have pinned a thread, make sure the address is mapped
1302 	 * in the address space of the pinned thread.
1303 	 */
1304 	if (t_intr && t_intr->t_procp->p_as->a_hat != curproc->p_as->a_hat &&
1305 	    t_intr->t_procp->p_as != &kas)
1306 		hat_devload(t_intr->t_procp->p_as->a_hat, (caddr_t)fb->fb_va,
1307 		    MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa),
1308 		    PROT_READ | PROT_WRITE | PROT_EXEC,
1309 		    HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK);
1310 
1311 	(*psm_shutdownf)(A_SHUTDOWN, AD_FASTREBOOT);
1312 	(*fastboot_func)(nk);
1313 
1314 	/*NOTREACHED*/
1315 	return (0);
1316 }
1317 
1318 /*
1319  * Jump to the fast reboot switcher.  This function never returns.
1320  */
1321 void
1322 fast_reboot()
1323 {
1324 	processorid_t bootcpuid = 0;
1325 	extern uintptr_t postbootkernelbase;
1326 	extern char	fb_swtch_image[];
1327 	fastboot_file_t	*fb;
1328 	int i;
1329 
1330 	postbootkernelbase = 0;
1331 
1332 	fb = &newkernel.fi_files[FASTBOOT_SWTCH];
1333 
1334 	/*
1335 	 * Map the address into both the current proc's address
1336 	 * space and the kernel's address space in case the panic
1337 	 * is forced by kmdb.
1338 	 */
1339 	if (&kas != curproc->p_as) {
1340 		hat_devload(curproc->p_as->a_hat, (caddr_t)fb->fb_va,
1341 		    MMU_PAGESIZE, mmu_btop(fb->fb_dest_pa),
1342 		    PROT_READ | PROT_WRITE | PROT_EXEC,
1343 		    HAT_LOAD_NOCONSIST | HAT_LOAD_LOCK);
1344 	}
1345 
1346 	bcopy((void *)fb_swtch_image, (void *)fb->fb_va, fb->fb_size);
1347 
1348 
1349 	/*
1350 	 * Set fb_va to fake_va
1351 	 */
1352 	for (i = 0; i < FASTBOOT_MAX_FILES_MAP; i++) {
1353 		newkernel.fi_files[i].fb_va = fake_va;
1354 
1355 	}
1356 
1357 	if (panicstr && CPU->cpu_id != bootcpuid &&
1358 	    CPU_ACTIVE(cpu_get(bootcpuid))) {
1359 		extern void panic_idle(void);
1360 		cpuset_t cpuset;
1361 
1362 		CPUSET_ZERO(cpuset);
1363 		CPUSET_ADD(cpuset, bootcpuid);
1364 		xc_priority((xc_arg_t)&newkernel, 0, 0, CPUSET2BV(cpuset),
1365 		    (xc_func_t)fastboot_xc_func);
1366 
1367 		panic_idle();
1368 	} else
1369 		(void) fastboot_xc_func(&newkernel, 0, 0);
1370 }
1371 
1372 
1373 /*
1374  * Get boot property value for fastreboot_onpanic.
1375  *
1376  * NOTE: If fastreboot_onpanic is set to non-zero in /etc/system,
1377  * new setting passed in via "-B fastreboot_onpanic" is ignored.
1378  * This order of precedence is to enable developers debugging panics
1379  * that occur early in boot to utilize Fast Reboot on panic.
1380  */
1381 static void
1382 fastboot_get_bootprop(void)
1383 {
1384 	int		val = 0xaa, len, ret;
1385 	dev_info_t	*devi;
1386 	char		*propstr = NULL;
1387 
1388 	devi = ddi_root_node();
1389 
1390 	ret = ddi_prop_lookup_string(DDI_DEV_T_ANY, devi, DDI_PROP_DONTPASS,
1391 	    FASTREBOOT_ONPANIC, &propstr);
1392 
1393 	if (ret == DDI_PROP_SUCCESS) {
1394 		if (FASTREBOOT_ONPANIC_NOTSET(propstr))
1395 			val = 0;
1396 		else if (FASTREBOOT_ONPANIC_ISSET(propstr))
1397 			val = UA_FASTREBOOT_ONPANIC;
1398 
1399 		/*
1400 		 * Only set fastreboot_onpanic to the value passed in
1401 		 * if it's not already set to non-zero, and the value
1402 		 * has indeed been passed in via command line.
1403 		 */
1404 		if (!fastreboot_onpanic && val != 0xaa)
1405 			fastreboot_onpanic = val;
1406 		ddi_prop_free(propstr);
1407 	} else if (ret != DDI_PROP_NOT_FOUND && ret != DDI_PROP_UNDEFINED) {
1408 		cmn_err(CE_NOTE, "!%s value is invalid, will be ignored",
1409 		    FASTREBOOT_ONPANIC);
1410 	}
1411 
1412 	len = sizeof (fastreboot_onpanic_cmdline);
1413 	ret = ddi_getlongprop_buf(DDI_DEV_T_ANY, devi, DDI_PROP_DONTPASS,
1414 	    FASTREBOOT_ONPANIC_CMDLINE, fastreboot_onpanic_cmdline, &len);
1415 
1416 	if (ret == DDI_PROP_BUF_TOO_SMALL)
1417 		cmn_err(CE_NOTE, "!%s value is too long, will be ignored",
1418 		    FASTREBOOT_ONPANIC_CMDLINE);
1419 }
1420 
1421 /*
1422  * This function is called by main() to either load the backup kernel for panic
1423  * fast reboot, or to reserve low physical memory for fast reboot.
1424  */
1425 void
1426 fastboot_post_startup()
1427 {
1428 	lbolt_at_boot = ddi_get_lbolt();
1429 
1430 	/* Default to 10 minutes */
1431 	if (fastreboot_onpanic_uptime == LONG_MAX)
1432 		fastreboot_onpanic_uptime = SEC_TO_TICK(10 * 60);
1433 
1434 	if (!fastreboot_capable)
1435 		return;
1436 
1437 	mutex_enter(&fastreboot_config_mutex);
1438 
1439 	fastboot_get_bootprop();
1440 
1441 	if (fastreboot_onpanic)
1442 		fastboot_load_kernel(fastreboot_onpanic_cmdline);
1443 	else if (reserve_mem_enabled)
1444 		fastboot_reserve_mem(&newkernel);
1445 
1446 	mutex_exit(&fastreboot_config_mutex);
1447 }
1448 
1449 /*
1450  * Update boot configuration settings.
1451  * If the new fastreboot_onpanic setting is false, and a kernel has
1452  * been preloaded, free the memory;
1453  * if the new fastreboot_onpanic setting is true and newkernel is
1454  * not valid, load the new kernel.
1455  */
1456 void
1457 fastboot_update_config(const char *mdep)
1458 {
1459 	uint8_t boot_config = (uint8_t)*mdep;
1460 	int cur_fastreboot_onpanic;
1461 
1462 	if (!fastreboot_capable)
1463 		return;
1464 
1465 	mutex_enter(&fastreboot_config_mutex);
1466 
1467 	cur_fastreboot_onpanic = fastreboot_onpanic;
1468 	fastreboot_onpanic = boot_config & UA_FASTREBOOT_ONPANIC;
1469 
1470 	if (fastreboot_onpanic && (!cur_fastreboot_onpanic ||
1471 	    !newkernel.fi_valid))
1472 		fastboot_load_kernel(fastreboot_onpanic_cmdline);
1473 	if (cur_fastreboot_onpanic && !fastreboot_onpanic)
1474 		fastboot_free_newkernel(&newkernel);
1475 
1476 	mutex_exit(&fastreboot_config_mutex);
1477 }
1478 
1479 /*
1480  * This is the interface to be called by other kernel components to
1481  * disable fastreboot_onpanic.
1482  */
1483 void
1484 fastreboot_disable()
1485 {
1486 	uint8_t boot_config = (uint8_t)(~UA_FASTREBOOT_ONPANIC);
1487 	fastboot_update_config((const char *)&boot_config);
1488 }
1489 
1490 /*
1491  * This is the interface to be called by fm_panic() in case FMA has diagnosed
1492  * a terminal machine check exception.  It does not free up memory allocated
1493  * for the backup kernel.  General disabling fastreboot_onpanic in a
1494  * non-panicking situation must go through fastboot_update_config().
1495  */
1496 void
1497 fastreboot_disable_highpil()
1498 {
1499 	fastreboot_onpanic = 0;
1500 }
1501 
1502 
1503 /*
1504  * A simplified interface for uadmin to call to update the configuration
1505  * setting and load a new kernel if necessary.
1506  */
1507 void
1508 fastboot_update_and_load(int fcn, char *mdep)
1509 {
1510 	if (fcn != AD_FASTREBOOT) {
1511 		/*
1512 		 * If user has explicitly requested reboot to prom,
1513 		 * or uadmin(1M) was invoked with other functions,
1514 		 * don't try to fast reboot after dumping.
1515 		 */
1516 		fastreboot_disable();
1517 	}
1518 
1519 	mutex_enter(&fastreboot_config_mutex);
1520 
1521 	if (fastreboot_onpanic)
1522 		fastboot_load_kernel(mdep);
1523 
1524 	mutex_exit(&fastreboot_config_mutex);
1525 }
1526