xref: /freebsd/stand/efi/loader/arch/amd64/elf64_freebsd.c (revision f75caed644a5c8c342a1ea5e7a6d5251f82ed0b1)
1ca987d46SWarner Losh /*-
2ca987d46SWarner Losh  * Copyright (c) 1998 Michael Smith <msmith@freebsd.org>
3ca987d46SWarner Losh  * Copyright (c) 2014 The FreeBSD Foundation
4ca987d46SWarner Losh  * All rights reserved.
5ca987d46SWarner Losh  *
6ca987d46SWarner Losh  * Redistribution and use in source and binary forms, with or without
7ca987d46SWarner Losh  * modification, are permitted provided that the following conditions
8ca987d46SWarner Losh  * are met:
9ca987d46SWarner Losh  * 1. Redistributions of source code must retain the above copyright
10ca987d46SWarner Losh  *    notice, this list of conditions and the following disclaimer.
11ca987d46SWarner Losh  * 2. Redistributions in binary form must reproduce the above copyright
12ca987d46SWarner Losh  *    notice, this list of conditions and the following disclaimer in the
13ca987d46SWarner Losh  *    documentation and/or other materials provided with the distribution.
14ca987d46SWarner Losh  *
15ca987d46SWarner Losh  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16ca987d46SWarner Losh  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17ca987d46SWarner Losh  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18ca987d46SWarner Losh  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19ca987d46SWarner Losh  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20ca987d46SWarner Losh  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21ca987d46SWarner Losh  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22ca987d46SWarner Losh  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23ca987d46SWarner Losh  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24ca987d46SWarner Losh  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25ca987d46SWarner Losh  * SUCH DAMAGE.
26ca987d46SWarner Losh  */
27ca987d46SWarner Losh 
28ca987d46SWarner Losh #include <sys/cdefs.h>
29ca987d46SWarner Losh __FBSDID("$FreeBSD$");
30ca987d46SWarner Losh 
31ca987d46SWarner Losh #define __ELF_WORD_SIZE 64
32ca987d46SWarner Losh #include <sys/param.h>
33ca987d46SWarner Losh #include <sys/exec.h>
34ca987d46SWarner Losh #include <sys/linker.h>
35ca987d46SWarner Losh #include <string.h>
36ca987d46SWarner Losh #include <machine/elf.h>
37ca987d46SWarner Losh #include <stand.h>
38ca987d46SWarner Losh #include <vm/vm.h>
39ca987d46SWarner Losh #include <vm/pmap.h>
40ca987d46SWarner Losh 
41ca987d46SWarner Losh #include <efi.h>
42ca987d46SWarner Losh #include <efilib.h>
43ca987d46SWarner Losh 
44ca987d46SWarner Losh #include "bootstrap.h"
45ca987d46SWarner Losh 
46ca987d46SWarner Losh #include "platform/acfreebsd.h"
47ca987d46SWarner Losh #include "acconfig.h"
48ca987d46SWarner Losh #define ACPI_SYSTEM_XFACE
49ca987d46SWarner Losh #include "actypes.h"
50ca987d46SWarner Losh #include "actbl.h"
51ca987d46SWarner Losh 
52ca987d46SWarner Losh #include "loader_efi.h"
53ca987d46SWarner Losh 
/*
 * Configuration-table GUIDs handed to efi_get_table() by elf64_exec() to
 * locate the ACPI RSDP.  The ACPI 2.0 GUID is looked up first and the
 * original ACPI GUID is only used when that lookup returns NULL.
 */
54ca987d46SWarner Losh static EFI_GUID acpi_guid = ACPI_TABLE_GUID;
55ca987d46SWarner Losh static EFI_GUID acpi20_guid = ACPI_20_TABLE_GUID;
56ca987d46SWarner Losh 
/*
 * Defined outside this file.  elf64_exec() calls it with exit_bs set to
 * true and passes the resulting *modulep and *kernendp on to the
 * trampoline; a non-zero return aborts the exec.
 */
57ed87efbeSRoger Pau Monné extern int bi_load(char *args, vm_offset_t *modulep, vm_offset_t *kernendp,
58ed87efbeSRoger Pau Monné     bool exit_bs);
59ca987d46SWarner Losh 
/*
 * Forward declarations of the exec hooks so they can be referenced from
 * the file_format descriptors before their definitions.
 */
60ca987d46SWarner Losh static int	elf64_exec(struct preloaded_file *amp);
61ca987d46SWarner Losh static int	elf64_obj_exec(struct preloaded_file *amp);
62ca987d46SWarner Losh 
/*
 * Format descriptors for this platform.  Each pairs a load routine with
 * the exec hook defined in this file: amd64_elf uses elf64_loadfile and
 * elf64_exec, amd64_elf_obj uses elf64_obj_loadfile and elf64_obj_exec
 * (which always returns EFTYPE).
 */
63ca987d46SWarner Losh static struct file_format amd64_elf = {
64ca987d46SWarner Losh 	.l_load = elf64_loadfile,
65ca987d46SWarner Losh 	.l_exec = elf64_exec,
66ca987d46SWarner Losh };
67ca987d46SWarner Losh static struct file_format amd64_elf_obj = {
68ca987d46SWarner Losh 	.l_load = elf64_obj_loadfile,
69ca987d46SWarner Losh 	.l_exec = elf64_obj_exec,
70ca987d46SWarner Losh };
71ca987d46SWarner Losh 
/* Multiboot2 format descriptors, defined in another translation unit. */
72adda2797SRoger Pau Monné extern struct file_format multiboot2;
73adda2797SRoger Pau Monné extern struct file_format multiboot2_obj;
74adda2797SRoger Pau Monné 
/*
 * NULL-terminated table of the file formats this loader knows about.
 * The multiboot2 entries are listed ahead of the native ELF ones.
 * NOTE(review): presumably consumers walk this table in order, so the
 * ordering matters -- confirm against the code that iterates it.
 */
75ca987d46SWarner Losh struct file_format *file_formats[] = {
76adda2797SRoger Pau Monné 	&multiboot2,
77adda2797SRoger Pau Monné 	&multiboot2_obj,
78ca987d46SWarner Losh 	&amd64_elf,
79ca987d46SWarner Losh 	&amd64_elf_obj,
80ca987d46SWarner Losh 	NULL
81ca987d46SWarner Losh };
82ca987d46SWarner Losh 
/*
 * Page tables built by elf64_exec() for the trampoline.  All of them are
 * carved out of one AllocatePages() region that starts at PT4.
 *
 * PT4, PT3 and PT2 are used when copy_staging is COPY_STAGING_ENABLE
 * (three pages in total).  Otherwise PT4 is followed by PT3_l/PT3_u and
 * PT2_l0..PT2_l3/PT2_u0..PT2_u1 (nine pages in total): the "_l" tables
 * hold the 1:1 mapping of the low 4G and the "_u" tables hold the kernel
 * mapping in the top 2G of the address space.
 */
83ca987d46SWarner Losh static pml4_entry_t *PT4;
84ca987d46SWarner Losh static pdp_entry_t *PT3;
85*f75caed6SKonstantin Belousov static pdp_entry_t *PT3_l, *PT3_u;
86ca987d46SWarner Losh static pd_entry_t *PT2;
87*f75caed6SKonstantin Belousov static pd_entry_t *PT2_l0, *PT2_l1, *PT2_l2, *PT2_l3, *PT2_u0, *PT2_u1;
88*f75caed6SKonstantin Belousov 
89*f75caed6SKonstantin Belousov extern EFI_PHYSICAL_ADDRESS staging;
90ca987d46SWarner Losh 
/*
 * Entry point of the trampoline.  elf64_exec() points this at the freshly
 * allocated page into which it has copied amd64_tramp, then calls it with
 * the trampoline stack, the copy-finish routine, kernend, modulep, the
 * top-level page table and the kernel entry address.
 */
91ca987d46SWarner Losh static void (*trampoline)(uint64_t stack, void *copy_finish, uint64_t kernend,
92ca987d46SWarner Losh     uint64_t modulep, pml4_entry_t *pagetable, uint64_t entry);
93ca987d46SWarner Losh 
/*
 * Trampoline code blob and its size in bytes, both defined outside this
 * file.  elf64_exec() copies amd64_tramp_size bytes starting at
 * &amd64_tramp into the trampoline page.
 */
94ca987d46SWarner Losh extern uintptr_t amd64_tramp;
95ca987d46SWarner Losh extern uint32_t amd64_tramp_size;
96ca987d46SWarner Losh 
97ca987d46SWarner Losh /*
98ca987d46SWarner Losh  * There is an ELF kernel and one or more ELF modules loaded.
99ca987d46SWarner Losh  * We wish to start executing the kernel image, so make such
100ca987d46SWarner Losh  * preparations as are required, and do so.
101ca987d46SWarner Losh  */
102ca987d46SWarner Losh static int
103ca987d46SWarner Losh elf64_exec(struct preloaded_file *fp)
104ca987d46SWarner Losh {
105ca987d46SWarner Losh 	struct file_metadata	*md;
106ca987d46SWarner Losh 	Elf_Ehdr 		*ehdr;
107ca987d46SWarner Losh 	vm_offset_t		modulep, kernend, trampcode, trampstack;
108ca987d46SWarner Losh 	int			err, i;
109ca987d46SWarner Losh 	ACPI_TABLE_RSDP		*rsdp;
110ca987d46SWarner Losh 	char			buf[24];
111ca987d46SWarner Losh 	int			revision;
112*f75caed6SKonstantin Belousov 	bool			copy_auto;
113*f75caed6SKonstantin Belousov 
114*f75caed6SKonstantin Belousov 	copy_auto = copy_staging == COPY_STAGING_AUTO;
115*f75caed6SKonstantin Belousov 	if (copy_auto)
116*f75caed6SKonstantin Belousov 		copy_staging = fp->f_kernphys_relocatable ?
117*f75caed6SKonstantin Belousov 		    COPY_STAGING_DISABLE : COPY_STAGING_ENABLE;
118ca987d46SWarner Losh 
119ca987d46SWarner Losh 	/*
120ca987d46SWarner Losh 	 * Report the RSDP to the kernel. While this can be found with
121ca987d46SWarner Losh 	 * a BIOS boot, the RSDP may be elsewhere when booted from UEFI.
122ca987d46SWarner Losh 	 * The old code used the 'hints' method to communite this to
123ca987d46SWarner Losh 	 * the kernel. However, while convenient, the 'hints' method
124ca987d46SWarner Losh 	 * is fragile and does not work when static hints are compiled
125ca987d46SWarner Losh 	 * into the kernel. Instead, move to setting different tunables
126ca987d46SWarner Losh 	 * that start with acpi. The old 'hints' can be removed before
127ca987d46SWarner Losh 	 * we branch for FreeBSD 12.
128ca987d46SWarner Losh 	 */
129ca987d46SWarner Losh 
130ca987d46SWarner Losh 	rsdp = efi_get_table(&acpi20_guid);
131ca987d46SWarner Losh 	if (rsdp == NULL) {
132ca987d46SWarner Losh 		rsdp = efi_get_table(&acpi_guid);
133ca987d46SWarner Losh 	}
134ca987d46SWarner Losh 	if (rsdp != NULL) {
135ca987d46SWarner Losh 		sprintf(buf, "0x%016llx", (unsigned long long)rsdp);
136ca987d46SWarner Losh 		setenv("hint.acpi.0.rsdp", buf, 1);
137ca987d46SWarner Losh 		setenv("acpi.rsdp", buf, 1);
138ca987d46SWarner Losh 		revision = rsdp->Revision;
139ca987d46SWarner Losh 		if (revision == 0)
140ca987d46SWarner Losh 			revision = 1;
141ca987d46SWarner Losh 		sprintf(buf, "%d", revision);
142ca987d46SWarner Losh 		setenv("hint.acpi.0.revision", buf, 1);
143ca987d46SWarner Losh 		setenv("acpi.revision", buf, 1);
144ca987d46SWarner Losh 		strncpy(buf, rsdp->OemId, sizeof(rsdp->OemId));
145ca987d46SWarner Losh 		buf[sizeof(rsdp->OemId)] = '\0';
146ca987d46SWarner Losh 		setenv("hint.acpi.0.oem", buf, 1);
147ca987d46SWarner Losh 		setenv("acpi.oem", buf, 1);
148ca987d46SWarner Losh 		sprintf(buf, "0x%016x", rsdp->RsdtPhysicalAddress);
149ca987d46SWarner Losh 		setenv("hint.acpi.0.rsdt", buf, 1);
150ca987d46SWarner Losh 		setenv("acpi.rsdt", buf, 1);
151ca987d46SWarner Losh 		if (revision >= 2) {
152ca987d46SWarner Losh 			/* XXX extended checksum? */
153ca987d46SWarner Losh 			sprintf(buf, "0x%016llx",
154ca987d46SWarner Losh 			    (unsigned long long)rsdp->XsdtPhysicalAddress);
155ca987d46SWarner Losh 			setenv("hint.acpi.0.xsdt", buf, 1);
156ca987d46SWarner Losh 			setenv("acpi.xsdt", buf, 1);
157ca987d46SWarner Losh 			sprintf(buf, "%d", rsdp->Length);
158ca987d46SWarner Losh 			setenv("hint.acpi.0.xsdt_length", buf, 1);
159ca987d46SWarner Losh 			setenv("acpi.xsdt_length", buf, 1);
160ca987d46SWarner Losh 		}
161ca987d46SWarner Losh 	}
162ca987d46SWarner Losh 
163ca987d46SWarner Losh 	if ((md = file_findmetadata(fp, MODINFOMD_ELFHDR)) == NULL)
164ca987d46SWarner Losh 		return (EFTYPE);
165ca987d46SWarner Losh 	ehdr = (Elf_Ehdr *)&(md->md_data);
166ca987d46SWarner Losh 
167*f75caed6SKonstantin Belousov 	trampcode = copy_staging == COPY_STAGING_ENABLE ?
168*f75caed6SKonstantin Belousov 	    (vm_offset_t)0x0000000040000000 /* 1G */ :
169*f75caed6SKonstantin Belousov 	    (vm_offset_t)0x0000000100000000; /* 4G */;
170ca987d46SWarner Losh 	err = BS->AllocatePages(AllocateMaxAddress, EfiLoaderData, 1,
171ca987d46SWarner Losh 	    (EFI_PHYSICAL_ADDRESS *)&trampcode);
172*f75caed6SKonstantin Belousov 	if (EFI_ERROR(err)) {
173*f75caed6SKonstantin Belousov 		printf("Unable to allocate trampoline\n");
174*f75caed6SKonstantin Belousov 		if (copy_auto)
175*f75caed6SKonstantin Belousov 			copy_staging = COPY_STAGING_AUTO;
176*f75caed6SKonstantin Belousov 		return (ENOMEM);
177*f75caed6SKonstantin Belousov 	}
178ca987d46SWarner Losh 	bzero((void *)trampcode, EFI_PAGE_SIZE);
179ca987d46SWarner Losh 	trampstack = trampcode + EFI_PAGE_SIZE - 8;
180ca987d46SWarner Losh 	bcopy((void *)&amd64_tramp, (void *)trampcode, amd64_tramp_size);
181ca987d46SWarner Losh 	trampoline = (void *)trampcode;
182ca987d46SWarner Losh 
183*f75caed6SKonstantin Belousov 	if (copy_staging == COPY_STAGING_ENABLE) {
184ca987d46SWarner Losh 		PT4 = (pml4_entry_t *)0x0000000040000000;
185ca987d46SWarner Losh 		err = BS->AllocatePages(AllocateMaxAddress, EfiLoaderData, 3,
186ca987d46SWarner Losh 		    (EFI_PHYSICAL_ADDRESS *)&PT4);
187*f75caed6SKonstantin Belousov 		if (EFI_ERROR(err)) {
188*f75caed6SKonstantin Belousov 			printf("Unable to allocate trampoline page table\n");
189*f75caed6SKonstantin Belousov 			BS->FreePages(trampcode, 1);
190*f75caed6SKonstantin Belousov 			if (copy_auto)
191*f75caed6SKonstantin Belousov 				copy_staging = COPY_STAGING_AUTO;
192*f75caed6SKonstantin Belousov 			return (ENOMEM);
193*f75caed6SKonstantin Belousov 		}
194ca987d46SWarner Losh 		bzero(PT4, 3 * EFI_PAGE_SIZE);
195ca987d46SWarner Losh 		PT3 = &PT4[512];
196ca987d46SWarner Losh 		PT2 = &PT3[512];
197ca987d46SWarner Losh 
198ca987d46SWarner Losh 		/*
199*f75caed6SKonstantin Belousov 		 * This is kinda brutal, but every single 1GB VM
200*f75caed6SKonstantin Belousov 		 * memory segment points to the same first 1GB of
201*f75caed6SKonstantin Belousov 		 * physical memory.  But it is more than adequate.
202ca987d46SWarner Losh 		 */
203*f75caed6SKonstantin Belousov 		for (i = 0; i < NPTEPG; i++) {
204*f75caed6SKonstantin Belousov 			/*
205*f75caed6SKonstantin Belousov 			 * Each slot of the L4 pages points to the
206*f75caed6SKonstantin Belousov 			 * same L3 page.
207*f75caed6SKonstantin Belousov 			 */
208ca987d46SWarner Losh 			PT4[i] = (pml4_entry_t)PT3;
2095c170925SMark Johnston 			PT4[i] |= PG_V | PG_RW;
210ca987d46SWarner Losh 
211*f75caed6SKonstantin Belousov 			/*
212*f75caed6SKonstantin Belousov 			 * Each slot of the L3 pages points to the
213*f75caed6SKonstantin Belousov 			 * same L2 page.
214*f75caed6SKonstantin Belousov 			 */
215ca987d46SWarner Losh 			PT3[i] = (pdp_entry_t)PT2;
2165c170925SMark Johnston 			PT3[i] |= PG_V | PG_RW;
217ca987d46SWarner Losh 
218*f75caed6SKonstantin Belousov 			/*
219*f75caed6SKonstantin Belousov 			 * The L2 page slots are mapped with 2MB pages for 1GB.
220*f75caed6SKonstantin Belousov 			 */
221*f75caed6SKonstantin Belousov 			PT2[i] = (pd_entry_t)i * (2 * 1024 * 1024);
2225c170925SMark Johnston 			PT2[i] |= PG_V | PG_RW | PG_PS;
223ca987d46SWarner Losh 		}
224*f75caed6SKonstantin Belousov 	} else {
225*f75caed6SKonstantin Belousov 		PT4 = (pml4_entry_t *)0x0000000100000000; /* 4G */
226*f75caed6SKonstantin Belousov 		err = BS->AllocatePages(AllocateMaxAddress, EfiLoaderData, 9,
227*f75caed6SKonstantin Belousov 		    (EFI_PHYSICAL_ADDRESS *)&PT4);
228*f75caed6SKonstantin Belousov 		if (EFI_ERROR(err)) {
229*f75caed6SKonstantin Belousov 			printf("Unable to allocate trampoline page table\n");
230*f75caed6SKonstantin Belousov 			BS->FreePages(trampcode, 9);
231*f75caed6SKonstantin Belousov 			if (copy_auto)
232*f75caed6SKonstantin Belousov 				copy_staging = COPY_STAGING_AUTO;
233*f75caed6SKonstantin Belousov 			return (ENOMEM);
234*f75caed6SKonstantin Belousov 		}
235ca987d46SWarner Losh 
236*f75caed6SKonstantin Belousov 		bzero(PT4, 9 * EFI_PAGE_SIZE);
237*f75caed6SKonstantin Belousov 
238*f75caed6SKonstantin Belousov 		PT3_l = &PT4[NPML4EPG * 1];
239*f75caed6SKonstantin Belousov 		PT3_u = &PT4[NPML4EPG * 2];
240*f75caed6SKonstantin Belousov 		PT2_l0 = &PT4[NPML4EPG * 3];
241*f75caed6SKonstantin Belousov 		PT2_l1 = &PT4[NPML4EPG * 4];
242*f75caed6SKonstantin Belousov 		PT2_l2 = &PT4[NPML4EPG * 5];
243*f75caed6SKonstantin Belousov 		PT2_l3 = &PT4[NPML4EPG * 6];
244*f75caed6SKonstantin Belousov 		PT2_u0 = &PT4[NPML4EPG * 7];
245*f75caed6SKonstantin Belousov 		PT2_u1 = &PT4[NPML4EPG * 8];
246*f75caed6SKonstantin Belousov 
247*f75caed6SKonstantin Belousov 		/* 1:1 mapping of lower 4G */
248*f75caed6SKonstantin Belousov 		PT4[0] = (pml4_entry_t)PT3_l | PG_V | PG_RW;
249*f75caed6SKonstantin Belousov 		PT3_l[0] = (pdp_entry_t)PT2_l0 | PG_V | PG_RW;
250*f75caed6SKonstantin Belousov 		PT3_l[1] = (pdp_entry_t)PT2_l1 | PG_V | PG_RW;
251*f75caed6SKonstantin Belousov 		PT3_l[2] = (pdp_entry_t)PT2_l2 | PG_V | PG_RW;
252*f75caed6SKonstantin Belousov 		PT3_l[3] = (pdp_entry_t)PT2_l3 | PG_V | PG_RW;
253*f75caed6SKonstantin Belousov 		for (i = 0; i < 4 * NPDEPG; i++) {
254*f75caed6SKonstantin Belousov 			PT2_l0[i] = ((pd_entry_t)i << PDRSHIFT) | PG_V |
255*f75caed6SKonstantin Belousov 			    PG_RW | PG_PS;
256*f75caed6SKonstantin Belousov 		}
257*f75caed6SKonstantin Belousov 
258*f75caed6SKonstantin Belousov 		/* mapping of kernel 2G below top */
259*f75caed6SKonstantin Belousov 		PT4[NPML4EPG - 1] = (pml4_entry_t)PT3_u | PG_V | PG_RW;
260*f75caed6SKonstantin Belousov 		PT3_u[NPDPEPG - 2] = (pdp_entry_t)PT2_u0 | PG_V | PG_RW;
261*f75caed6SKonstantin Belousov 		PT3_u[NPDPEPG - 1] = (pdp_entry_t)PT2_u1 | PG_V | PG_RW;
262*f75caed6SKonstantin Belousov 		/* compat mapping of phys @0 */
263*f75caed6SKonstantin Belousov 		PT2_u0[0] = PG_PS | PG_V | PG_RW;
264*f75caed6SKonstantin Belousov 		/* this maps past staging area */
265*f75caed6SKonstantin Belousov 		for (i = 1; i < 2 * NPDEPG; i++) {
266*f75caed6SKonstantin Belousov 			PT2_u0[i] = ((pd_entry_t)staging +
267*f75caed6SKonstantin Belousov 			    ((pd_entry_t)i - 1) * NBPDR) |
268*f75caed6SKonstantin Belousov 			    PG_V | PG_RW | PG_PS;
269*f75caed6SKonstantin Belousov 		}
270*f75caed6SKonstantin Belousov 	}
271*f75caed6SKonstantin Belousov 
272*f75caed6SKonstantin Belousov 	printf("staging %#lx (%scoping) tramp %p PT4 %p\n",
273*f75caed6SKonstantin Belousov 	    staging, copy_staging == COPY_STAGING_ENABLE ? "" : "not ",
274*f75caed6SKonstantin Belousov 	    trampoline, PT4);
275ca987d46SWarner Losh 	printf("Start @ 0x%lx ...\n", ehdr->e_entry);
276ca987d46SWarner Losh 
277ca987d46SWarner Losh 	efi_time_fini();
278ed87efbeSRoger Pau Monné 	err = bi_load(fp->f_args, &modulep, &kernend, true);
279ca987d46SWarner Losh 	if (err != 0) {
280ca987d46SWarner Losh 		efi_time_init();
281*f75caed6SKonstantin Belousov 		if (copy_auto)
282*f75caed6SKonstantin Belousov 			copy_staging = COPY_STAGING_AUTO;
283ca987d46SWarner Losh 		return (err);
284ca987d46SWarner Losh 	}
285ca987d46SWarner Losh 
286ca987d46SWarner Losh 	dev_cleanup();
287ca987d46SWarner Losh 
288*f75caed6SKonstantin Belousov 	trampoline(trampstack, copy_staging == COPY_STAGING_ENABLE ?
289*f75caed6SKonstantin Belousov 	    efi_copy_finish : efi_copy_finish_nop, kernend, modulep,
290*f75caed6SKonstantin Belousov 	    PT4, ehdr->e_entry);
291ca987d46SWarner Losh 
292ca987d46SWarner Losh 	panic("exec returned");
293ca987d46SWarner Losh }
294ca987d46SWarner Losh 
295ca987d46SWarner Losh static int
296ca987d46SWarner Losh elf64_obj_exec(struct preloaded_file *fp)
297ca987d46SWarner Losh {
298ca987d46SWarner Losh 
299ca987d46SWarner Losh 	return (EFTYPE);
300ca987d46SWarner Losh }
301