xref: /freebsd/sys/kern/link_elf.c (revision 1e66f787c838b5af7de716e266caf4e5d190d54b)
1 /*-
2  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3  *
4  * Copyright (c) 1998-2000 Doug Rabson
5  * All rights reserved.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice, this list of conditions and the following disclaimer.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26  * SUCH DAMAGE.
27  */
28 
29 #include <sys/cdefs.h>
30 __FBSDID("$FreeBSD$");
31 
32 #include "opt_ddb.h"
33 #include "opt_gdb.h"
34 
35 #include <sys/param.h>
36 #include <sys/systm.h>
37 #ifdef GPROF
38 #include <sys/gmon.h>
39 #endif
40 #include <sys/kernel.h>
41 #include <sys/lock.h>
42 #include <sys/malloc.h>
43 #include <sys/mutex.h>
44 #include <sys/mount.h>
45 #include <sys/pcpu.h>
46 #include <sys/proc.h>
47 #include <sys/namei.h>
48 #include <sys/fcntl.h>
49 #include <sys/vnode.h>
50 #include <sys/linker.h>
51 
52 #include <machine/elf.h>
53 
54 #include <net/vnet.h>
55 
56 #include <security/mac/mac_framework.h>
57 
58 #include <vm/vm.h>
59 #include <vm/vm_param.h>
60 #ifdef SPARSE_MAPPING
61 #include <vm/vm_object.h>
62 #include <vm/vm_kern.h>
63 #include <vm/vm_extern.h>
64 #endif
65 #include <vm/pmap.h>
66 #include <vm/vm_map.h>
67 
68 #include <sys/link_elf.h>
69 
70 #ifdef DDB_CTF
71 #include <sys/zlib.h>
72 #endif
73 
74 #include "linker_if.h"
75 
76 #define MAXSEGS 4
77 
78 typedef struct elf_file {
79 	struct linker_file lf;		/* Common fields */
80 	int		preloaded;	/* Was file pre-loaded */
81 	caddr_t		address;	/* Relocation address */
82 #ifdef SPARSE_MAPPING
83 	vm_object_t	object;		/* VM object to hold file pages */
84 #endif
85 	Elf_Dyn		*dynamic;	/* Symbol table etc. */
86 	Elf_Hashelt	nbuckets;	/* DT_HASH info */
87 	Elf_Hashelt	nchains;
88 	const Elf_Hashelt *buckets;
89 	const Elf_Hashelt *chains;
90 	caddr_t		hash;
91 	caddr_t		strtab;		/* DT_STRTAB */
92 	int		strsz;		/* DT_STRSZ */
93 	const Elf_Sym	*symtab;		/* DT_SYMTAB */
94 	Elf_Addr	*got;		/* DT_PLTGOT */
95 	const Elf_Rel	*pltrel;	/* DT_JMPREL */
96 	int		pltrelsize;	/* DT_PLTRELSZ */
97 	const Elf_Rela	*pltrela;	/* DT_JMPREL */
98 	int		pltrelasize;	/* DT_PLTRELSZ */
99 	const Elf_Rel	*rel;		/* DT_REL */
100 	int		relsize;	/* DT_RELSZ */
101 	const Elf_Rela	*rela;		/* DT_RELA */
102 	int		relasize;	/* DT_RELASZ */
103 	caddr_t		modptr;
104 	const Elf_Sym	*ddbsymtab;	/* The symbol table we are using */
105 	long		ddbsymcnt;	/* Number of symbols */
106 	caddr_t		ddbstrtab;	/* String table */
107 	long		ddbstrcnt;	/* number of bytes in string table */
108 	caddr_t		symbase;	/* malloc'ed symbold base */
109 	caddr_t		strbase;	/* malloc'ed string base */
110 	caddr_t		ctftab;		/* CTF table */
111 	long		ctfcnt;		/* number of bytes in CTF table */
112 	caddr_t		ctfoff;		/* CTF offset table */
113 	caddr_t		typoff;		/* Type offset table */
114 	long		typlen;		/* Number of type entries. */
115 	Elf_Addr	pcpu_start;	/* Pre-relocation pcpu set start. */
116 	Elf_Addr	pcpu_stop;	/* Pre-relocation pcpu set stop. */
117 	Elf_Addr	pcpu_base;	/* Relocated pcpu set address. */
118 #ifdef VIMAGE
119 	Elf_Addr	vnet_start;	/* Pre-relocation vnet set start. */
120 	Elf_Addr	vnet_stop;	/* Pre-relocation vnet set stop. */
121 	Elf_Addr	vnet_base;	/* Relocated vnet set address. */
122 #endif
123 #ifdef GDB
124 	struct link_map	gdb;		/* hooks for gdb */
125 #endif
126 } *elf_file_t;
127 
128 struct elf_set {
129 	Elf_Addr	es_start;
130 	Elf_Addr	es_stop;
131 	Elf_Addr	es_base;
132 	TAILQ_ENTRY(elf_set)	es_link;
133 };
134 
135 TAILQ_HEAD(elf_set_head, elf_set);
136 
137 #include <kern/kern_ctf.c>
138 
139 static int	link_elf_link_common_finish(linker_file_t);
140 static int	link_elf_link_preload(linker_class_t cls,
141 				      const char *, linker_file_t *);
142 static int	link_elf_link_preload_finish(linker_file_t);
143 static int	link_elf_load_file(linker_class_t, const char *,
144 		    linker_file_t *);
145 static int	link_elf_lookup_symbol(linker_file_t, const char *,
146 		    c_linker_sym_t *);
147 static int	link_elf_symbol_values(linker_file_t, c_linker_sym_t,
148 		    linker_symval_t *);
149 static int	link_elf_search_symbol(linker_file_t, caddr_t,
150 		    c_linker_sym_t *, long *);
151 
152 static void	link_elf_unload_file(linker_file_t);
153 static void	link_elf_unload_preload(linker_file_t);
154 static int	link_elf_lookup_set(linker_file_t, const char *,
155 		    void ***, void ***, int *);
156 static int	link_elf_each_function_name(linker_file_t,
157 		    int (*)(const char *, void *), void *);
158 static int	link_elf_each_function_nameval(linker_file_t,
159 		    linker_function_nameval_callback_t, void *);
160 static void	link_elf_reloc_local(linker_file_t);
161 static long	link_elf_symtab_get(linker_file_t, const Elf_Sym **);
162 static long	link_elf_strtab_get(linker_file_t, caddr_t *);
163 static int	elf_lookup(linker_file_t, Elf_Size, int, Elf_Addr *);
164 
165 static kobj_method_t link_elf_methods[] = {
166 	KOBJMETHOD(linker_lookup_symbol,	link_elf_lookup_symbol),
167 	KOBJMETHOD(linker_symbol_values,	link_elf_symbol_values),
168 	KOBJMETHOD(linker_search_symbol,	link_elf_search_symbol),
169 	KOBJMETHOD(linker_unload,		link_elf_unload_file),
170 	KOBJMETHOD(linker_load_file,		link_elf_load_file),
171 	KOBJMETHOD(linker_link_preload,		link_elf_link_preload),
172 	KOBJMETHOD(linker_link_preload_finish,	link_elf_link_preload_finish),
173 	KOBJMETHOD(linker_lookup_set,		link_elf_lookup_set),
174 	KOBJMETHOD(linker_each_function_name,	link_elf_each_function_name),
175 	KOBJMETHOD(linker_each_function_nameval, link_elf_each_function_nameval),
176 	KOBJMETHOD(linker_ctf_get,		link_elf_ctf_get),
177 	KOBJMETHOD(linker_symtab_get,		link_elf_symtab_get),
178 	KOBJMETHOD(linker_strtab_get,		link_elf_strtab_get),
179 	{ 0, 0 }
180 };
181 
182 static struct linker_class link_elf_class = {
183 #if ELF_TARG_CLASS == ELFCLASS32
184 	"elf32",
185 #else
186 	"elf64",
187 #endif
188 	link_elf_methods, sizeof(struct elf_file)
189 };
190 
191 static int	parse_dynamic(elf_file_t);
192 static int	relocate_file(elf_file_t);
193 static int	link_elf_preload_parse_symbols(elf_file_t);
194 
195 static struct elf_set_head set_pcpu_list;
196 #ifdef VIMAGE
197 static struct elf_set_head set_vnet_list;
198 #endif
199 
200 static void
201 elf_set_add(struct elf_set_head *list, Elf_Addr start, Elf_Addr stop, Elf_Addr base)
202 {
203 	struct elf_set *set, *iter;
204 
205 	set = malloc(sizeof(*set), M_LINKER, M_WAITOK);
206 	set->es_start = start;
207 	set->es_stop = stop;
208 	set->es_base = base;
209 
210 	TAILQ_FOREACH(iter, list, es_link) {
211 
212 		KASSERT((set->es_start < iter->es_start && set->es_stop < iter->es_stop) ||
213 		    (set->es_start > iter->es_start && set->es_stop > iter->es_stop),
214 		    ("linker sets intersection: to insert: 0x%jx-0x%jx; inserted: 0x%jx-0x%jx",
215 		    (uintmax_t)set->es_start, (uintmax_t)set->es_stop,
216 		    (uintmax_t)iter->es_start, (uintmax_t)iter->es_stop));
217 
218 		if (iter->es_start > set->es_start) {
219 			TAILQ_INSERT_BEFORE(iter, set, es_link);
220 			break;
221 		}
222 	}
223 
224 	if (iter == NULL)
225 		TAILQ_INSERT_TAIL(list, set, es_link);
226 }
227 
228 static int
229 elf_set_find(struct elf_set_head *list, Elf_Addr addr, Elf_Addr *start, Elf_Addr *base)
230 {
231 	struct elf_set *set;
232 
233 	TAILQ_FOREACH(set, list, es_link) {
234 		if (addr < set->es_start)
235 			return (0);
236 		if (addr < set->es_stop) {
237 			*start = set->es_start;
238 			*base = set->es_base;
239 			return (1);
240 		}
241 	}
242 
243 	return (0);
244 }
245 
246 static void
247 elf_set_delete(struct elf_set_head *list, Elf_Addr start)
248 {
249 	struct elf_set *set;
250 
251 	TAILQ_FOREACH(set, list, es_link) {
252 		if (start < set->es_start)
253 			break;
254 		if (start == set->es_start) {
255 			TAILQ_REMOVE(list, set, es_link);
256 			free(set, M_LINKER);
257 			return;
258 		}
259 	}
260 	KASSERT(0, ("deleting unknown linker set (start = 0x%jx)",
261 	    (uintmax_t)start));
262 }
263 
264 #ifdef GDB
265 static void	r_debug_state(struct r_debug *, struct link_map *);
266 
267 /*
268  * A list of loaded modules for GDB to use for loading symbols.
269  */
270 struct r_debug r_debug;
271 
272 #define GDB_STATE(s) do {				\
273 	r_debug.r_state = s; r_debug_state(NULL, NULL);	\
274 } while (0)
275 
276 /*
277  * Function for the debugger to set a breakpoint on to gain control.
278  */
279 static void
280 r_debug_state(struct r_debug *dummy_one __unused,
281 	      struct link_map *dummy_two __unused)
282 {
283 }
284 
285 static void
286 link_elf_add_gdb(struct link_map *l)
287 {
288 	struct link_map *prev;
289 
290 	l->l_next = NULL;
291 
292 	if (r_debug.r_map == NULL) {
293 		/* Add first. */
294 		l->l_prev = NULL;
295 		r_debug.r_map = l;
296 	} else {
297 		/* Append to list. */
298 		for (prev = r_debug.r_map;
299 		    prev->l_next != NULL;
300 		    prev = prev->l_next)
301 			;
302 		l->l_prev = prev;
303 		prev->l_next = l;
304 	}
305 }
306 
307 static void
308 link_elf_delete_gdb(struct link_map *l)
309 {
310 	if (l->l_prev == NULL) {
311 		/* Remove first. */
312 		if ((r_debug.r_map = l->l_next) != NULL)
313 			l->l_next->l_prev = NULL;
314 	} else {
315 		/* Remove any but first. */
316 		if ((l->l_prev->l_next = l->l_next) != NULL)
317 			l->l_next->l_prev = l->l_prev;
318 	}
319 }
320 #endif /* GDB */
321 
/*
 * The kernel symbol table starts here.  link_elf_init() takes the address
 * of this symbol as the kernel's own dynamic section.
 */
extern struct _dynamic _DYNAMIC;
326 
/*
 * Print a "kldload:" diagnostic carrying message "s".  The file name is
 * included in the output only when "filename" is not NULL.
 */
static void
link_elf_error(const char *filename, const char *s)
{
	if (filename != NULL)
		printf("kldload: %s: %s\n", filename, s);
	else
		printf("kldload: %s\n", s);
}
335 
336 static void
337 link_elf_invoke_ctors(caddr_t addr, size_t size)
338 {
339 	void (**ctor)(void);
340 	size_t i, cnt;
341 
342 	if (addr == NULL || size == 0)
343 		return;
344 	cnt = size / sizeof(*ctor);
345 	ctor = (void *)addr;
346 	for (i = 0; i < cnt; i++) {
347 		if (ctor[i] != NULL)
348 			(*ctor[i])();
349 	}
350 }
351 
352 /*
353  * Actions performed after linking/loading both the preloaded kernel and any
354  * modules; whether preloaded or dynamicly loaded.
355  */
356 static int
357 link_elf_link_common_finish(linker_file_t lf)
358 {
359 #ifdef GDB
360 	elf_file_t ef = (elf_file_t)lf;
361 	char *newfilename;
362 #endif
363 	int error;
364 
365 	/* Notify MD code that a module is being loaded. */
366 	error = elf_cpu_load_file(lf);
367 	if (error != 0)
368 		return (error);
369 
370 #ifdef GDB
371 	GDB_STATE(RT_ADD);
372 	ef->gdb.l_addr = lf->address;
373 	newfilename = malloc(strlen(lf->filename) + 1, M_LINKER, M_WAITOK);
374 	strcpy(newfilename, lf->filename);
375 	ef->gdb.l_name = newfilename;
376 	ef->gdb.l_ld = ef->dynamic;
377 	link_elf_add_gdb(&ef->gdb);
378 	GDB_STATE(RT_CONSISTENT);
379 #endif
380 
381 	/* Invoke .ctors */
382 	link_elf_invoke_ctors(lf->ctors_addr, lf->ctors_size);
383 	return (0);
384 }
385 
386 extern vm_offset_t __startkernel;
387 
388 static void
389 link_elf_init(void* arg)
390 {
391 	Elf_Dyn *dp;
392 	Elf_Addr *ctors_addrp;
393 	Elf_Size *ctors_sizep;
394 	caddr_t modptr, baseptr, sizeptr;
395 	elf_file_t ef;
396 	char *modname;
397 
398 	linker_add_class(&link_elf_class);
399 
400 	dp = (Elf_Dyn *)&_DYNAMIC;
401 	modname = NULL;
402 	modptr = preload_search_by_type("elf" __XSTRING(__ELF_WORD_SIZE) " kernel");
403 	if (modptr == NULL)
404 		modptr = preload_search_by_type("elf kernel");
405 	modname = (char *)preload_search_info(modptr, MODINFO_NAME);
406 	if (modname == NULL)
407 		modname = "kernel";
408 	linker_kernel_file = linker_make_file(modname, &link_elf_class);
409 	if (linker_kernel_file == NULL)
410 		panic("%s: Can't create linker structures for kernel",
411 		    __func__);
412 
413 	ef = (elf_file_t) linker_kernel_file;
414 	ef->preloaded = 1;
415 #ifdef __powerpc__
416 	ef->address = (caddr_t) (__startkernel - KERNBASE);
417 #else
418 	ef->address = 0;
419 #endif
420 #ifdef SPARSE_MAPPING
421 	ef->object = 0;
422 #endif
423 	ef->dynamic = dp;
424 
425 	if (dp != NULL)
426 		parse_dynamic(ef);
427 	linker_kernel_file->address += KERNBASE;
428 	linker_kernel_file->size = -(intptr_t)linker_kernel_file->address;
429 
430 	if (modptr != NULL) {
431 		ef->modptr = modptr;
432 		baseptr = preload_search_info(modptr, MODINFO_ADDR);
433 		if (baseptr != NULL)
434 			linker_kernel_file->address = *(caddr_t *)baseptr;
435 		sizeptr = preload_search_info(modptr, MODINFO_SIZE);
436 		if (sizeptr != NULL)
437 			linker_kernel_file->size = *(size_t *)sizeptr;
438 		ctors_addrp = (Elf_Addr *)preload_search_info(modptr,
439 			MODINFO_METADATA | MODINFOMD_CTORS_ADDR);
440 		ctors_sizep = (Elf_Size *)preload_search_info(modptr,
441 			MODINFO_METADATA | MODINFOMD_CTORS_SIZE);
442 		if (ctors_addrp != NULL && ctors_sizep != NULL) {
443 			linker_kernel_file->ctors_addr = ef->address +
444 			    *ctors_addrp;
445 			linker_kernel_file->ctors_size = *ctors_sizep;
446 		}
447 	}
448 	(void)link_elf_preload_parse_symbols(ef);
449 
450 #ifdef GDB
451 	r_debug.r_map = NULL;
452 	r_debug.r_brk = r_debug_state;
453 	r_debug.r_state = RT_CONSISTENT;
454 #endif
455 
456 	(void)link_elf_link_common_finish(linker_kernel_file);
457 	linker_kernel_file->flags |= LINKER_FILE_LINKED;
458 	TAILQ_INIT(&set_pcpu_list);
459 #ifdef VIMAGE
460 	TAILQ_INIT(&set_vnet_list);
461 #endif
462 }
463 
464 SYSINIT(link_elf, SI_SUB_KLD, SI_ORDER_THIRD, link_elf_init, 0);
465 
466 static int
467 link_elf_preload_parse_symbols(elf_file_t ef)
468 {
469 	caddr_t pointer;
470 	caddr_t ssym, esym, base;
471 	caddr_t strtab;
472 	int strcnt;
473 	Elf_Sym *symtab;
474 	int symcnt;
475 
476 	if (ef->modptr == NULL)
477 		return (0);
478 	pointer = preload_search_info(ef->modptr,
479 	    MODINFO_METADATA | MODINFOMD_SSYM);
480 	if (pointer == NULL)
481 		return (0);
482 	ssym = *(caddr_t *)pointer;
483 	pointer = preload_search_info(ef->modptr,
484 	    MODINFO_METADATA | MODINFOMD_ESYM);
485 	if (pointer == NULL)
486 		return (0);
487 	esym = *(caddr_t *)pointer;
488 
489 	base = ssym;
490 
491 	symcnt = *(long *)base;
492 	base += sizeof(long);
493 	symtab = (Elf_Sym *)base;
494 	base += roundup(symcnt, sizeof(long));
495 
496 	if (base > esym || base < ssym) {
497 		printf("Symbols are corrupt!\n");
498 		return (EINVAL);
499 	}
500 
501 	strcnt = *(long *)base;
502 	base += sizeof(long);
503 	strtab = base;
504 	base += roundup(strcnt, sizeof(long));
505 
506 	if (base > esym || base < ssym) {
507 		printf("Symbols are corrupt!\n");
508 		return (EINVAL);
509 	}
510 
511 	ef->ddbsymtab = symtab;
512 	ef->ddbsymcnt = symcnt / sizeof(Elf_Sym);
513 	ef->ddbstrtab = strtab;
514 	ef->ddbstrcnt = strcnt;
515 
516 	return (0);
517 }
518 
519 static int
520 parse_dynamic(elf_file_t ef)
521 {
522 	Elf_Dyn *dp;
523 	int plttype = DT_REL;
524 
525 	for (dp = ef->dynamic; dp->d_tag != DT_NULL; dp++) {
526 		switch (dp->d_tag) {
527 		case DT_HASH:
528 		{
529 			/* From src/libexec/rtld-elf/rtld.c */
530 			const Elf_Hashelt *hashtab = (const Elf_Hashelt *)
531 			    (ef->address + dp->d_un.d_ptr);
532 			ef->nbuckets = hashtab[0];
533 			ef->nchains = hashtab[1];
534 			ef->buckets = hashtab + 2;
535 			ef->chains = ef->buckets + ef->nbuckets;
536 			break;
537 		}
538 		case DT_STRTAB:
539 			ef->strtab = (caddr_t) (ef->address + dp->d_un.d_ptr);
540 			break;
541 		case DT_STRSZ:
542 			ef->strsz = dp->d_un.d_val;
543 			break;
544 		case DT_SYMTAB:
545 			ef->symtab = (Elf_Sym*) (ef->address + dp->d_un.d_ptr);
546 			break;
547 		case DT_SYMENT:
548 			if (dp->d_un.d_val != sizeof(Elf_Sym))
549 				return (ENOEXEC);
550 			break;
551 		case DT_PLTGOT:
552 			ef->got = (Elf_Addr *) (ef->address + dp->d_un.d_ptr);
553 			break;
554 		case DT_REL:
555 			ef->rel = (const Elf_Rel *) (ef->address + dp->d_un.d_ptr);
556 			break;
557 		case DT_RELSZ:
558 			ef->relsize = dp->d_un.d_val;
559 			break;
560 		case DT_RELENT:
561 			if (dp->d_un.d_val != sizeof(Elf_Rel))
562 				return (ENOEXEC);
563 			break;
564 		case DT_JMPREL:
565 			ef->pltrel = (const Elf_Rel *) (ef->address + dp->d_un.d_ptr);
566 			break;
567 		case DT_PLTRELSZ:
568 			ef->pltrelsize = dp->d_un.d_val;
569 			break;
570 		case DT_RELA:
571 			ef->rela = (const Elf_Rela *) (ef->address + dp->d_un.d_ptr);
572 			break;
573 		case DT_RELASZ:
574 			ef->relasize = dp->d_un.d_val;
575 			break;
576 		case DT_RELAENT:
577 			if (dp->d_un.d_val != sizeof(Elf_Rela))
578 				return (ENOEXEC);
579 			break;
580 		case DT_PLTREL:
581 			plttype = dp->d_un.d_val;
582 			if (plttype != DT_REL && plttype != DT_RELA)
583 				return (ENOEXEC);
584 			break;
585 #ifdef GDB
586 		case DT_DEBUG:
587 			dp->d_un.d_ptr = (Elf_Addr)&r_debug;
588 			break;
589 #endif
590 		}
591 	}
592 
593 	if (plttype == DT_RELA) {
594 		ef->pltrela = (const Elf_Rela *)ef->pltrel;
595 		ef->pltrel = NULL;
596 		ef->pltrelasize = ef->pltrelsize;
597 		ef->pltrelsize = 0;
598 	}
599 
600 	ef->ddbsymtab = ef->symtab;
601 	ef->ddbsymcnt = ef->nchains;
602 	ef->ddbstrtab = ef->strtab;
603 	ef->ddbstrcnt = ef->strsz;
604 
605 	return (0);
606 }
607 
608 static int
609 parse_dpcpu(elf_file_t ef)
610 {
611 	int count;
612 	int error;
613 
614 	ef->pcpu_start = 0;
615 	ef->pcpu_stop = 0;
616 	error = link_elf_lookup_set(&ef->lf, "pcpu", (void ***)&ef->pcpu_start,
617 	    (void ***)&ef->pcpu_stop, &count);
618 	/* Error just means there is no pcpu set to relocate. */
619 	if (error != 0)
620 		return (0);
621 	count *= sizeof(void *);
622 	/*
623 	 * Allocate space in the primary pcpu area.  Copy in our
624 	 * initialization from the data section and then initialize
625 	 * all per-cpu storage from that.
626 	 */
627 	ef->pcpu_base = (Elf_Addr)(uintptr_t)dpcpu_alloc(count);
628 	if (ef->pcpu_base == 0)
629 		return (ENOSPC);
630 	memcpy((void *)ef->pcpu_base, (void *)ef->pcpu_start, count);
631 	dpcpu_copy((void *)ef->pcpu_base, count);
632 	elf_set_add(&set_pcpu_list, ef->pcpu_start, ef->pcpu_stop,
633 	    ef->pcpu_base);
634 
635 	return (0);
636 }
637 
638 #ifdef VIMAGE
639 static int
640 parse_vnet(elf_file_t ef)
641 {
642 	int count;
643 	int error;
644 
645 	ef->vnet_start = 0;
646 	ef->vnet_stop = 0;
647 	error = link_elf_lookup_set(&ef->lf, "vnet", (void ***)&ef->vnet_start,
648 	    (void ***)&ef->vnet_stop, &count);
649 	/* Error just means there is no vnet data set to relocate. */
650 	if (error != 0)
651 		return (0);
652 	count *= sizeof(void *);
653 	/*
654 	 * Allocate space in the primary vnet area.  Copy in our
655 	 * initialization from the data section and then initialize
656 	 * all per-vnet storage from that.
657 	 */
658 	ef->vnet_base = (Elf_Addr)(uintptr_t)vnet_data_alloc(count);
659 	if (ef->vnet_base == 0)
660 		return (ENOSPC);
661 	memcpy((void *)ef->vnet_base, (void *)ef->vnet_start, count);
662 	vnet_data_copy((void *)ef->vnet_base, count);
663 	elf_set_add(&set_vnet_list, ef->vnet_start, ef->vnet_stop,
664 	    ef->vnet_base);
665 
666 	return (0);
667 }
668 #endif
669 
670 static int
671 link_elf_link_preload(linker_class_t cls,
672     const char* filename, linker_file_t *result)
673 {
674 	Elf_Addr *ctors_addrp;
675 	Elf_Size *ctors_sizep;
676 	caddr_t modptr, baseptr, sizeptr, dynptr;
677 	char *type;
678 	elf_file_t ef;
679 	linker_file_t lf;
680 	int error;
681 	vm_offset_t dp;
682 
683 	/* Look to see if we have the file preloaded */
684 	modptr = preload_search_by_name(filename);
685 	if (modptr == NULL)
686 		return (ENOENT);
687 
688 	type = (char *)preload_search_info(modptr, MODINFO_TYPE);
689 	baseptr = preload_search_info(modptr, MODINFO_ADDR);
690 	sizeptr = preload_search_info(modptr, MODINFO_SIZE);
691 	dynptr = preload_search_info(modptr,
692 	    MODINFO_METADATA | MODINFOMD_DYNAMIC);
693 	if (type == NULL ||
694 	    (strcmp(type, "elf" __XSTRING(__ELF_WORD_SIZE) " module") != 0 &&
695 	     strcmp(type, "elf module") != 0))
696 		return (EFTYPE);
697 	if (baseptr == NULL || sizeptr == NULL || dynptr == NULL)
698 		return (EINVAL);
699 
700 	lf = linker_make_file(filename, &link_elf_class);
701 	if (lf == NULL)
702 		return (ENOMEM);
703 
704 	ef = (elf_file_t) lf;
705 	ef->preloaded = 1;
706 	ef->modptr = modptr;
707 	ef->address = *(caddr_t *)baseptr;
708 #ifdef SPARSE_MAPPING
709 	ef->object = 0;
710 #endif
711 	dp = (vm_offset_t)ef->address + *(vm_offset_t *)dynptr;
712 	ef->dynamic = (Elf_Dyn *)dp;
713 	lf->address = ef->address;
714 	lf->size = *(size_t *)sizeptr;
715 
716 	ctors_addrp = (Elf_Addr *)preload_search_info(modptr,
717 	    MODINFO_METADATA | MODINFOMD_CTORS_ADDR);
718 	ctors_sizep = (Elf_Size *)preload_search_info(modptr,
719 	    MODINFO_METADATA | MODINFOMD_CTORS_SIZE);
720 	if (ctors_addrp != NULL && ctors_sizep != NULL) {
721 		lf->ctors_addr = ef->address + *ctors_addrp;
722 		lf->ctors_size = *ctors_sizep;
723 	}
724 
725 	error = parse_dynamic(ef);
726 	if (error == 0)
727 		error = parse_dpcpu(ef);
728 #ifdef VIMAGE
729 	if (error == 0)
730 		error = parse_vnet(ef);
731 #endif
732 	if (error != 0) {
733 		linker_file_unload(lf, LINKER_UNLOAD_FORCE);
734 		return (error);
735 	}
736 	link_elf_reloc_local(lf);
737 	*result = lf;
738 	return (0);
739 }
740 
741 static int
742 link_elf_link_preload_finish(linker_file_t lf)
743 {
744 	elf_file_t ef;
745 	int error;
746 
747 	ef = (elf_file_t) lf;
748 	error = relocate_file(ef);
749 	if (error != 0)
750 		return (error);
751 	(void)link_elf_preload_parse_symbols(ef);
752 
753 	return (link_elf_link_common_finish(lf));
754 }
755 
756 static int
757 link_elf_load_file(linker_class_t cls, const char* filename,
758     linker_file_t* result)
759 {
760 	struct nameidata nd;
761 	struct thread* td = curthread;	/* XXX */
762 	Elf_Ehdr *hdr;
763 	caddr_t firstpage;
764 	int nbytes, i;
765 	Elf_Phdr *phdr;
766 	Elf_Phdr *phlimit;
767 	Elf_Phdr *segs[MAXSEGS];
768 	int nsegs;
769 	Elf_Phdr *phdyn;
770 	caddr_t mapbase;
771 	size_t mapsize;
772 	Elf_Addr base_vaddr;
773 	Elf_Addr base_vlimit;
774 	int error = 0;
775 	ssize_t resid;
776 	int flags;
777 	elf_file_t ef;
778 	linker_file_t lf;
779 	Elf_Shdr *shdr;
780 	int symtabindex;
781 	int symstrindex;
782 	int shstrindex;
783 	int symcnt;
784 	int strcnt;
785 	char *shstrs;
786 
787 	shdr = NULL;
788 	lf = NULL;
789 	shstrs = NULL;
790 
791 	NDINIT(&nd, LOOKUP, FOLLOW, UIO_SYSSPACE, filename, td);
792 	flags = FREAD;
793 	error = vn_open(&nd, &flags, 0, NULL);
794 	if (error != 0)
795 		return (error);
796 	NDFREE(&nd, NDF_ONLY_PNBUF);
797 	if (nd.ni_vp->v_type != VREG) {
798 		error = ENOEXEC;
799 		firstpage = NULL;
800 		goto out;
801 	}
802 #ifdef MAC
803 	error = mac_kld_check_load(curthread->td_ucred, nd.ni_vp);
804 	if (error != 0) {
805 		firstpage = NULL;
806 		goto out;
807 	}
808 #endif
809 
810 	/*
811 	 * Read the elf header from the file.
812 	 */
813 	firstpage = malloc(PAGE_SIZE, M_LINKER, M_WAITOK);
814 	hdr = (Elf_Ehdr *)firstpage;
815 	error = vn_rdwr(UIO_READ, nd.ni_vp, firstpage, PAGE_SIZE, 0,
816 	    UIO_SYSSPACE, IO_NODELOCKED, td->td_ucred, NOCRED,
817 	    &resid, td);
818 	nbytes = PAGE_SIZE - resid;
819 	if (error != 0)
820 		goto out;
821 
822 	if (!IS_ELF(*hdr)) {
823 		error = ENOEXEC;
824 		goto out;
825 	}
826 
827 	if (hdr->e_ident[EI_CLASS] != ELF_TARG_CLASS ||
828 	    hdr->e_ident[EI_DATA] != ELF_TARG_DATA) {
829 		link_elf_error(filename, "Unsupported file layout");
830 		error = ENOEXEC;
831 		goto out;
832 	}
833 	if (hdr->e_ident[EI_VERSION] != EV_CURRENT ||
834 	    hdr->e_version != EV_CURRENT) {
835 		link_elf_error(filename, "Unsupported file version");
836 		error = ENOEXEC;
837 		goto out;
838 	}
839 	if (hdr->e_type != ET_EXEC && hdr->e_type != ET_DYN) {
840 		error = ENOSYS;
841 		goto out;
842 	}
843 	if (hdr->e_machine != ELF_TARG_MACH) {
844 		link_elf_error(filename, "Unsupported machine");
845 		error = ENOEXEC;
846 		goto out;
847 	}
848 
849 	/*
850 	 * We rely on the program header being in the first page.
851 	 * This is not strictly required by the ABI specification, but
852 	 * it seems to always true in practice.  And, it simplifies
853 	 * things considerably.
854 	 */
855 	if (!((hdr->e_phentsize == sizeof(Elf_Phdr)) &&
856 	      (hdr->e_phoff + hdr->e_phnum*sizeof(Elf_Phdr) <= PAGE_SIZE) &&
857 	      (hdr->e_phoff + hdr->e_phnum*sizeof(Elf_Phdr) <= nbytes)))
858 		link_elf_error(filename, "Unreadable program headers");
859 
860 	/*
861 	 * Scan the program header entries, and save key information.
862 	 *
863 	 * We rely on there being exactly two load segments, text and data,
864 	 * in that order.
865 	 */
866 	phdr = (Elf_Phdr *) (firstpage + hdr->e_phoff);
867 	phlimit = phdr + hdr->e_phnum;
868 	nsegs = 0;
869 	phdyn = NULL;
870 	while (phdr < phlimit) {
871 		switch (phdr->p_type) {
872 		case PT_LOAD:
873 			if (nsegs == MAXSEGS) {
874 				link_elf_error(filename, "Too many sections");
875 				error = ENOEXEC;
876 				goto out;
877 			}
878 			/*
879 			 * XXX: We just trust they come in right order ??
880 			 */
881 			segs[nsegs] = phdr;
882 			++nsegs;
883 			break;
884 
885 		case PT_DYNAMIC:
886 			phdyn = phdr;
887 			break;
888 
889 		case PT_INTERP:
890 			error = ENOSYS;
891 			goto out;
892 		}
893 
894 		++phdr;
895 	}
896 	if (phdyn == NULL) {
897 		link_elf_error(filename, "Object is not dynamically-linked");
898 		error = ENOEXEC;
899 		goto out;
900 	}
901 	if (nsegs == 0) {
902 		link_elf_error(filename, "No sections");
903 		error = ENOEXEC;
904 		goto out;
905 	}
906 
907 	/*
908 	 * Allocate the entire address space of the object, to stake
909 	 * out our contiguous region, and to establish the base
910 	 * address for relocation.
911 	 */
912 	base_vaddr = trunc_page(segs[0]->p_vaddr);
913 	base_vlimit = round_page(segs[nsegs - 1]->p_vaddr +
914 	    segs[nsegs - 1]->p_memsz);
915 	mapsize = base_vlimit - base_vaddr;
916 
917 	lf = linker_make_file(filename, &link_elf_class);
918 	if (lf == NULL) {
919 		error = ENOMEM;
920 		goto out;
921 	}
922 
923 	ef = (elf_file_t) lf;
924 #ifdef SPARSE_MAPPING
925 	ef->object = vm_object_allocate(OBJT_DEFAULT, mapsize >> PAGE_SHIFT);
926 	if (ef->object == NULL) {
927 		error = ENOMEM;
928 		goto out;
929 	}
930 	ef->address = (caddr_t) vm_map_min(kernel_map);
931 	error = vm_map_find(kernel_map, ef->object, 0,
932 	    (vm_offset_t *) &ef->address, mapsize, 0, VMFS_OPTIMAL_SPACE,
933 	    VM_PROT_ALL, VM_PROT_ALL, 0);
934 	if (error != 0) {
935 		vm_object_deallocate(ef->object);
936 		ef->object = 0;
937 		goto out;
938 	}
939 #else
940 	ef->address = malloc(mapsize, M_LINKER, M_WAITOK);
941 #endif
942 	mapbase = ef->address;
943 
944 	/*
945 	 * Read the text and data sections and zero the bss.
946 	 */
947 	for (i = 0; i < nsegs; i++) {
948 		caddr_t segbase = mapbase + segs[i]->p_vaddr - base_vaddr;
949 		error = vn_rdwr(UIO_READ, nd.ni_vp,
950 		    segbase, segs[i]->p_filesz, segs[i]->p_offset,
951 		    UIO_SYSSPACE, IO_NODELOCKED, td->td_ucred, NOCRED,
952 		    &resid, td);
953 		if (error != 0)
954 			goto out;
955 		bzero(segbase + segs[i]->p_filesz,
956 		    segs[i]->p_memsz - segs[i]->p_filesz);
957 
958 #ifdef SPARSE_MAPPING
959 		/*
960 		 * Wire down the pages
961 		 */
962 		error = vm_map_wire(kernel_map,
963 		    (vm_offset_t) segbase,
964 		    (vm_offset_t) segbase + segs[i]->p_memsz,
965 		    VM_MAP_WIRE_SYSTEM|VM_MAP_WIRE_NOHOLES);
966 		if (error != KERN_SUCCESS) {
967 			error = ENOMEM;
968 			goto out;
969 		}
970 #endif
971 	}
972 
973 #ifdef GPROF
974 	/* Update profiling information with the new text segment. */
975 	mtx_lock(&Giant);
976 	kmupetext((uintfptr_t)(mapbase + segs[0]->p_vaddr - base_vaddr +
977 	    segs[0]->p_memsz));
978 	mtx_unlock(&Giant);
979 #endif
980 
981 	ef->dynamic = (Elf_Dyn *) (mapbase + phdyn->p_vaddr - base_vaddr);
982 
983 	lf->address = ef->address;
984 	lf->size = mapsize;
985 
986 	error = parse_dynamic(ef);
987 	if (error != 0)
988 		goto out;
989 	error = parse_dpcpu(ef);
990 	if (error != 0)
991 		goto out;
992 #ifdef VIMAGE
993 	error = parse_vnet(ef);
994 	if (error != 0)
995 		goto out;
996 #endif
997 	link_elf_reloc_local(lf);
998 
999 	VOP_UNLOCK(nd.ni_vp, 0);
1000 	error = linker_load_dependencies(lf);
1001 	vn_lock(nd.ni_vp, LK_EXCLUSIVE | LK_RETRY);
1002 	if (error != 0)
1003 		goto out;
1004 	error = relocate_file(ef);
1005 	if (error != 0)
1006 		goto out;
1007 
1008 	/*
1009 	 * Try and load the symbol table if it's present.  (you can
1010 	 * strip it!)
1011 	 */
1012 	nbytes = hdr->e_shnum * hdr->e_shentsize;
1013 	if (nbytes == 0 || hdr->e_shoff == 0)
1014 		goto nosyms;
1015 	shdr = malloc(nbytes, M_LINKER, M_WAITOK | M_ZERO);
1016 	error = vn_rdwr(UIO_READ, nd.ni_vp,
1017 	    (caddr_t)shdr, nbytes, hdr->e_shoff,
1018 	    UIO_SYSSPACE, IO_NODELOCKED, td->td_ucred, NOCRED,
1019 	    &resid, td);
1020 	if (error != 0)
1021 		goto out;
1022 
1023 	/* Read section string table */
1024 	shstrindex = hdr->e_shstrndx;
1025 	if (shstrindex != 0 && shdr[shstrindex].sh_type == SHT_STRTAB &&
1026 	    shdr[shstrindex].sh_size != 0) {
1027 		nbytes = shdr[shstrindex].sh_size;
1028 		shstrs = malloc(nbytes, M_LINKER, M_WAITOK | M_ZERO);
1029 		error = vn_rdwr(UIO_READ, nd.ni_vp, (caddr_t)shstrs, nbytes,
1030 		    shdr[shstrindex].sh_offset, UIO_SYSSPACE, IO_NODELOCKED,
1031 		    td->td_ucred, NOCRED, &resid, td);
1032 		if (error)
1033 			goto out;
1034 	}
1035 
1036 	symtabindex = -1;
1037 	symstrindex = -1;
1038 	for (i = 0; i < hdr->e_shnum; i++) {
1039 		if (shdr[i].sh_type == SHT_SYMTAB) {
1040 			symtabindex = i;
1041 			symstrindex = shdr[i].sh_link;
1042 		} else if (shstrs != NULL && shdr[i].sh_name != 0 &&
1043 		    strcmp(shstrs + shdr[i].sh_name, ".ctors") == 0) {
1044 			/* Record relocated address and size of .ctors. */
1045 			lf->ctors_addr = mapbase + shdr[i].sh_addr - base_vaddr;
1046 			lf->ctors_size = shdr[i].sh_size;
1047 		}
1048 	}
1049 	if (symtabindex < 0 || symstrindex < 0)
1050 		goto nosyms;
1051 
1052 	symcnt = shdr[symtabindex].sh_size;
1053 	ef->symbase = malloc(symcnt, M_LINKER, M_WAITOK);
1054 	strcnt = shdr[symstrindex].sh_size;
1055 	ef->strbase = malloc(strcnt, M_LINKER, M_WAITOK);
1056 
1057 	error = vn_rdwr(UIO_READ, nd.ni_vp,
1058 	    ef->symbase, symcnt, shdr[symtabindex].sh_offset,
1059 	    UIO_SYSSPACE, IO_NODELOCKED, td->td_ucred, NOCRED,
1060 	    &resid, td);
1061 	if (error != 0)
1062 		goto out;
1063 	error = vn_rdwr(UIO_READ, nd.ni_vp,
1064 	    ef->strbase, strcnt, shdr[symstrindex].sh_offset,
1065 	    UIO_SYSSPACE, IO_NODELOCKED, td->td_ucred, NOCRED,
1066 	    &resid, td);
1067 	if (error != 0)
1068 		goto out;
1069 
1070 	ef->ddbsymcnt = symcnt / sizeof(Elf_Sym);
1071 	ef->ddbsymtab = (const Elf_Sym *)ef->symbase;
1072 	ef->ddbstrcnt = strcnt;
1073 	ef->ddbstrtab = ef->strbase;
1074 
1075 nosyms:
1076 	error = link_elf_link_common_finish(lf);
1077 	if (error != 0)
1078 		goto out;
1079 
1080 	*result = lf;
1081 
1082 out:
1083 	VOP_UNLOCK(nd.ni_vp, 0);
1084 	vn_close(nd.ni_vp, FREAD, td->td_ucred, td);
1085 	if (error != 0 && lf != NULL)
1086 		linker_file_unload(lf, LINKER_UNLOAD_FORCE);
1087 	free(shdr, M_LINKER);
1088 	free(firstpage, M_LINKER);
1089 	free(shstrs, M_LINKER);
1090 
1091 	return (error);
1092 }
1093 
1094 Elf_Addr
1095 elf_relocaddr(linker_file_t lf, Elf_Addr x)
1096 {
1097 	elf_file_t ef;
1098 
1099 	ef = (elf_file_t)lf;
1100 	if (x >= ef->pcpu_start && x < ef->pcpu_stop)
1101 		return ((x - ef->pcpu_start) + ef->pcpu_base);
1102 #ifdef VIMAGE
1103 	if (x >= ef->vnet_start && x < ef->vnet_stop)
1104 		return ((x - ef->vnet_start) + ef->vnet_base);
1105 #endif
1106 	return (x);
1107 }
1108 
1109 
1110 static void
1111 link_elf_unload_file(linker_file_t file)
1112 {
1113 	elf_file_t ef = (elf_file_t) file;
1114 
1115 	if (ef->pcpu_base != 0) {
1116 		dpcpu_free((void *)ef->pcpu_base,
1117 		    ef->pcpu_stop - ef->pcpu_start);
1118 		elf_set_delete(&set_pcpu_list, ef->pcpu_start);
1119 	}
1120 #ifdef VIMAGE
1121 	if (ef->vnet_base != 0) {
1122 		vnet_data_free((void *)ef->vnet_base,
1123 		    ef->vnet_stop - ef->vnet_start);
1124 		elf_set_delete(&set_vnet_list, ef->vnet_start);
1125 	}
1126 #endif
1127 #ifdef GDB
1128 	if (ef->gdb.l_ld != NULL) {
1129 		GDB_STATE(RT_DELETE);
1130 		free((void *)(uintptr_t)ef->gdb.l_name, M_LINKER);
1131 		link_elf_delete_gdb(&ef->gdb);
1132 		GDB_STATE(RT_CONSISTENT);
1133 	}
1134 #endif
1135 
1136 	/* Notify MD code that a module is being unloaded. */
1137 	elf_cpu_unload_file(file);
1138 
1139 	if (ef->preloaded) {
1140 		link_elf_unload_preload(file);
1141 		return;
1142 	}
1143 
1144 #ifdef SPARSE_MAPPING
1145 	if (ef->object != NULL) {
1146 		vm_map_remove(kernel_map, (vm_offset_t) ef->address,
1147 		    (vm_offset_t) ef->address
1148 		    + (ef->object->size << PAGE_SHIFT));
1149 	}
1150 #else
1151 	free(ef->address, M_LINKER);
1152 #endif
1153 	free(ef->symbase, M_LINKER);
1154 	free(ef->strbase, M_LINKER);
1155 	free(ef->ctftab, M_LINKER);
1156 	free(ef->ctfoff, M_LINKER);
1157 	free(ef->typoff, M_LINKER);
1158 }
1159 
1160 static void
1161 link_elf_unload_preload(linker_file_t file)
1162 {
1163 	if (file->filename != NULL)
1164 		preload_delete_name(file->filename);
1165 }
1166 
1167 static const char *
1168 symbol_name(elf_file_t ef, Elf_Size r_info)
1169 {
1170 	const Elf_Sym *ref;
1171 
1172 	if (ELF_R_SYM(r_info)) {
1173 		ref = ef->symtab + ELF_R_SYM(r_info);
1174 		return (ef->strtab + ref->st_name);
1175 	}
1176 	return (NULL);
1177 }
1178 
1179 static int
1180 relocate_file(elf_file_t ef)
1181 {
1182 	const Elf_Rel *rellim;
1183 	const Elf_Rel *rel;
1184 	const Elf_Rela *relalim;
1185 	const Elf_Rela *rela;
1186 	const char *symname;
1187 
1188 	/* Perform relocations without addend if there are any: */
1189 	rel = ef->rel;
1190 	if (rel != NULL) {
1191 		rellim = (const Elf_Rel *)
1192 		    ((const char *)ef->rel + ef->relsize);
1193 		while (rel < rellim) {
1194 			if (elf_reloc(&ef->lf, (Elf_Addr)ef->address, rel,
1195 			    ELF_RELOC_REL, elf_lookup)) {
1196 				symname = symbol_name(ef, rel->r_info);
1197 				printf("link_elf: symbol %s undefined\n", symname);
1198 				return (ENOENT);
1199 			}
1200 			rel++;
1201 		}
1202 	}
1203 
1204 	/* Perform relocations with addend if there are any: */
1205 	rela = ef->rela;
1206 	if (rela != NULL) {
1207 		relalim = (const Elf_Rela *)
1208 		    ((const char *)ef->rela + ef->relasize);
1209 		while (rela < relalim) {
1210 			if (elf_reloc(&ef->lf, (Elf_Addr)ef->address, rela,
1211 			    ELF_RELOC_RELA, elf_lookup)) {
1212 				symname = symbol_name(ef, rela->r_info);
1213 				printf("link_elf: symbol %s undefined\n",
1214 				    symname);
1215 				return (ENOENT);
1216 			}
1217 			rela++;
1218 		}
1219 	}
1220 
1221 	/* Perform PLT relocations without addend if there are any: */
1222 	rel = ef->pltrel;
1223 	if (rel != NULL) {
1224 		rellim = (const Elf_Rel *)
1225 		    ((const char *)ef->pltrel + ef->pltrelsize);
1226 		while (rel < rellim) {
1227 			if (elf_reloc(&ef->lf, (Elf_Addr)ef->address, rel,
1228 			    ELF_RELOC_REL, elf_lookup)) {
1229 				symname = symbol_name(ef, rel->r_info);
1230 				printf("link_elf: symbol %s undefined\n",
1231 				    symname);
1232 				return (ENOENT);
1233 			}
1234 			rel++;
1235 		}
1236 	}
1237 
1238 	/* Perform relocations with addend if there are any: */
1239 	rela = ef->pltrela;
1240 	if (rela != NULL) {
1241 		relalim = (const Elf_Rela *)
1242 		    ((const char *)ef->pltrela + ef->pltrelasize);
1243 		while (rela < relalim) {
1244 			if (elf_reloc(&ef->lf, (Elf_Addr)ef->address, rela,
1245 			    ELF_RELOC_RELA, elf_lookup)) {
1246 				symname = symbol_name(ef, rela->r_info);
1247 				printf("link_elf: symbol %s undefined\n",
1248 				    symname);
1249 				return (ENOENT);
1250 			}
1251 			rela++;
1252 		}
1253 	}
1254 
1255 	return (0);
1256 }
1257 
/*
 * Hash function for symbol table lookup, as specified by the System V ABI.
 * The values it produces must not change.
 *
 * The ABI's sample code accumulates in an unsigned long.  Where that type is
 * wider than 32 bits, adding the next character to (h << 4) can carry past
 * bit 31, and that stray bit is never cleared, so the result differs from
 * the one a 32-bit unsigned long produces.  Accumulating in exactly 32 bits
 * and masking the final value to 28 bits gives the 32-bit result on every
 * platform.
 *
 * name: NUL-terminated symbol name; bytes are hashed as unsigned char.
 * Returns the hash, always in the range [0, 0x0fffffff].
 */
static unsigned long
elf_hash(const char *name)
{
	const unsigned char *p = (const unsigned char *)name;
	uint32_t h = 0;

	while (*p != '\0') {
		h = (h << 4) + *p++;
		/*
		 * Fold bits 28-31 into bits 4-7.  The top nibble itself is
		 * shifted out on the next round or masked off on return.
		 */
		h ^= (h >> 24) & 0xf0;
	}
	return (h & 0x0fffffff);
}
1277 
1278 static int
1279 link_elf_lookup_symbol(linker_file_t lf, const char* name, c_linker_sym_t* sym)
1280 {
1281 	elf_file_t ef = (elf_file_t) lf;
1282 	unsigned long symnum;
1283 	const Elf_Sym* symp;
1284 	const char *strp;
1285 	unsigned long hash;
1286 	int i;
1287 
1288 	/* If we don't have a hash, bail. */
1289 	if (ef->buckets == NULL || ef->nbuckets == 0) {
1290 		printf("link_elf_lookup_symbol: missing symbol hash table\n");
1291 		return (ENOENT);
1292 	}
1293 
1294 	/* First, search hashed global symbols */
1295 	hash = elf_hash(name);
1296 	symnum = ef->buckets[hash % ef->nbuckets];
1297 
1298 	while (symnum != STN_UNDEF) {
1299 		if (symnum >= ef->nchains) {
1300 			printf("%s: corrupt symbol table\n", __func__);
1301 			return (ENOENT);
1302 		}
1303 
1304 		symp = ef->symtab + symnum;
1305 		if (symp->st_name == 0) {
1306 			printf("%s: corrupt symbol table\n", __func__);
1307 			return (ENOENT);
1308 		}
1309 
1310 		strp = ef->strtab + symp->st_name;
1311 
1312 		if (strcmp(name, strp) == 0) {
1313 			if (symp->st_shndx != SHN_UNDEF ||
1314 			    (symp->st_value != 0 &&
1315 			     ELF_ST_TYPE(symp->st_info) == STT_FUNC)) {
1316 				*sym = (c_linker_sym_t) symp;
1317 				return (0);
1318 			}
1319 			return (ENOENT);
1320 		}
1321 
1322 		symnum = ef->chains[symnum];
1323 	}
1324 
1325 	/* If we have not found it, look at the full table (if loaded) */
1326 	if (ef->symtab == ef->ddbsymtab)
1327 		return (ENOENT);
1328 
1329 	/* Exhaustive search */
1330 	for (i = 0, symp = ef->ddbsymtab; i < ef->ddbsymcnt; i++, symp++) {
1331 		strp = ef->ddbstrtab + symp->st_name;
1332 		if (strcmp(name, strp) == 0) {
1333 			if (symp->st_shndx != SHN_UNDEF ||
1334 			    (symp->st_value != 0 &&
1335 			     ELF_ST_TYPE(symp->st_info) == STT_FUNC)) {
1336 				*sym = (c_linker_sym_t) symp;
1337 				return (0);
1338 			}
1339 			return (ENOENT);
1340 		}
1341 	}
1342 
1343 	return (ENOENT);
1344 }
1345 
1346 static int
1347 link_elf_symbol_values(linker_file_t lf, c_linker_sym_t sym,
1348     linker_symval_t *symval)
1349 {
1350 	elf_file_t ef = (elf_file_t) lf;
1351 	const Elf_Sym* es = (const Elf_Sym*) sym;
1352 
1353 	if (es >= ef->symtab && es < (ef->symtab + ef->nchains)) {
1354 		symval->name = ef->strtab + es->st_name;
1355 		symval->value = (caddr_t) ef->address + es->st_value;
1356 		symval->size = es->st_size;
1357 		return (0);
1358 	}
1359 	if (ef->symtab == ef->ddbsymtab)
1360 		return (ENOENT);
1361 	if (es >= ef->ddbsymtab && es < (ef->ddbsymtab + ef->ddbsymcnt)) {
1362 		symval->name = ef->ddbstrtab + es->st_name;
1363 		symval->value = (caddr_t) ef->address + es->st_value;
1364 		symval->size = es->st_size;
1365 		return (0);
1366 	}
1367 	return (ENOENT);
1368 }
1369 
1370 static int
1371 link_elf_search_symbol(linker_file_t lf, caddr_t value,
1372     c_linker_sym_t *sym, long *diffp)
1373 {
1374 	elf_file_t ef = (elf_file_t) lf;
1375 	u_long off = (uintptr_t) (void *) value;
1376 	u_long diff = off;
1377 	u_long st_value;
1378 	const Elf_Sym* es;
1379 	const Elf_Sym* best = NULL;
1380 	int i;
1381 
1382 	for (i = 0, es = ef->ddbsymtab; i < ef->ddbsymcnt; i++, es++) {
1383 		if (es->st_name == 0)
1384 			continue;
1385 		st_value = es->st_value + (uintptr_t) (void *) ef->address;
1386 		if (off >= st_value) {
1387 			if (off - st_value < diff) {
1388 				diff = off - st_value;
1389 				best = es;
1390 				if (diff == 0)
1391 					break;
1392 			} else if (off - st_value == diff) {
1393 				best = es;
1394 			}
1395 		}
1396 	}
1397 	if (best == NULL)
1398 		*diffp = off;
1399 	else
1400 		*diffp = diff;
1401 	*sym = (c_linker_sym_t) best;
1402 
1403 	return (0);
1404 }
1405 
1406 /*
1407  * Look up a linker set on an ELF system.
1408  */
1409 static int
1410 link_elf_lookup_set(linker_file_t lf, const char *name,
1411     void ***startp, void ***stopp, int *countp)
1412 {
1413 	c_linker_sym_t sym;
1414 	linker_symval_t symval;
1415 	char *setsym;
1416 	void **start, **stop;
1417 	int len, error = 0, count;
1418 
1419 	len = strlen(name) + sizeof("__start_set_"); /* sizeof includes \0 */
1420 	setsym = malloc(len, M_LINKER, M_WAITOK);
1421 
1422 	/* get address of first entry */
1423 	snprintf(setsym, len, "%s%s", "__start_set_", name);
1424 	error = link_elf_lookup_symbol(lf, setsym, &sym);
1425 	if (error != 0)
1426 		goto out;
1427 	link_elf_symbol_values(lf, sym, &symval);
1428 	if (symval.value == 0) {
1429 		error = ESRCH;
1430 		goto out;
1431 	}
1432 	start = (void **)symval.value;
1433 
1434 	/* get address of last entry */
1435 	snprintf(setsym, len, "%s%s", "__stop_set_", name);
1436 	error = link_elf_lookup_symbol(lf, setsym, &sym);
1437 	if (error != 0)
1438 		goto out;
1439 	link_elf_symbol_values(lf, sym, &symval);
1440 	if (symval.value == 0) {
1441 		error = ESRCH;
1442 		goto out;
1443 	}
1444 	stop = (void **)symval.value;
1445 
1446 	/* and the number of entries */
1447 	count = stop - start;
1448 
1449 	/* and copy out */
1450 	if (startp != NULL)
1451 		*startp = start;
1452 	if (stopp != NULL)
1453 		*stopp = stop;
1454 	if (countp != NULL)
1455 		*countp = count;
1456 
1457 out:
1458 	free(setsym, M_LINKER);
1459 	return (error);
1460 }
1461 
1462 static int
1463 link_elf_each_function_name(linker_file_t file,
1464   int (*callback)(const char *, void *), void *opaque)
1465 {
1466 	elf_file_t ef = (elf_file_t)file;
1467 	const Elf_Sym *symp;
1468 	int i, error;
1469 
1470 	/* Exhaustive search */
1471 	for (i = 0, symp = ef->ddbsymtab; i < ef->ddbsymcnt; i++, symp++) {
1472 		if (symp->st_value != 0 &&
1473 		    ELF_ST_TYPE(symp->st_info) == STT_FUNC) {
1474 			error = callback(ef->ddbstrtab + symp->st_name, opaque);
1475 			if (error != 0)
1476 				return (error);
1477 		}
1478 	}
1479 	return (0);
1480 }
1481 
1482 static int
1483 link_elf_each_function_nameval(linker_file_t file,
1484     linker_function_nameval_callback_t callback, void *opaque)
1485 {
1486 	linker_symval_t symval;
1487 	elf_file_t ef = (elf_file_t)file;
1488 	const Elf_Sym* symp;
1489 	int i, error;
1490 
1491 	/* Exhaustive search */
1492 	for (i = 0, symp = ef->ddbsymtab; i < ef->ddbsymcnt; i++, symp++) {
1493 		if (symp->st_value != 0 &&
1494 		    ELF_ST_TYPE(symp->st_info) == STT_FUNC) {
1495 			error = link_elf_symbol_values(file,
1496 			    (c_linker_sym_t) symp, &symval);
1497 			if (error != 0)
1498 				return (error);
1499 			error = callback(file, i, &symval, opaque);
1500 			if (error != 0)
1501 				return (error);
1502 		}
1503 	}
1504 	return (0);
1505 }
1506 
1507 const Elf_Sym *
1508 elf_get_sym(linker_file_t lf, Elf_Size symidx)
1509 {
1510 	elf_file_t ef = (elf_file_t)lf;
1511 
1512 	if (symidx >= ef->nchains)
1513 		return (NULL);
1514 	return (ef->symtab + symidx);
1515 }
1516 
1517 const char *
1518 elf_get_symname(linker_file_t lf, Elf_Size symidx)
1519 {
1520 	elf_file_t ef = (elf_file_t)lf;
1521 	const Elf_Sym *sym;
1522 
1523 	if (symidx >= ef->nchains)
1524 		return (NULL);
1525 	sym = ef->symtab + symidx;
1526 	return (ef->strtab + sym->st_name);
1527 }
1528 
1529 /*
1530  * Symbol lookup function that can be used when the symbol index is known (ie
1531  * in relocations). It uses the symbol index instead of doing a fully fledged
1532  * hash table based lookup when such is valid. For example for local symbols.
1533  * This is not only more efficient, it's also more correct. It's not always
1534  * the case that the symbol can be found through the hash table.
1535  */
1536 static int
1537 elf_lookup(linker_file_t lf, Elf_Size symidx, int deps, Elf_Addr *res)
1538 {
1539 	elf_file_t ef = (elf_file_t)lf;
1540 	const Elf_Sym *sym;
1541 	const char *symbol;
1542 	Elf_Addr addr, start, base;
1543 
1544 	/* Don't even try to lookup the symbol if the index is bogus. */
1545 	if (symidx >= ef->nchains) {
1546 		*res = 0;
1547 		return (EINVAL);
1548 	}
1549 
1550 	sym = ef->symtab + symidx;
1551 
1552 	/*
1553 	 * Don't do a full lookup when the symbol is local. It may even
1554 	 * fail because it may not be found through the hash table.
1555 	 */
1556 	if (ELF_ST_BIND(sym->st_info) == STB_LOCAL) {
1557 		/* Force lookup failure when we have an insanity. */
1558 		if (sym->st_shndx == SHN_UNDEF || sym->st_value == 0) {
1559 			*res = 0;
1560 			return (EINVAL);
1561 		}
1562 		*res = ((Elf_Addr)ef->address + sym->st_value);
1563 		return (0);
1564 	}
1565 
1566 	/*
1567 	 * XXX we can avoid doing a hash table based lookup for global
1568 	 * symbols as well. This however is not always valid, so we'll
1569 	 * just do it the hard way for now. Performance tweaks can
1570 	 * always be added.
1571 	 */
1572 
1573 	symbol = ef->strtab + sym->st_name;
1574 
1575 	/* Force a lookup failure if the symbol name is bogus. */
1576 	if (*symbol == 0) {
1577 		*res = 0;
1578 		return (EINVAL);
1579 	}
1580 
1581 	addr = ((Elf_Addr)linker_file_lookup_symbol(lf, symbol, deps));
1582 	if (addr == 0 && ELF_ST_BIND(sym->st_info) != STB_WEAK) {
1583 		*res = 0;
1584 		return (EINVAL);
1585 	}
1586 
1587 	if (elf_set_find(&set_pcpu_list, addr, &start, &base))
1588 		addr = addr - start + base;
1589 #ifdef VIMAGE
1590 	else if (elf_set_find(&set_vnet_list, addr, &start, &base))
1591 		addr = addr - start + base;
1592 #endif
1593 	*res = addr;
1594 	return (0);
1595 }
1596 
1597 static void
1598 link_elf_reloc_local(linker_file_t lf)
1599 {
1600 	const Elf_Rel *rellim;
1601 	const Elf_Rel *rel;
1602 	const Elf_Rela *relalim;
1603 	const Elf_Rela *rela;
1604 	elf_file_t ef = (elf_file_t)lf;
1605 
1606 	/* Perform relocations without addend if there are any: */
1607 	if ((rel = ef->rel) != NULL) {
1608 		rellim = (const Elf_Rel *)((const char *)ef->rel + ef->relsize);
1609 		while (rel < rellim) {
1610 			elf_reloc_local(lf, (Elf_Addr)ef->address, rel,
1611 			    ELF_RELOC_REL, elf_lookup);
1612 			rel++;
1613 		}
1614 	}
1615 
1616 	/* Perform relocations with addend if there are any: */
1617 	if ((rela = ef->rela) != NULL) {
1618 		relalim = (const Elf_Rela *)
1619 		    ((const char *)ef->rela + ef->relasize);
1620 		while (rela < relalim) {
1621 			elf_reloc_local(lf, (Elf_Addr)ef->address, rela,
1622 			    ELF_RELOC_RELA, elf_lookup);
1623 			rela++;
1624 		}
1625 	}
1626 }
1627 
1628 static long
1629 link_elf_symtab_get(linker_file_t lf, const Elf_Sym **symtab)
1630 {
1631 	elf_file_t ef = (elf_file_t)lf;
1632 
1633 	*symtab = ef->ddbsymtab;
1634 
1635 	if (*symtab == NULL)
1636 		return (0);
1637 
1638 	return (ef->ddbsymcnt);
1639 }
1640 
1641 static long
1642 link_elf_strtab_get(linker_file_t lf, caddr_t *strtab)
1643 {
1644 	elf_file_t ef = (elf_file_t)lf;
1645 
1646 	*strtab = ef->ddbstrtab;
1647 
1648 	if (*strtab == NULL)
1649 		return (0);
1650 
1651 	return (ef->ddbstrcnt);
1652 }
1653