xref: /illumos-gate/usr/src/lib/libdtrace/common/dt_module.c (revision 66582b606a8194f7f3ba5b3a3a6dca5b0d346361)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 
22 /*
23  * Copyright (c) 2003, 2010, Oracle and/or its affiliates. All rights reserved.
24  */
25 /*
26  * Copyright (c) 2013, Joyent, Inc.  All rights reserved.
27  */
28 
29 #include <sys/types.h>
30 #include <sys/modctl.h>
31 #include <sys/kobj.h>
32 #include <sys/kobj_impl.h>
33 #include <sys/sysmacros.h>
34 #include <sys/elf.h>
35 #include <sys/task.h>
36 
37 #include <unistd.h>
38 #include <project.h>
39 #include <strings.h>
40 #include <stdlib.h>
41 #include <libelf.h>
42 #include <limits.h>
43 #include <assert.h>
44 #include <errno.h>
45 #include <dirent.h>
46 
47 #include <dt_strtab.h>
48 #include <dt_module.h>
49 #include <dt_impl.h>
50 
51 static const char *dt_module_strtab; /* active strtab for qsort callbacks */
52 
53 static void
54 dt_module_symhash_insert(dt_module_t *dmp, const char *name, uint_t id)
55 {
56 	dt_sym_t *dsp = &dmp->dm_symchains[dmp->dm_symfree];
57 	uint_t h;
58 
59 	assert(dmp->dm_symfree < dmp->dm_nsymelems + 1);
60 
61 	dsp->ds_symid = id;
62 	h = dt_strtab_hash(name, NULL) % dmp->dm_nsymbuckets;
63 	dsp->ds_next = dmp->dm_symbuckets[h];
64 	dmp->dm_symbuckets[h] = dmp->dm_symfree++;
65 }
66 
67 static uint_t
68 dt_module_syminit32(dt_module_t *dmp)
69 {
70 #if STT_NUM != (STT_TLS + 1)
71 #error "STT_NUM has grown. update dt_module_syminit32()"
72 #endif
73 
74 	const Elf32_Sym *sym = dmp->dm_symtab.cts_data;
75 	const char *base = dmp->dm_strtab.cts_data;
76 	size_t ss_size = dmp->dm_strtab.cts_size;
77 	uint_t i, n = dmp->dm_nsymelems;
78 	uint_t asrsv = 0;
79 
80 	for (i = 0; i < n; i++, sym++) {
81 		const char *name = base + sym->st_name;
82 		uchar_t type = ELF32_ST_TYPE(sym->st_info);
83 
84 		if (type >= STT_NUM || type == STT_SECTION)
85 			continue; /* skip sections and unknown types */
86 
87 		if (sym->st_name == 0 || sym->st_name >= ss_size)
88 			continue; /* skip null or invalid names */
89 
90 		if (sym->st_value != 0 &&
91 		    (ELF32_ST_BIND(sym->st_info) != STB_LOCAL || sym->st_size))
92 			asrsv++; /* reserve space in the address map */
93 
94 		dt_module_symhash_insert(dmp, name, i);
95 	}
96 
97 	return (asrsv);
98 }
99 
100 static uint_t
101 dt_module_syminit64(dt_module_t *dmp)
102 {
103 #if STT_NUM != (STT_TLS + 1)
104 #error "STT_NUM has grown. update dt_module_syminit64()"
105 #endif
106 
107 	const Elf64_Sym *sym = dmp->dm_symtab.cts_data;
108 	const char *base = dmp->dm_strtab.cts_data;
109 	size_t ss_size = dmp->dm_strtab.cts_size;
110 	uint_t i, n = dmp->dm_nsymelems;
111 	uint_t asrsv = 0;
112 
113 	for (i = 0; i < n; i++, sym++) {
114 		const char *name = base + sym->st_name;
115 		uchar_t type = ELF64_ST_TYPE(sym->st_info);
116 
117 		if (type >= STT_NUM || type == STT_SECTION)
118 			continue; /* skip sections and unknown types */
119 
120 		if (sym->st_name == 0 || sym->st_name >= ss_size)
121 			continue; /* skip null or invalid names */
122 
123 		if (sym->st_value != 0 &&
124 		    (ELF64_ST_BIND(sym->st_info) != STB_LOCAL || sym->st_size))
125 			asrsv++; /* reserve space in the address map */
126 
127 		dt_module_symhash_insert(dmp, name, i);
128 	}
129 
130 	return (asrsv);
131 }
132 
133 /*
134  * Sort comparison function for 32-bit symbol address-to-name lookups.  We sort
135  * symbols by value.  If values are equal, we prefer the symbol that is
136  * non-zero sized, typed, not weak, or lexically first, in that order.
137  */
138 static int
139 dt_module_symcomp32(const void *lp, const void *rp)
140 {
141 	Elf32_Sym *lhs = *((Elf32_Sym **)lp);
142 	Elf32_Sym *rhs = *((Elf32_Sym **)rp);
143 
144 	if (lhs->st_value != rhs->st_value)
145 		return (lhs->st_value > rhs->st_value ? 1 : -1);
146 
147 	if ((lhs->st_size == 0) != (rhs->st_size == 0))
148 		return (lhs->st_size == 0 ? 1 : -1);
149 
150 	if ((ELF32_ST_TYPE(lhs->st_info) == STT_NOTYPE) !=
151 	    (ELF32_ST_TYPE(rhs->st_info) == STT_NOTYPE))
152 		return (ELF32_ST_TYPE(lhs->st_info) == STT_NOTYPE ? 1 : -1);
153 
154 	if ((ELF32_ST_BIND(lhs->st_info) == STB_WEAK) !=
155 	    (ELF32_ST_BIND(rhs->st_info) == STB_WEAK))
156 		return (ELF32_ST_BIND(lhs->st_info) == STB_WEAK ? 1 : -1);
157 
158 	return (strcmp(dt_module_strtab + lhs->st_name,
159 	    dt_module_strtab + rhs->st_name));
160 }
161 
162 /*
163  * Sort comparison function for 64-bit symbol address-to-name lookups.  We sort
164  * symbols by value.  If values are equal, we prefer the symbol that is
165  * non-zero sized, typed, not weak, or lexically first, in that order.
166  */
167 static int
168 dt_module_symcomp64(const void *lp, const void *rp)
169 {
170 	Elf64_Sym *lhs = *((Elf64_Sym **)lp);
171 	Elf64_Sym *rhs = *((Elf64_Sym **)rp);
172 
173 	if (lhs->st_value != rhs->st_value)
174 		return (lhs->st_value > rhs->st_value ? 1 : -1);
175 
176 	if ((lhs->st_size == 0) != (rhs->st_size == 0))
177 		return (lhs->st_size == 0 ? 1 : -1);
178 
179 	if ((ELF64_ST_TYPE(lhs->st_info) == STT_NOTYPE) !=
180 	    (ELF64_ST_TYPE(rhs->st_info) == STT_NOTYPE))
181 		return (ELF64_ST_TYPE(lhs->st_info) == STT_NOTYPE ? 1 : -1);
182 
183 	if ((ELF64_ST_BIND(lhs->st_info) == STB_WEAK) !=
184 	    (ELF64_ST_BIND(rhs->st_info) == STB_WEAK))
185 		return (ELF64_ST_BIND(lhs->st_info) == STB_WEAK ? 1 : -1);
186 
187 	return (strcmp(dt_module_strtab + lhs->st_name,
188 	    dt_module_strtab + rhs->st_name));
189 }
190 
191 static void
192 dt_module_symsort32(dt_module_t *dmp)
193 {
194 	Elf32_Sym *symtab = (Elf32_Sym *)dmp->dm_symtab.cts_data;
195 	Elf32_Sym **sympp = (Elf32_Sym **)dmp->dm_asmap;
196 	const dt_sym_t *dsp = dmp->dm_symchains + 1;
197 	uint_t i, n = dmp->dm_symfree;
198 
199 	for (i = 1; i < n; i++, dsp++) {
200 		Elf32_Sym *sym = symtab + dsp->ds_symid;
201 		if (sym->st_value != 0 &&
202 		    (ELF32_ST_BIND(sym->st_info) != STB_LOCAL || sym->st_size))
203 			*sympp++ = sym;
204 	}
205 
206 	dmp->dm_aslen = (uint_t)(sympp - (Elf32_Sym **)dmp->dm_asmap);
207 	assert(dmp->dm_aslen <= dmp->dm_asrsv);
208 
209 	dt_module_strtab = dmp->dm_strtab.cts_data;
210 	qsort(dmp->dm_asmap, dmp->dm_aslen,
211 	    sizeof (Elf32_Sym *), dt_module_symcomp32);
212 	dt_module_strtab = NULL;
213 }
214 
215 static void
216 dt_module_symsort64(dt_module_t *dmp)
217 {
218 	Elf64_Sym *symtab = (Elf64_Sym *)dmp->dm_symtab.cts_data;
219 	Elf64_Sym **sympp = (Elf64_Sym **)dmp->dm_asmap;
220 	const dt_sym_t *dsp = dmp->dm_symchains + 1;
221 	uint_t i, n = dmp->dm_symfree;
222 
223 	for (i = 1; i < n; i++, dsp++) {
224 		Elf64_Sym *sym = symtab + dsp->ds_symid;
225 		if (sym->st_value != 0 &&
226 		    (ELF64_ST_BIND(sym->st_info) != STB_LOCAL || sym->st_size))
227 			*sympp++ = sym;
228 	}
229 
230 	dmp->dm_aslen = (uint_t)(sympp - (Elf64_Sym **)dmp->dm_asmap);
231 	assert(dmp->dm_aslen <= dmp->dm_asrsv);
232 
233 	dt_module_strtab = dmp->dm_strtab.cts_data;
234 	qsort(dmp->dm_asmap, dmp->dm_aslen,
235 	    sizeof (Elf64_Sym *), dt_module_symcomp64);
236 	dt_module_strtab = NULL;
237 }
238 
239 static GElf_Sym *
240 dt_module_symgelf32(const Elf32_Sym *src, GElf_Sym *dst)
241 {
242 	if (dst != NULL) {
243 		dst->st_name = src->st_name;
244 		dst->st_info = src->st_info;
245 		dst->st_other = src->st_other;
246 		dst->st_shndx = src->st_shndx;
247 		dst->st_value = src->st_value;
248 		dst->st_size = src->st_size;
249 	}
250 
251 	return (dst);
252 }
253 
254 static GElf_Sym *
255 dt_module_symgelf64(const Elf64_Sym *src, GElf_Sym *dst)
256 {
257 	if (dst != NULL)
258 		bcopy(src, dst, sizeof (GElf_Sym));
259 
260 	return (dst);
261 }
262 
263 static GElf_Sym *
264 dt_module_symname32(dt_module_t *dmp, const char *name,
265     GElf_Sym *symp, uint_t *idp)
266 {
267 	const Elf32_Sym *symtab = dmp->dm_symtab.cts_data;
268 	const char *strtab = dmp->dm_strtab.cts_data;
269 
270 	const Elf32_Sym *sym;
271 	const dt_sym_t *dsp;
272 	uint_t i, h;
273 
274 	if (dmp->dm_nsymelems == 0)
275 		return (NULL);
276 
277 	h = dt_strtab_hash(name, NULL) % dmp->dm_nsymbuckets;
278 
279 	for (i = dmp->dm_symbuckets[h]; i != 0; i = dsp->ds_next) {
280 		dsp = &dmp->dm_symchains[i];
281 		sym = symtab + dsp->ds_symid;
282 
283 		if (strcmp(name, strtab + sym->st_name) == 0) {
284 			if (idp != NULL)
285 				*idp = dsp->ds_symid;
286 			return (dt_module_symgelf32(sym, symp));
287 		}
288 	}
289 
290 	return (NULL);
291 }
292 
293 static GElf_Sym *
294 dt_module_symname64(dt_module_t *dmp, const char *name,
295     GElf_Sym *symp, uint_t *idp)
296 {
297 	const Elf64_Sym *symtab = dmp->dm_symtab.cts_data;
298 	const char *strtab = dmp->dm_strtab.cts_data;
299 
300 	const Elf64_Sym *sym;
301 	const dt_sym_t *dsp;
302 	uint_t i, h;
303 
304 	if (dmp->dm_nsymelems == 0)
305 		return (NULL);
306 
307 	h = dt_strtab_hash(name, NULL) % dmp->dm_nsymbuckets;
308 
309 	for (i = dmp->dm_symbuckets[h]; i != 0; i = dsp->ds_next) {
310 		dsp = &dmp->dm_symchains[i];
311 		sym = symtab + dsp->ds_symid;
312 
313 		if (strcmp(name, strtab + sym->st_name) == 0) {
314 			if (idp != NULL)
315 				*idp = dsp->ds_symid;
316 			return (dt_module_symgelf64(sym, symp));
317 		}
318 	}
319 
320 	return (NULL);
321 }
322 
323 static GElf_Sym *
324 dt_module_symaddr32(dt_module_t *dmp, GElf_Addr addr,
325     GElf_Sym *symp, uint_t *idp)
326 {
327 	const Elf32_Sym **asmap = (const Elf32_Sym **)dmp->dm_asmap;
328 	const Elf32_Sym *symtab = dmp->dm_symtab.cts_data;
329 	const Elf32_Sym *sym;
330 
331 	uint_t i, mid, lo = 0, hi = dmp->dm_aslen - 1;
332 	Elf32_Addr v;
333 
334 	if (dmp->dm_aslen == 0)
335 		return (NULL);
336 
337 	while (hi - lo > 1) {
338 		mid = (lo + hi) / 2;
339 		if (addr >= asmap[mid]->st_value)
340 			lo = mid;
341 		else
342 			hi = mid;
343 	}
344 
345 	i = addr < asmap[hi]->st_value ? lo : hi;
346 	sym = asmap[i];
347 	v = sym->st_value;
348 
349 	/*
350 	 * If the previous entry has the same value, improve our choice.  The
351 	 * order of equal-valued symbols is determined by the comparison func.
352 	 */
353 	while (i-- != 0 && asmap[i]->st_value == v)
354 		sym = asmap[i];
355 
356 	if (addr - sym->st_value < MAX(sym->st_size, 1)) {
357 		if (idp != NULL)
358 			*idp = (uint_t)(sym - symtab);
359 		return (dt_module_symgelf32(sym, symp));
360 	}
361 
362 	return (NULL);
363 }
364 
365 static GElf_Sym *
366 dt_module_symaddr64(dt_module_t *dmp, GElf_Addr addr,
367     GElf_Sym *symp, uint_t *idp)
368 {
369 	const Elf64_Sym **asmap = (const Elf64_Sym **)dmp->dm_asmap;
370 	const Elf64_Sym *symtab = dmp->dm_symtab.cts_data;
371 	const Elf64_Sym *sym;
372 
373 	uint_t i, mid, lo = 0, hi = dmp->dm_aslen - 1;
374 	Elf64_Addr v;
375 
376 	if (dmp->dm_aslen == 0)
377 		return (NULL);
378 
379 	while (hi - lo > 1) {
380 		mid = (lo + hi) / 2;
381 		if (addr >= asmap[mid]->st_value)
382 			lo = mid;
383 		else
384 			hi = mid;
385 	}
386 
387 	i = addr < asmap[hi]->st_value ? lo : hi;
388 	sym = asmap[i];
389 	v = sym->st_value;
390 
391 	/*
392 	 * If the previous entry has the same value, improve our choice.  The
393 	 * order of equal-valued symbols is determined by the comparison func.
394 	 */
395 	while (i-- != 0 && asmap[i]->st_value == v)
396 		sym = asmap[i];
397 
398 	if (addr - sym->st_value < MAX(sym->st_size, 1)) {
399 		if (idp != NULL)
400 			*idp = (uint_t)(sym - symtab);
401 		return (dt_module_symgelf64(sym, symp));
402 	}
403 
404 	return (NULL);
405 }
406 
/*
 * Symbol operations for modules whose symbol table holds Elf32_Sym entries.
 * The initializer is positional, so the order of the functions must match
 * the member order of dt_modops_t (that declaration is not visible here).
 */
static const dt_modops_t dt_modops_32 = {
	dt_module_syminit32,
	dt_module_symsort32,
	dt_module_symname32,
	dt_module_symaddr32
};
413 
/*
 * Symbol operations for modules whose symbol table holds Elf64_Sym entries.
 * The initializer is positional, so the order of the functions must match
 * the member order of dt_modops_t (that declaration is not visible here).
 */
static const dt_modops_t dt_modops_64 = {
	dt_module_syminit64,
	dt_module_symsort64,
	dt_module_symname64,
	dt_module_symaddr64
};
420 
421 dt_module_t *
422 dt_module_create(dtrace_hdl_t *dtp, const char *name)
423 {
424 	long pid;
425 	char *eptr;
426 	dt_ident_t *idp;
427 	uint_t h = dt_strtab_hash(name, NULL) % dtp->dt_modbuckets;
428 	dt_module_t *dmp;
429 
430 	for (dmp = dtp->dt_mods[h]; dmp != NULL; dmp = dmp->dm_next) {
431 		if (strcmp(dmp->dm_name, name) == 0)
432 			return (dmp);
433 	}
434 
435 	if ((dmp = malloc(sizeof (dt_module_t))) == NULL)
436 		return (NULL); /* caller must handle allocation failure */
437 
438 	bzero(dmp, sizeof (dt_module_t));
439 	(void) strlcpy(dmp->dm_name, name, sizeof (dmp->dm_name));
440 	dt_list_append(&dtp->dt_modlist, dmp);
441 	dmp->dm_next = dtp->dt_mods[h];
442 	dtp->dt_mods[h] = dmp;
443 	dtp->dt_nmods++;
444 
445 	if (dtp->dt_conf.dtc_ctfmodel == CTF_MODEL_LP64)
446 		dmp->dm_ops = &dt_modops_64;
447 	else
448 		dmp->dm_ops = &dt_modops_32;
449 
450 	/*
451 	 * Modules for userland processes are special. They always refer to a
452 	 * specific process and have a copy of their CTF data from a specific
453 	 * instant in time. Any dt_module_t that begins with 'pid' is a module
454 	 * for a specific process, much like how any probe description that
455 	 * begins with 'pid' is special. pid123 refers to process 123. A module
456 	 * that is just 'pid' refers specifically to pid$target. This is
457 	 * generally done as D does not currently allow for macros to be
458 	 * evaluated when working with types.
459 	 */
460 	if (strncmp(dmp->dm_name, "pid", 3) == 0) {
461 		errno = 0;
462 		if (dmp->dm_name[3] == '\0') {
463 			idp = dt_idhash_lookup(dtp->dt_macros, "target");
464 			if (idp != NULL && idp->di_id != 0)
465 				dmp->dm_pid = idp->di_id;
466 		} else {
467 			pid = strtol(dmp->dm_name + 3, &eptr, 10);
468 			if (errno == 0 && *eptr == '\0')
469 				dmp->dm_pid = (pid_t)pid;
470 			else
471 				dt_dprintf("encountered malformed pid "
472 				    "module: %s\n", dmp->dm_name);
473 		}
474 	}
475 
476 	return (dmp);
477 }
478 
479 dt_module_t *
480 dt_module_lookup_by_name(dtrace_hdl_t *dtp, const char *name)
481 {
482 	uint_t h = dt_strtab_hash(name, NULL) % dtp->dt_modbuckets;
483 	dt_module_t *dmp;
484 
485 	for (dmp = dtp->dt_mods[h]; dmp != NULL; dmp = dmp->dm_next) {
486 		if (strcmp(dmp->dm_name, name) == 0)
487 			return (dmp);
488 	}
489 
490 	return (NULL);
491 }
492 
493 /*ARGSUSED*/
494 dt_module_t *
495 dt_module_lookup_by_ctf(dtrace_hdl_t *dtp, ctf_file_t *ctfp)
496 {
497 	return (ctfp ? ctf_getspecific(ctfp) : NULL);
498 }
499 
500 static int
501 dt_module_load_sect(dtrace_hdl_t *dtp, dt_module_t *dmp, ctf_sect_t *ctsp)
502 {
503 	const char *s;
504 	size_t shstrs;
505 	GElf_Shdr sh;
506 	Elf_Data *dp;
507 	Elf_Scn *sp;
508 
509 	if (elf_getshdrstrndx(dmp->dm_elf, &shstrs) == -1)
510 		return (dt_set_errno(dtp, EDT_NOTLOADED));
511 
512 	for (sp = NULL; (sp = elf_nextscn(dmp->dm_elf, sp)) != NULL; ) {
513 		if (gelf_getshdr(sp, &sh) == NULL || sh.sh_type == SHT_NULL ||
514 		    (s = elf_strptr(dmp->dm_elf, shstrs, sh.sh_name)) == NULL)
515 			continue; /* skip any malformed sections */
516 
517 		if (sh.sh_type == ctsp->cts_type &&
518 		    sh.sh_entsize == ctsp->cts_entsize &&
519 		    strcmp(s, ctsp->cts_name) == 0)
520 			break; /* section matches specification */
521 	}
522 
523 	/*
524 	 * If the section isn't found, return success but leave cts_data set
525 	 * to NULL and cts_size set to zero for our caller.
526 	 */
527 	if (sp == NULL || (dp = elf_getdata(sp, NULL)) == NULL)
528 		return (0);
529 
530 	ctsp->cts_data = dp->d_buf;
531 	ctsp->cts_size = dp->d_size;
532 
533 	dt_dprintf("loaded %s [%s] (%lu bytes)\n",
534 	    dmp->dm_name, ctsp->cts_name, (ulong_t)ctsp->cts_size);
535 
536 	return (0);
537 }
538 
/*
 * Argument passed through Pobject_iter_resolved() to the two callbacks used
 * by dt_module_load_proc().
 */
typedef struct dt_module_cb_arg {
	struct ps_prochandle *dpa_proc;	/* process queried for CTF data */
	dtrace_hdl_t *dpa_dtp;		/* handle performing the load */
	dt_module_t *dpa_dmp;		/* module whose CTF arrays are filled */
	uint_t dpa_count;		/* objects with CTF seen so far */
} dt_module_cb_arg_t;
545 
546 /* ARGSUSED */
547 static int
548 dt_module_load_proc_count(void *arg, const prmap_t *prmap, const char *obj)
549 {
550 	ctf_file_t *fp;
551 	dt_module_cb_arg_t *dcp = arg;
552 
553 	/* Try to grab a ctf container if it exists */
554 	fp = Pname_to_ctf(dcp->dpa_proc, obj);
555 	if (fp != NULL)
556 		dcp->dpa_count++;
557 	return (0);
558 }
559 
560 /* ARGSUSED */
561 static int
562 dt_module_load_proc_build(void *arg, const prmap_t *prmap, const char *obj)
563 {
564 	ctf_file_t *fp;
565 	char buf[MAXPATHLEN], *p;
566 	dt_module_cb_arg_t *dcp = arg;
567 	int count = dcp->dpa_count;
568 	Lmid_t lmid;
569 
570 	fp = Pname_to_ctf(dcp->dpa_proc, obj);
571 	if (fp == NULL)
572 		return (0);
573 	fp = ctf_dup(fp);
574 	if (fp == NULL)
575 		return (0);
576 	dcp->dpa_dmp->dm_libctfp[count] = fp;
577 	/*
578 	 * While it'd be nice to simply use objname here, because of our prior
579 	 * actions we'll always get a resolved object name to its on disk file.
580 	 * Like the pid provider, we need to tell a bit of a lie here. The type
581 	 * that the user thinks of is in terms of the libraries they requested,
582 	 * eg. libc.so.1, they don't care about the fact that it's
583 	 * libc_hwcap.so.1.
584 	 */
585 	(void) Pobjname(dcp->dpa_proc, prmap->pr_vaddr, buf, sizeof (buf));
586 	if ((p = strrchr(buf, '/')) == NULL)
587 		p = buf;
588 	else
589 		p++;
590 
591 	/*
592 	 * If for some reason we can't find a link map id for this module, which
593 	 * would be really quite weird. We instead just say the link map id is
594 	 * zero.
595 	 */
596 	if (Plmid(dcp->dpa_proc, prmap->pr_vaddr, &lmid) != 0)
597 		lmid = 0;
598 
599 	if (lmid == 0)
600 		dcp->dpa_dmp->dm_libctfn[count] = strdup(p);
601 	else
602 		(void) asprintf(&dcp->dpa_dmp->dm_libctfn[count],
603 		    "LM%lx`%s", lmid, p);
604 	if (dcp->dpa_dmp->dm_libctfn[count] == NULL)
605 		return (1);
606 	ctf_setspecific(fp, dcp->dpa_dmp);
607 	dcp->dpa_count++;
608 	return (0);
609 }
610 
611 /*
612  * We've been asked to load data that belongs to another process. As such we're
613  * going to pgrab it at this instant, load everything that we might ever care
614  * about, and then drive on. The reason for this is that the process that we're
615  * interested in might be changing. As long as we have grabbed it, then this
616  * can't be a problem for us.
617  *
618  * For now, we're actually going to punt on most things and just try to get CTF
619  * data, nothing else. Basically this is only useful as a source of type
620  * information, we can't go and do the stacktrace lookups, etc.
621  */
622 static int
623 dt_module_load_proc(dtrace_hdl_t *dtp, dt_module_t *dmp)
624 {
625 	struct ps_prochandle *p;
626 	dt_module_cb_arg_t arg;
627 
628 	/*
629 	 * Note that on success we do not release this hold. We must hold this
630 	 * for our life time.
631 	 */
632 	p = dt_proc_grab(dtp, dmp->dm_pid, 0, PGRAB_RDONLY | PGRAB_FORCE);
633 	if (p == NULL) {
634 		dt_dprintf("failed to grab pid: %d\n", (int)dmp->dm_pid);
635 		return (dt_set_errno(dtp, EDT_CANTLOAD));
636 	}
637 	dt_proc_lock(dtp, p);
638 
639 	arg.dpa_proc = p;
640 	arg.dpa_dtp = dtp;
641 	arg.dpa_dmp = dmp;
642 	arg.dpa_count = 0;
643 	if (Pobject_iter_resolved(p, dt_module_load_proc_count, &arg) != 0) {
644 		dt_dprintf("failed to iterate objects\n");
645 		dt_proc_release(dtp, p);
646 		return (dt_set_errno(dtp, EDT_CANTLOAD));
647 	}
648 
649 	if (arg.dpa_count == 0) {
650 		dt_dprintf("no ctf data present\n");
651 		dt_proc_unlock(dtp, p);
652 		dt_proc_release(dtp, p);
653 		return (dt_set_errno(dtp, EDT_CANTLOAD));
654 	}
655 
656 	dmp->dm_libctfp = malloc(sizeof (ctf_file_t *) * arg.dpa_count);
657 	if (dmp->dm_libctfp == NULL) {
658 		dt_proc_unlock(dtp, p);
659 		dt_proc_release(dtp, p);
660 		return (dt_set_errno(dtp, EDT_NOMEM));
661 	}
662 	bzero(dmp->dm_libctfp, sizeof (ctf_file_t *) * arg.dpa_count);
663 
664 	dmp->dm_libctfn = malloc(sizeof (char *) * arg.dpa_count);
665 	if (dmp->dm_libctfn == NULL) {
666 		free(dmp->dm_libctfp);
667 		dt_proc_unlock(dtp, p);
668 		dt_proc_release(dtp, p);
669 		return (dt_set_errno(dtp, EDT_NOMEM));
670 	}
671 	bzero(dmp->dm_libctfn, sizeof (char *) * arg.dpa_count);
672 
673 	dmp->dm_nctflibs = arg.dpa_count;
674 
675 	arg.dpa_count = 0;
676 	if (Pobject_iter_resolved(p, dt_module_load_proc_build, &arg) != 0) {
677 		dt_proc_unlock(dtp, p);
678 		dt_module_unload(dtp, dmp);
679 		dt_proc_release(dtp, p);
680 		return (dt_set_errno(dtp, EDT_CANTLOAD));
681 	}
682 	assert(arg.dpa_count == dmp->dm_nctflibs);
683 	dt_dprintf("loaded %d ctf modules for pid %d\n", arg.dpa_count,
684 	    (int)dmp->dm_pid);
685 
686 	dt_proc_unlock(dtp, p);
687 	dt_proc_release(dtp, p);
688 	dmp->dm_flags |= DT_DM_LOADED;
689 
690 	return (0);
691 }
692 
693 int
694 dt_module_load(dtrace_hdl_t *dtp, dt_module_t *dmp)
695 {
696 	if (dmp->dm_flags & DT_DM_LOADED)
697 		return (0); /* module is already loaded */
698 
699 	if (dmp->dm_pid != 0)
700 		return (dt_module_load_proc(dtp, dmp));
701 
702 	dmp->dm_ctdata.cts_name = ".SUNW_ctf";
703 	dmp->dm_ctdata.cts_type = SHT_PROGBITS;
704 	dmp->dm_ctdata.cts_flags = 0;
705 	dmp->dm_ctdata.cts_data = NULL;
706 	dmp->dm_ctdata.cts_size = 0;
707 	dmp->dm_ctdata.cts_entsize = 0;
708 	dmp->dm_ctdata.cts_offset = 0;
709 
710 	dmp->dm_symtab.cts_name = ".symtab";
711 	dmp->dm_symtab.cts_type = SHT_SYMTAB;
712 	dmp->dm_symtab.cts_flags = 0;
713 	dmp->dm_symtab.cts_data = NULL;
714 	dmp->dm_symtab.cts_size = 0;
715 	dmp->dm_symtab.cts_entsize = dmp->dm_ops == &dt_modops_64 ?
716 	    sizeof (Elf64_Sym) : sizeof (Elf32_Sym);
717 	dmp->dm_symtab.cts_offset = 0;
718 
719 	dmp->dm_strtab.cts_name = ".strtab";
720 	dmp->dm_strtab.cts_type = SHT_STRTAB;
721 	dmp->dm_strtab.cts_flags = 0;
722 	dmp->dm_strtab.cts_data = NULL;
723 	dmp->dm_strtab.cts_size = 0;
724 	dmp->dm_strtab.cts_entsize = 0;
725 	dmp->dm_strtab.cts_offset = 0;
726 
727 	/*
728 	 * Attempt to load the module's CTF section, symbol table section, and
729 	 * string table section.  Note that modules may not contain CTF data:
730 	 * this will result in a successful load_sect but data of size zero.
731 	 * We will then fail if dt_module_getctf() is called, as shown below.
732 	 */
733 	if (dt_module_load_sect(dtp, dmp, &dmp->dm_ctdata) == -1 ||
734 	    dt_module_load_sect(dtp, dmp, &dmp->dm_symtab) == -1 ||
735 	    dt_module_load_sect(dtp, dmp, &dmp->dm_strtab) == -1) {
736 		dt_module_unload(dtp, dmp);
737 		return (-1); /* dt_errno is set for us */
738 	}
739 
740 	/*
741 	 * Allocate the hash chains and hash buckets for symbol name lookup.
742 	 * This is relatively simple since the symbol table is of fixed size
743 	 * and is known in advance.  We allocate one extra element since we
744 	 * use element indices instead of pointers and zero is our sentinel.
745 	 */
746 	dmp->dm_nsymelems =
747 	    dmp->dm_symtab.cts_size / dmp->dm_symtab.cts_entsize;
748 
749 	dmp->dm_nsymbuckets = _dtrace_strbuckets;
750 	dmp->dm_symfree = 1;		/* first free element is index 1 */
751 
752 	dmp->dm_symbuckets = malloc(sizeof (uint_t) * dmp->dm_nsymbuckets);
753 	dmp->dm_symchains = malloc(sizeof (dt_sym_t) * dmp->dm_nsymelems + 1);
754 
755 	if (dmp->dm_symbuckets == NULL || dmp->dm_symchains == NULL) {
756 		dt_module_unload(dtp, dmp);
757 		return (dt_set_errno(dtp, EDT_NOMEM));
758 	}
759 
760 	bzero(dmp->dm_symbuckets, sizeof (uint_t) * dmp->dm_nsymbuckets);
761 	bzero(dmp->dm_symchains, sizeof (dt_sym_t) * dmp->dm_nsymelems + 1);
762 
763 	/*
764 	 * Iterate over the symbol table data buffer and insert each symbol
765 	 * name into the name hash if the name and type are valid.  Then
766 	 * allocate the address map, fill it in, and sort it.
767 	 */
768 	dmp->dm_asrsv = dmp->dm_ops->do_syminit(dmp);
769 
770 	dt_dprintf("hashed %s [%s] (%u symbols)\n",
771 	    dmp->dm_name, dmp->dm_symtab.cts_name, dmp->dm_symfree - 1);
772 
773 	if ((dmp->dm_asmap = malloc(sizeof (void *) * dmp->dm_asrsv)) == NULL) {
774 		dt_module_unload(dtp, dmp);
775 		return (dt_set_errno(dtp, EDT_NOMEM));
776 	}
777 
778 	dmp->dm_ops->do_symsort(dmp);
779 
780 	dt_dprintf("sorted %s [%s] (%u symbols)\n",
781 	    dmp->dm_name, dmp->dm_symtab.cts_name, dmp->dm_aslen);
782 
783 	dmp->dm_flags |= DT_DM_LOADED;
784 	return (0);
785 }
786 
787 int
788 dt_module_hasctf(dtrace_hdl_t *dtp, dt_module_t *dmp)
789 {
790 	if (dmp->dm_pid != 0 && dmp->dm_nctflibs > 0)
791 		return (1);
792 	return (dt_module_getctf(dtp, dmp) != NULL);
793 }
794 
795 ctf_file_t *
796 dt_module_getctf(dtrace_hdl_t *dtp, dt_module_t *dmp)
797 {
798 	const char *parent;
799 	dt_module_t *pmp;
800 	ctf_file_t *pfp;
801 	int model;
802 
803 	if (dmp->dm_ctfp != NULL || dt_module_load(dtp, dmp) != 0)
804 		return (dmp->dm_ctfp);
805 
806 	if (dmp->dm_ops == &dt_modops_64)
807 		model = CTF_MODEL_LP64;
808 	else
809 		model = CTF_MODEL_ILP32;
810 
811 	/*
812 	 * If the data model of the module does not match our program data
813 	 * model, then do not permit CTF from this module to be opened and
814 	 * returned to the compiler.  If we support mixed data models in the
815 	 * future for combined kernel/user tracing, this can be removed.
816 	 */
817 	if (dtp->dt_conf.dtc_ctfmodel != model) {
818 		(void) dt_set_errno(dtp, EDT_DATAMODEL);
819 		return (NULL);
820 	}
821 
822 	if (dmp->dm_ctdata.cts_size == 0) {
823 		(void) dt_set_errno(dtp, EDT_NOCTF);
824 		return (NULL);
825 	}
826 
827 	dmp->dm_ctfp = ctf_bufopen(&dmp->dm_ctdata,
828 	    &dmp->dm_symtab, &dmp->dm_strtab, &dtp->dt_ctferr);
829 
830 	if (dmp->dm_ctfp == NULL) {
831 		(void) dt_set_errno(dtp, EDT_CTF);
832 		return (NULL);
833 	}
834 
835 	(void) ctf_setmodel(dmp->dm_ctfp, model);
836 	ctf_setspecific(dmp->dm_ctfp, dmp);
837 
838 	if ((parent = ctf_parent_name(dmp->dm_ctfp)) != NULL) {
839 		if ((pmp = dt_module_create(dtp, parent)) == NULL ||
840 		    (pfp = dt_module_getctf(dtp, pmp)) == NULL) {
841 			if (pmp == NULL)
842 				(void) dt_set_errno(dtp, EDT_NOMEM);
843 			goto err;
844 		}
845 
846 		if (ctf_import(dmp->dm_ctfp, pfp) == CTF_ERR) {
847 			dtp->dt_ctferr = ctf_errno(dmp->dm_ctfp);
848 			(void) dt_set_errno(dtp, EDT_CTF);
849 			goto err;
850 		}
851 	}
852 
853 	dt_dprintf("loaded CTF container for %s (%p)\n",
854 	    dmp->dm_name, (void *)dmp->dm_ctfp);
855 
856 	return (dmp->dm_ctfp);
857 
858 err:
859 	ctf_close(dmp->dm_ctfp);
860 	dmp->dm_ctfp = NULL;
861 	return (NULL);
862 }
863 
864 /*ARGSUSED*/
865 void
866 dt_module_unload(dtrace_hdl_t *dtp, dt_module_t *dmp)
867 {
868 	int i;
869 
870 	ctf_close(dmp->dm_ctfp);
871 	dmp->dm_ctfp = NULL;
872 
873 	if (dmp->dm_libctfp != NULL) {
874 		for (i = 0; i < dmp->dm_nctflibs; i++) {
875 			ctf_close(dmp->dm_libctfp[i]);
876 			free(dmp->dm_libctfn[i]);
877 		}
878 		free(dmp->dm_libctfp);
879 		free(dmp->dm_libctfn);
880 		dmp->dm_libctfp = NULL;
881 		dmp->dm_nctflibs = 0;
882 	}
883 
884 	bzero(&dmp->dm_ctdata, sizeof (ctf_sect_t));
885 	bzero(&dmp->dm_symtab, sizeof (ctf_sect_t));
886 	bzero(&dmp->dm_strtab, sizeof (ctf_sect_t));
887 
888 	if (dmp->dm_symbuckets != NULL) {
889 		free(dmp->dm_symbuckets);
890 		dmp->dm_symbuckets = NULL;
891 	}
892 
893 	if (dmp->dm_symchains != NULL) {
894 		free(dmp->dm_symchains);
895 		dmp->dm_symchains = NULL;
896 	}
897 
898 	if (dmp->dm_asmap != NULL) {
899 		free(dmp->dm_asmap);
900 		dmp->dm_asmap = NULL;
901 	}
902 
903 	dmp->dm_symfree = 0;
904 	dmp->dm_nsymbuckets = 0;
905 	dmp->dm_nsymelems = 0;
906 	dmp->dm_asrsv = 0;
907 	dmp->dm_aslen = 0;
908 
909 	dmp->dm_text_va = 0;
910 	dmp->dm_text_size = 0;
911 	dmp->dm_data_va = 0;
912 	dmp->dm_data_size = 0;
913 	dmp->dm_bss_va = 0;
914 	dmp->dm_bss_size = 0;
915 
916 	if (dmp->dm_extern != NULL) {
917 		dt_idhash_destroy(dmp->dm_extern);
918 		dmp->dm_extern = NULL;
919 	}
920 
921 	(void) elf_end(dmp->dm_elf);
922 	dmp->dm_elf = NULL;
923 
924 	dmp->dm_pid = 0;
925 
926 	dmp->dm_flags &= ~DT_DM_LOADED;
927 }
928 
929 void
930 dt_module_destroy(dtrace_hdl_t *dtp, dt_module_t *dmp)
931 {
932 	uint_t h = dt_strtab_hash(dmp->dm_name, NULL) % dtp->dt_modbuckets;
933 	dt_module_t **dmpp = &dtp->dt_mods[h];
934 
935 	dt_list_delete(&dtp->dt_modlist, dmp);
936 	assert(dtp->dt_nmods != 0);
937 	dtp->dt_nmods--;
938 
939 	/*
940 	 * Now remove this module from its hash chain.  We expect to always
941 	 * find the module on its hash chain, so in this loop we assert that
942 	 * we don't run off the end of the list.
943 	 */
944 	while (*dmpp != dmp) {
945 		dmpp = &((*dmpp)->dm_next);
946 		assert(*dmpp != NULL);
947 	}
948 
949 	*dmpp = dmp->dm_next;
950 
951 	dt_module_unload(dtp, dmp);
952 	free(dmp);
953 }
954 
955 /*
956  * Insert a new external symbol reference into the specified module.  The new
957  * symbol will be marked as undefined and is assigned a symbol index beyond
958  * any existing cached symbols from this module.  We use the ident's di_data
959  * field to store a pointer to a copy of the dtrace_syminfo_t for this symbol.
960  */
961 dt_ident_t *
962 dt_module_extern(dtrace_hdl_t *dtp, dt_module_t *dmp,
963     const char *name, const dtrace_typeinfo_t *tip)
964 {
965 	dtrace_syminfo_t *sip;
966 	dt_ident_t *idp;
967 	uint_t id;
968 
969 	if (dmp->dm_extern == NULL && (dmp->dm_extern = dt_idhash_create(
970 	    "extern", NULL, dmp->dm_nsymelems, UINT_MAX)) == NULL) {
971 		(void) dt_set_errno(dtp, EDT_NOMEM);
972 		return (NULL);
973 	}
974 
975 	if (dt_idhash_nextid(dmp->dm_extern, &id) == -1) {
976 		(void) dt_set_errno(dtp, EDT_SYMOFLOW);
977 		return (NULL);
978 	}
979 
980 	if ((sip = malloc(sizeof (dtrace_syminfo_t))) == NULL) {
981 		(void) dt_set_errno(dtp, EDT_NOMEM);
982 		return (NULL);
983 	}
984 
985 	idp = dt_idhash_insert(dmp->dm_extern, name, DT_IDENT_SYMBOL, 0, id,
986 	    _dtrace_symattr, 0, &dt_idops_thaw, NULL, dtp->dt_gen);
987 
988 	if (idp == NULL) {
989 		(void) dt_set_errno(dtp, EDT_NOMEM);
990 		free(sip);
991 		return (NULL);
992 	}
993 
994 	sip->dts_object = dmp->dm_name;
995 	sip->dts_name = idp->di_name;
996 	sip->dts_id = idp->di_id;
997 
998 	idp->di_data = sip;
999 	idp->di_ctfp = tip->dtt_ctfp;
1000 	idp->di_type = tip->dtt_type;
1001 
1002 	return (idp);
1003 }
1004 
1005 const char *
1006 dt_module_modelname(dt_module_t *dmp)
1007 {
1008 	if (dmp->dm_ops == &dt_modops_64)
1009 		return ("64-bit");
1010 	else
1011 		return ("32-bit");
1012 }
1013 
1014 /* ARGSUSED */
1015 int
1016 dt_module_getlibid(dtrace_hdl_t *dtp, dt_module_t *dmp, const ctf_file_t *fp)
1017 {
1018 	int i;
1019 
1020 	for (i = 0; i < dmp->dm_nctflibs; i++) {
1021 		if (dmp->dm_libctfp[i] == fp)
1022 			return (i);
1023 	}
1024 
1025 	return (-1);
1026 }
1027 
1028 /* ARGSUSED */
1029 ctf_file_t *
1030 dt_module_getctflib(dtrace_hdl_t *dtp, dt_module_t *dmp, const char *name)
1031 {
1032 	int i;
1033 
1034 	for (i = 0; i < dmp->dm_nctflibs; i++) {
1035 		if (strcmp(dmp->dm_libctfn[i], name) == 0)
1036 			return (dmp->dm_libctfp[i]);
1037 	}
1038 
1039 	return (NULL);
1040 }
1041 
1042 /*
1043  * Update our module cache by adding an entry for the specified module 'name'.
1044  * We create the dt_module_t and populate it using /system/object/<name>/.
1045  */
1046 static void
1047 dt_module_update(dtrace_hdl_t *dtp, const char *name)
1048 {
1049 	char fname[MAXPATHLEN];
1050 	struct stat64 st;
1051 	int fd, err, bits;
1052 
1053 	dt_module_t *dmp;
1054 	const char *s;
1055 	size_t shstrs;
1056 	GElf_Shdr sh;
1057 	Elf_Data *dp;
1058 	Elf_Scn *sp;
1059 
1060 	(void) snprintf(fname, sizeof (fname),
1061 	    "%s/%s/object", OBJFS_ROOT, name);
1062 
1063 	if ((fd = open(fname, O_RDONLY)) == -1 || fstat64(fd, &st) == -1 ||
1064 	    (dmp = dt_module_create(dtp, name)) == NULL) {
1065 		dt_dprintf("failed to open %s: %s\n", fname, strerror(errno));
1066 		(void) close(fd);
1067 		return;
1068 	}
1069 
1070 	/*
1071 	 * Since the module can unload out from under us (and /system/object
1072 	 * will return ENOENT), tell libelf to cook the entire file now and
1073 	 * then close the underlying file descriptor immediately.  If this
1074 	 * succeeds, we know that we can continue safely using dmp->dm_elf.
1075 	 */
1076 	dmp->dm_elf = elf_begin(fd, ELF_C_READ, NULL);
1077 	err = elf_cntl(dmp->dm_elf, ELF_C_FDREAD);
1078 	(void) close(fd);
1079 
1080 	if (dmp->dm_elf == NULL || err == -1 ||
1081 	    elf_getshdrstrndx(dmp->dm_elf, &shstrs) == -1) {
1082 		dt_dprintf("failed to load %s: %s\n",
1083 		    fname, elf_errmsg(elf_errno()));
1084 		dt_module_destroy(dtp, dmp);
1085 		return;
1086 	}
1087 
1088 	switch (gelf_getclass(dmp->dm_elf)) {
1089 	case ELFCLASS32:
1090 		dmp->dm_ops = &dt_modops_32;
1091 		bits = 32;
1092 		break;
1093 	case ELFCLASS64:
1094 		dmp->dm_ops = &dt_modops_64;
1095 		bits = 64;
1096 		break;
1097 	default:
1098 		dt_dprintf("failed to load %s: unknown ELF class\n", fname);
1099 		dt_module_destroy(dtp, dmp);
1100 		return;
1101 	}
1102 
1103 	/*
1104 	 * Iterate over the section headers locating various sections of
1105 	 * interest and use their attributes to flesh out the dt_module_t.
1106 	 */
1107 	for (sp = NULL; (sp = elf_nextscn(dmp->dm_elf, sp)) != NULL; ) {
1108 		if (gelf_getshdr(sp, &sh) == NULL || sh.sh_type == SHT_NULL ||
1109 		    (s = elf_strptr(dmp->dm_elf, shstrs, sh.sh_name)) == NULL)
1110 			continue; /* skip any malformed sections */
1111 
1112 		if (strcmp(s, ".text") == 0) {
1113 			dmp->dm_text_size = sh.sh_size;
1114 			dmp->dm_text_va = sh.sh_addr;
1115 		} else if (strcmp(s, ".data") == 0) {
1116 			dmp->dm_data_size = sh.sh_size;
1117 			dmp->dm_data_va = sh.sh_addr;
1118 		} else if (strcmp(s, ".bss") == 0) {
1119 			dmp->dm_bss_size = sh.sh_size;
1120 			dmp->dm_bss_va = sh.sh_addr;
1121 		} else if (strcmp(s, ".info") == 0 &&
1122 		    (dp = elf_getdata(sp, NULL)) != NULL) {
1123 			bcopy(dp->d_buf, &dmp->dm_info,
1124 			    MIN(sh.sh_size, sizeof (dmp->dm_info)));
1125 		} else if (strcmp(s, ".filename") == 0 &&
1126 		    (dp = elf_getdata(sp, NULL)) != NULL) {
1127 			(void) strlcpy(dmp->dm_file,
1128 			    dp->d_buf, sizeof (dmp->dm_file));
1129 		}
1130 	}
1131 
1132 	dmp->dm_flags |= DT_DM_KERNEL;
1133 	dmp->dm_modid = (int)OBJFS_MODID(st.st_ino);
1134 
1135 	if (dmp->dm_info.objfs_info_primary)
1136 		dmp->dm_flags |= DT_DM_PRIMARY;
1137 
1138 	dt_dprintf("opened %d-bit module %s (%s) [%d]\n",
1139 	    bits, dmp->dm_name, dmp->dm_file, dmp->dm_modid);
1140 }
1141 
1142 /*
1143  * Unload all the loaded modules and then refresh the module cache with the
1144  * latest list of loaded modules and their address ranges.
1145  */
1146 void
1147 dtrace_update(dtrace_hdl_t *dtp)
1148 {
1149 	dt_module_t *dmp;
1150 	DIR *dirp;
1151 
1152 	for (dmp = dt_list_next(&dtp->dt_modlist);
1153 	    dmp != NULL; dmp = dt_list_next(dmp))
1154 		dt_module_unload(dtp, dmp);
1155 
1156 	/*
1157 	 * Open /system/object and attempt to create a libdtrace module for
1158 	 * each kernel module that is loaded on the current system.
1159 	 */
1160 	if (!(dtp->dt_oflags & DTRACE_O_NOSYS) &&
1161 	    (dirp = opendir(OBJFS_ROOT)) != NULL) {
1162 		struct dirent *dp;
1163 
1164 		while ((dp = readdir(dirp)) != NULL) {
1165 			if (dp->d_name[0] != '.')
1166 				dt_module_update(dtp, dp->d_name);
1167 		}
1168 
1169 		(void) closedir(dirp);
1170 	}
1171 
1172 	/*
1173 	 * Look up all the macro identifiers and set di_id to the latest value.
1174 	 * This code collaborates with dt_lex.l on the use of di_id.  We will
1175 	 * need to implement something fancier if we need to support non-ints.
1176 	 */
1177 	dt_idhash_lookup(dtp->dt_macros, "egid")->di_id = getegid();
1178 	dt_idhash_lookup(dtp->dt_macros, "euid")->di_id = geteuid();
1179 	dt_idhash_lookup(dtp->dt_macros, "gid")->di_id = getgid();
1180 	dt_idhash_lookup(dtp->dt_macros, "pid")->di_id = getpid();
1181 	dt_idhash_lookup(dtp->dt_macros, "pgid")->di_id = getpgid(0);
1182 	dt_idhash_lookup(dtp->dt_macros, "ppid")->di_id = getppid();
1183 	dt_idhash_lookup(dtp->dt_macros, "projid")->di_id = getprojid();
1184 	dt_idhash_lookup(dtp->dt_macros, "sid")->di_id = getsid(0);
1185 	dt_idhash_lookup(dtp->dt_macros, "taskid")->di_id = gettaskid();
1186 	dt_idhash_lookup(dtp->dt_macros, "uid")->di_id = getuid();
1187 
1188 	/*
1189 	 * Cache the pointers to the modules representing the base executable
1190 	 * and the run-time linker in the dtrace client handle. Note that on
1191 	 * x86 krtld is folded into unix, so if we don't find it, use unix
1192 	 * instead.
1193 	 */
1194 	dtp->dt_exec = dt_module_lookup_by_name(dtp, "genunix");
1195 	dtp->dt_rtld = dt_module_lookup_by_name(dtp, "krtld");
1196 	if (dtp->dt_rtld == NULL)
1197 		dtp->dt_rtld = dt_module_lookup_by_name(dtp, "unix");
1198 
1199 	/*
1200 	 * If this is the first time we are initializing the module list,
1201 	 * remove the module for genunix from the module list and then move it
1202 	 * to the front of the module list.  We do this so that type and symbol
1203 	 * queries encounter genunix and thereby optimize for the common case
1204 	 * in dtrace_lookup_by_name() and dtrace_lookup_by_type(), below.
1205 	 */
1206 	if (dtp->dt_exec != NULL &&
1207 	    dtp->dt_cdefs == NULL && dtp->dt_ddefs == NULL) {
1208 		dt_list_delete(&dtp->dt_modlist, dtp->dt_exec);
1209 		dt_list_prepend(&dtp->dt_modlist, dtp->dt_exec);
1210 	}
1211 }
1212 
1213 static dt_module_t *
1214 dt_module_from_object(dtrace_hdl_t *dtp, const char *object)
1215 {
1216 	int err = EDT_NOMOD;
1217 	dt_module_t *dmp;
1218 
1219 	switch ((uintptr_t)object) {
1220 	case (uintptr_t)DTRACE_OBJ_EXEC:
1221 		dmp = dtp->dt_exec;
1222 		break;
1223 	case (uintptr_t)DTRACE_OBJ_RTLD:
1224 		dmp = dtp->dt_rtld;
1225 		break;
1226 	case (uintptr_t)DTRACE_OBJ_CDEFS:
1227 		dmp = dtp->dt_cdefs;
1228 		break;
1229 	case (uintptr_t)DTRACE_OBJ_DDEFS:
1230 		dmp = dtp->dt_ddefs;
1231 		break;
1232 	default:
1233 		dmp = dt_module_create(dtp, object);
1234 		err = EDT_NOMEM;
1235 	}
1236 
1237 	if (dmp == NULL)
1238 		(void) dt_set_errno(dtp, err);
1239 
1240 	return (dmp);
1241 }
1242 
1243 /*
1244  * Exported interface to look up a symbol by name.  We return the GElf_Sym and
1245  * complete symbol information for the matching symbol.
1246  */
1247 int
1248 dtrace_lookup_by_name(dtrace_hdl_t *dtp, const char *object, const char *name,
1249     GElf_Sym *symp, dtrace_syminfo_t *sip)
1250 {
1251 	dt_module_t *dmp;
1252 	dt_ident_t *idp;
1253 	uint_t n, id;
1254 	GElf_Sym sym;
1255 
1256 	uint_t mask = 0; /* mask of dt_module flags to match */
1257 	uint_t bits = 0; /* flag bits that must be present */
1258 
1259 	if (object != DTRACE_OBJ_EVERY &&
1260 	    object != DTRACE_OBJ_KMODS &&
1261 	    object != DTRACE_OBJ_UMODS) {
1262 		if ((dmp = dt_module_from_object(dtp, object)) == NULL)
1263 			return (-1); /* dt_errno is set for us */
1264 
1265 		if (dt_module_load(dtp, dmp) == -1)
1266 			return (-1); /* dt_errno is set for us */
1267 		n = 1;
1268 
1269 	} else {
1270 		if (object == DTRACE_OBJ_KMODS)
1271 			mask = bits = DT_DM_KERNEL;
1272 		else if (object == DTRACE_OBJ_UMODS)
1273 			mask = DT_DM_KERNEL;
1274 
1275 		dmp = dt_list_next(&dtp->dt_modlist);
1276 		n = dtp->dt_nmods;
1277 	}
1278 
1279 	if (symp == NULL)
1280 		symp = &sym;
1281 
1282 	for (; n > 0; n--, dmp = dt_list_next(dmp)) {
1283 		if ((dmp->dm_flags & mask) != bits)
1284 			continue; /* failed to match required attributes */
1285 
1286 		if (dt_module_load(dtp, dmp) == -1)
1287 			continue; /* failed to load symbol table */
1288 
1289 		if (dmp->dm_ops->do_symname(dmp, name, symp, &id) != NULL) {
1290 			if (sip != NULL) {
1291 				sip->dts_object = dmp->dm_name;
1292 				sip->dts_name = (const char *)
1293 				    dmp->dm_strtab.cts_data + symp->st_name;
1294 				sip->dts_id = id;
1295 			}
1296 			return (0);
1297 		}
1298 
1299 		if (dmp->dm_extern != NULL &&
1300 		    (idp = dt_idhash_lookup(dmp->dm_extern, name)) != NULL) {
1301 			if (symp != &sym) {
1302 				symp->st_name = (uintptr_t)idp->di_name;
1303 				symp->st_info =
1304 				    GELF_ST_INFO(STB_GLOBAL, STT_NOTYPE);
1305 				symp->st_other = 0;
1306 				symp->st_shndx = SHN_UNDEF;
1307 				symp->st_value = 0;
1308 				symp->st_size =
1309 				    ctf_type_size(idp->di_ctfp, idp->di_type);
1310 			}
1311 
1312 			if (sip != NULL) {
1313 				sip->dts_object = dmp->dm_name;
1314 				sip->dts_name = idp->di_name;
1315 				sip->dts_id = idp->di_id;
1316 			}
1317 
1318 			return (0);
1319 		}
1320 	}
1321 
1322 	return (dt_set_errno(dtp, EDT_NOSYM));
1323 }
1324 
1325 /*
1326  * Exported interface to look up a symbol by address.  We return the GElf_Sym
1327  * and complete symbol information for the matching symbol.
1328  */
1329 int
1330 dtrace_lookup_by_addr(dtrace_hdl_t *dtp, GElf_Addr addr,
1331     GElf_Sym *symp, dtrace_syminfo_t *sip)
1332 {
1333 	dt_module_t *dmp;
1334 	uint_t id;
1335 	const dtrace_vector_t *v = dtp->dt_vector;
1336 
1337 	if (v != NULL)
1338 		return (v->dtv_lookup_by_addr(dtp->dt_varg, addr, symp, sip));
1339 
1340 	for (dmp = dt_list_next(&dtp->dt_modlist); dmp != NULL;
1341 	    dmp = dt_list_next(dmp)) {
1342 		if (addr - dmp->dm_text_va < dmp->dm_text_size ||
1343 		    addr - dmp->dm_data_va < dmp->dm_data_size ||
1344 		    addr - dmp->dm_bss_va < dmp->dm_bss_size)
1345 			break;
1346 	}
1347 
1348 	if (dmp == NULL)
1349 		return (dt_set_errno(dtp, EDT_NOSYMADDR));
1350 
1351 	if (dt_module_load(dtp, dmp) == -1)
1352 		return (-1); /* dt_errno is set for us */
1353 
1354 	if (symp != NULL) {
1355 		if (dmp->dm_ops->do_symaddr(dmp, addr, symp, &id) == NULL)
1356 			return (dt_set_errno(dtp, EDT_NOSYMADDR));
1357 	}
1358 
1359 	if (sip != NULL) {
1360 		sip->dts_object = dmp->dm_name;
1361 
1362 		if (symp != NULL) {
1363 			sip->dts_name = (const char *)
1364 			    dmp->dm_strtab.cts_data + symp->st_name;
1365 			sip->dts_id = id;
1366 		} else {
1367 			sip->dts_name = NULL;
1368 			sip->dts_id = 0;
1369 		}
1370 	}
1371 
1372 	return (0);
1373 }
1374 
1375 int
1376 dtrace_lookup_by_type(dtrace_hdl_t *dtp, const char *object, const char *name,
1377     dtrace_typeinfo_t *tip)
1378 {
1379 	dtrace_typeinfo_t ti;
1380 	dt_module_t *dmp;
1381 	int found = 0;
1382 	ctf_id_t id;
1383 	uint_t n, i;
1384 	int justone;
1385 	ctf_file_t *fp;
1386 	char *buf, *p, *q;
1387 
1388 	uint_t mask = 0; /* mask of dt_module flags to match */
1389 	uint_t bits = 0; /* flag bits that must be present */
1390 
1391 	if (object != DTRACE_OBJ_EVERY &&
1392 	    object != DTRACE_OBJ_KMODS &&
1393 	    object != DTRACE_OBJ_UMODS) {
1394 		if ((dmp = dt_module_from_object(dtp, object)) == NULL)
1395 			return (-1); /* dt_errno is set for us */
1396 
1397 		if (dt_module_load(dtp, dmp) == -1)
1398 			return (-1); /* dt_errno is set for us */
1399 		n = 1;
1400 		justone = 1;
1401 	} else {
1402 		if (object == DTRACE_OBJ_KMODS)
1403 			mask = bits = DT_DM_KERNEL;
1404 		else if (object == DTRACE_OBJ_UMODS)
1405 			mask = DT_DM_KERNEL;
1406 
1407 		dmp = dt_list_next(&dtp->dt_modlist);
1408 		n = dtp->dt_nmods;
1409 		justone = 0;
1410 	}
1411 
1412 	if (tip == NULL)
1413 		tip = &ti;
1414 
1415 	for (; n > 0; n--, dmp = dt_list_next(dmp)) {
1416 		if ((dmp->dm_flags & mask) != bits)
1417 			continue; /* failed to match required attributes */
1418 
1419 		/*
1420 		 * If we can't load the CTF container, continue on to the next
1421 		 * module.  If our search was scoped to only one module then
1422 		 * return immediately leaving dt_errno unmodified.
1423 		 */
1424 		if (dt_module_hasctf(dtp, dmp) == 0) {
1425 			if (justone)
1426 				return (-1);
1427 			continue;
1428 		}
1429 
1430 		/*
1431 		 * Look up the type in the module's CTF container.  If our
1432 		 * match is a forward declaration tag, save this choice in
1433 		 * 'tip' and keep going in the hope that we will locate the
1434 		 * underlying structure definition.  Otherwise just return.
1435 		 */
1436 		if (dmp->dm_pid == 0) {
1437 			id = ctf_lookup_by_name(dmp->dm_ctfp, name);
1438 			fp = dmp->dm_ctfp;
1439 		} else {
1440 			if ((p = strchr(name, '`')) != NULL) {
1441 				buf = strdup(name);
1442 				if (buf == NULL)
1443 					return (dt_set_errno(dtp, EDT_NOMEM));
1444 				p = strchr(buf, '`');
1445 				if ((q = strchr(p + 1, '`')) != NULL)
1446 					p = q;
1447 				*p = '\0';
1448 				fp = dt_module_getctflib(dtp, dmp, buf);
1449 				if (fp == NULL || (id = ctf_lookup_by_name(fp,
1450 				    p + 1)) == CTF_ERR)
1451 					id = CTF_ERR;
1452 				free(buf);
1453 			} else {
1454 				for (i = 0; i < dmp->dm_nctflibs; i++) {
1455 					fp = dmp->dm_libctfp[i];
1456 					id = ctf_lookup_by_name(fp, name);
1457 					if (id != CTF_ERR)
1458 						break;
1459 				}
1460 			}
1461 		}
1462 		if (id != CTF_ERR) {
1463 			tip->dtt_object = dmp->dm_name;
1464 			tip->dtt_ctfp = fp;
1465 			tip->dtt_type = id;
1466 			if (ctf_type_kind(fp, ctf_type_resolve(fp, id)) !=
1467 			    CTF_K_FORWARD)
1468 				return (0);
1469 
1470 			found++;
1471 		}
1472 	}
1473 
1474 	if (found == 0)
1475 		return (dt_set_errno(dtp, EDT_NOTYPE));
1476 
1477 	return (0);
1478 }
1479 
1480 int
1481 dtrace_symbol_type(dtrace_hdl_t *dtp, const GElf_Sym *symp,
1482     const dtrace_syminfo_t *sip, dtrace_typeinfo_t *tip)
1483 {
1484 	dt_module_t *dmp;
1485 
1486 	tip->dtt_object = NULL;
1487 	tip->dtt_ctfp = NULL;
1488 	tip->dtt_type = CTF_ERR;
1489 	tip->dtt_flags = 0;
1490 
1491 	if ((dmp = dt_module_lookup_by_name(dtp, sip->dts_object)) == NULL)
1492 		return (dt_set_errno(dtp, EDT_NOMOD));
1493 
1494 	if (symp->st_shndx == SHN_UNDEF && dmp->dm_extern != NULL) {
1495 		dt_ident_t *idp =
1496 		    dt_idhash_lookup(dmp->dm_extern, sip->dts_name);
1497 
1498 		if (idp == NULL)
1499 			return (dt_set_errno(dtp, EDT_NOSYM));
1500 
1501 		tip->dtt_ctfp = idp->di_ctfp;
1502 		tip->dtt_type = idp->di_type;
1503 
1504 	} else if (GELF_ST_TYPE(symp->st_info) != STT_FUNC) {
1505 		if (dt_module_getctf(dtp, dmp) == NULL)
1506 			return (-1); /* errno is set for us */
1507 
1508 		tip->dtt_ctfp = dmp->dm_ctfp;
1509 		tip->dtt_type = ctf_lookup_by_symbol(dmp->dm_ctfp, sip->dts_id);
1510 
1511 		if (tip->dtt_type == CTF_ERR) {
1512 			dtp->dt_ctferr = ctf_errno(tip->dtt_ctfp);
1513 			return (dt_set_errno(dtp, EDT_CTF));
1514 		}
1515 
1516 	} else {
1517 		tip->dtt_ctfp = DT_FPTR_CTFP(dtp);
1518 		tip->dtt_type = DT_FPTR_TYPE(dtp);
1519 	}
1520 
1521 	tip->dtt_object = dmp->dm_name;
1522 	return (0);
1523 }
1524 
1525 static dtrace_objinfo_t *
1526 dt_module_info(const dt_module_t *dmp, dtrace_objinfo_t *dto)
1527 {
1528 	dto->dto_name = dmp->dm_name;
1529 	dto->dto_file = dmp->dm_file;
1530 	dto->dto_id = dmp->dm_modid;
1531 	dto->dto_flags = 0;
1532 
1533 	if (dmp->dm_flags & DT_DM_KERNEL)
1534 		dto->dto_flags |= DTRACE_OBJ_F_KERNEL;
1535 	if (dmp->dm_flags & DT_DM_PRIMARY)
1536 		dto->dto_flags |= DTRACE_OBJ_F_PRIMARY;
1537 
1538 	dto->dto_text_va = dmp->dm_text_va;
1539 	dto->dto_text_size = dmp->dm_text_size;
1540 	dto->dto_data_va = dmp->dm_data_va;
1541 	dto->dto_data_size = dmp->dm_data_size;
1542 	dto->dto_bss_va = dmp->dm_bss_va;
1543 	dto->dto_bss_size = dmp->dm_bss_size;
1544 
1545 	return (dto);
1546 }
1547 
1548 int
1549 dtrace_object_iter(dtrace_hdl_t *dtp, dtrace_obj_f *func, void *data)
1550 {
1551 	const dt_module_t *dmp = dt_list_next(&dtp->dt_modlist);
1552 	dtrace_objinfo_t dto;
1553 	int rv;
1554 
1555 	for (; dmp != NULL; dmp = dt_list_next(dmp)) {
1556 		if ((rv = (*func)(dtp, dt_module_info(dmp, &dto), data)) != 0)
1557 			return (rv);
1558 	}
1559 
1560 	return (0);
1561 }
1562 
1563 int
1564 dtrace_object_info(dtrace_hdl_t *dtp, const char *object, dtrace_objinfo_t *dto)
1565 {
1566 	dt_module_t *dmp;
1567 
1568 	if (object == DTRACE_OBJ_EVERY || object == DTRACE_OBJ_KMODS ||
1569 	    object == DTRACE_OBJ_UMODS || dto == NULL)
1570 		return (dt_set_errno(dtp, EINVAL));
1571 
1572 	if ((dmp = dt_module_from_object(dtp, object)) == NULL)
1573 		return (-1); /* dt_errno is set for us */
1574 
1575 	if (dt_module_load(dtp, dmp) == -1)
1576 		return (-1); /* dt_errno is set for us */
1577 
1578 	(void) dt_module_info(dmp, dto);
1579 	return (0);
1580 }
1581