xref: /linux/tools/bpf/resolve_btfids/main.c (revision d1b803f4ca4f25d6f171219d039f9410a10b29ee)
1 // SPDX-License-Identifier: (LGPL-2.1 OR BSD-2-Clause)
2 
3 /*
4  * resolve_btfids scans Elf object for .BTF_ids section and resolves
5  * its symbols with BTF ID values.
6  *
7  * Each symbol points to 4 bytes data and is expected to have
8  * following name syntax:
9  *
10  * __BTF_ID__<type>__<symbol>[__<id>]
11  *
12  * type is:
13  *
14  *   func    - lookup BTF_KIND_FUNC symbol with <symbol> name
15  *             and store its ID into the data:
16  *
17  *             __BTF_ID__func__vfs_close__1:
18  *             .zero 4
19  *
20  *   struct  - lookup BTF_KIND_STRUCT symbol with <symbol> name
21  *             and store its ID into the data:
22  *
23  *             __BTF_ID__struct__sk_buff__1:
24  *             .zero 4
25  *
26  *   union   - lookup BTF_KIND_UNION symbol with <symbol> name
27  *             and store its ID into the data:
28  *
29  *             __BTF_ID__union__thread_union__1:
30  *             .zero 4
31  *
32  *   typedef - lookup BTF_KIND_TYPEDEF symbol with <symbol> name
33  *             and store its ID into the data:
34  *
35  *             __BTF_ID__typedef__pid_t__1:
36  *             .zero 4
37  *
 *   set     - store the number of IDs in the list (derived from the
 *             symbol size) into first 4 bytes and sort following
 *             ID list
40  *
41  *             __BTF_ID__set__list:
42  *             .zero 4
43  *             list:
44  *             __BTF_ID__func__vfs_getattr__3:
45  *             .zero 4
46  *             __BTF_ID__func__vfs_fallocate__4:
47  *             .zero 4
48  */
49 
50 #define  _GNU_SOURCE
51 #include <stdio.h>
52 #include <string.h>
53 #include <unistd.h>
54 #include <stdlib.h>
55 #include <libelf.h>
56 #include <gelf.h>
57 #include <sys/stat.h>
58 #include <fcntl.h>
59 #include <errno.h>
60 #include <linux/rbtree.h>
61 #include <linux/zalloc.h>
62 #include <linux/err.h>
63 #include <btf.h>
64 #include <libbpf.h>
65 #include <parse-options.h>
66 
/* Name of the ELF section whose data gets patched with BTF IDs. */
#define BTF_IDS_SECTION	".BTF_ids"
/* Prefix shared by every symbol name this tool looks at. */
#define BTF_ID		"__BTF_ID__"

/* The <type> part of a __BTF_ID__<type>__<symbol>[__<id>] symbol name. */
#define BTF_STRUCT	"struct"
#define BTF_UNION	"union"
#define BTF_TYPEDEF	"typedef"
#define BTF_FUNC	"func"
#define BTF_SET		"set"

/* Capacity of the per-name address array in struct btf_id. */
#define ADDR_CNT	100
77 
78 struct btf_id {
79 	struct rb_node	 rb_node;
80 	char		*name;
81 	union {
82 		int	 id;
83 		int	 cnt;
84 	};
85 	int		 addr_cnt;
86 	Elf64_Addr	 addr[ADDR_CNT];
87 };
88 
89 struct object {
90 	const char *path;
91 	const char *btf;
92 
93 	struct {
94 		int		 fd;
95 		Elf		*elf;
96 		Elf_Data	*symbols;
97 		Elf_Data	*idlist;
98 		int		 symbols_shndx;
99 		int		 idlist_shndx;
100 		size_t		 strtabidx;
101 		unsigned long	 idlist_addr;
102 	} efile;
103 
104 	struct rb_root	sets;
105 	struct rb_root	structs;
106 	struct rb_root	unions;
107 	struct rb_root	typedefs;
108 	struct rb_root	funcs;
109 
110 	int nr_funcs;
111 	int nr_structs;
112 	int nr_unions;
113 	int nr_typedefs;
114 };
115 
/* Verbosity level compared against each message's level by the pr_* macros. */
static int verbose;
117 
/*
 * Print a printf-style message to stderr when the current verbosity
 * 'var' reaches the message's 'level'.
 *
 * Returns whatever vfprintf() returned, or 0 when the message was
 * suppressed.
 */
static int eprintf(int level, int var, const char *fmt, ...)
{
	va_list ap;
	int printed;

	if (var < level)
		return 0;

	va_start(ap, fmt);
	printed = vfprintf(stderr, fmt, ap);
	va_end(ap);

	return printed;
}
130 
/* Hook for decorating every message format; identity unless overridden. */
#ifndef pr_fmt
#define pr_fmt(fmt) fmt
#endif

/*
 * Message helpers. The first eprintf() argument is the verbosity level
 * required for the message to be printed: pr_err/pr_info always print,
 * pr_debug needs one -v, pr_debug2 needs two.
 */
#define pr_debug(fmt, ...) \
	eprintf(1, verbose, pr_fmt(fmt), ##__VA_ARGS__)
#define pr_debugN(n, fmt, ...) \
	eprintf(n, verbose, pr_fmt(fmt), ##__VA_ARGS__)
/* pr_debugN() already applies pr_fmt(), so pass the raw format through. */
#define pr_debug2(fmt, ...) pr_debugN(2, fmt, ##__VA_ARGS__)
#define pr_err(fmt, ...) \
	eprintf(0, verbose, pr_fmt(fmt), ##__VA_ARGS__)
#define pr_info(fmt, ...) \
	eprintf(0, verbose, pr_fmt(fmt), ##__VA_ARGS__)
144 
145 static bool is_btf_id(const char *name)
146 {
147 	return name && !strncmp(name, BTF_ID, sizeof(BTF_ID) - 1);
148 }
149 
150 static struct btf_id *btf_id__find(struct rb_root *root, const char *name)
151 {
152 	struct rb_node *p = root->rb_node;
153 	struct btf_id *id;
154 	int cmp;
155 
156 	while (p) {
157 		id = rb_entry(p, struct btf_id, rb_node);
158 		cmp = strcmp(id->name, name);
159 		if (cmp < 0)
160 			p = p->rb_left;
161 		else if (cmp > 0)
162 			p = p->rb_right;
163 		else
164 			return id;
165 	}
166 	return NULL;
167 }
168 
169 static struct btf_id*
170 btf_id__add(struct rb_root *root, char *name, bool unique)
171 {
172 	struct rb_node **p = &root->rb_node;
173 	struct rb_node *parent = NULL;
174 	struct btf_id *id;
175 	int cmp;
176 
177 	while (*p != NULL) {
178 		parent = *p;
179 		id = rb_entry(parent, struct btf_id, rb_node);
180 		cmp = strcmp(id->name, name);
181 		if (cmp < 0)
182 			p = &(*p)->rb_left;
183 		else if (cmp > 0)
184 			p = &(*p)->rb_right;
185 		else
186 			return unique ? NULL : id;
187 	}
188 
189 	id = zalloc(sizeof(*id));
190 	if (id) {
191 		pr_debug("adding symbol %s\n", name);
192 		id->name = name;
193 		rb_link_node(&id->rb_node, parent, p);
194 		rb_insert_color(&id->rb_node, root);
195 	}
196 	return id;
197 }
198 
/*
 * Extract the <symbol> part out of "__<symbol>__<id>".
 *
 * prefix_end points right behind the <type> part of the symbol name:
 *
 * __BTF_ID__func__vfs_truncate__0
 * prefix_end =  ^
 * result     =    ^^^^^^^^^^^^
 *
 * The text after the last '_' is the unique id and is cut off together
 * with the "__" in front of it.
 *
 * Returns a newly allocated string the caller must free(), or NULL when
 * the name does not have the expected shape (missing leading "__",
 * missing "__<id>" suffix, empty <symbol>) or when allocation fails.
 */
static char *get_id(const char *prefix_end)
{
	const size_t sep_len = sizeof("__") - 1;
	const char *start, *last;
	size_t id_len;
	char *id;

	if (strlen(prefix_end) <= sep_len || strncmp(prefix_end, "__", sep_len))
		return NULL;

	start = prefix_end + sep_len;

	/*
	 * The last '_' must be the second character of a "__" separator
	 * and must leave at least one character of <symbol> in front of
	 * the separator. Checking the distance first guarantees last[-1]
	 * never reads before 'start'.
	 */
	last = strrchr(start, '_');
	if (!last || last - start < 2 || last[-1] != '_')
		return NULL;

	id_len = (size_t)(last - 1 - start);
	id = malloc(id_len + 1);
	if (!id)
		return NULL;

	memcpy(id, start, id_len);
	id[id_len] = '\0';
	return id;
}
231 
232 static struct btf_id *add_set(struct object *obj, char *name)
233 {
234 	/*
235 	 * __BTF_ID__set__name
236 	 * name =    ^
237 	 * id   =         ^
238 	 */
239 	char *id = name + sizeof(BTF_SET "__") - 1;
240 	int len = strlen(name);
241 
242 	if (id >= name + len) {
243 		pr_err("FAILED to parse set name: %s\n", name);
244 		return NULL;
245 	}
246 
247 	return btf_id__add(&obj->sets, id, true);
248 }
249 
250 static struct btf_id *add_symbol(struct rb_root *root, char *name, size_t size)
251 {
252 	char *id;
253 
254 	id = get_id(name + size);
255 	if (!id) {
256 		pr_err("FAILED to parse symbol name: %s\n", name);
257 		return NULL;
258 	}
259 
260 	return btf_id__add(root, id, false);
261 }
262 
/*
 * Fallback for older libelf.h / glibc elf.h headers that do not define
 * the ELF compression flag yet.
 */
#ifndef SHF_COMPRESSED
#define SHF_COMPRESSED (1 << 11) /* Section with compressed data. */
#endif
267 
268 /*
269  * The data of compressed section should be aligned to 4
270  * (for 32bit) or 8 (for 64 bit) bytes. The binutils ld
271  * sets sh_addralign to 1, which makes libelf fail with
272  * misaligned section error during the update:
273  *    FAILED elf_update(WRITE): invalid section alignment
274  *
275  * While waiting for ld fix, we fix the compressed sections
276  * sh_addralign value manualy.
277  */
278 static int compressed_section_fix(Elf *elf, Elf_Scn *scn, GElf_Shdr *sh)
279 {
280 	int expected = gelf_getclass(elf) == ELFCLASS32 ? 4 : 8;
281 
282 	if (!(sh->sh_flags & SHF_COMPRESSED))
283 		return 0;
284 
285 	if (sh->sh_addralign == expected)
286 		return 0;
287 
288 	pr_debug2(" - fixing wrong alignment sh_addralign %u, expected %u\n",
289 		  sh->sh_addralign, expected);
290 
291 	sh->sh_addralign = expected;
292 
293 	if (gelf_update_shdr(scn, sh) == 0) {
294 		pr_err("FAILED cannot update section header: %s\n",
295 			elf_errmsg(-1));
296 		return -1;
297 	}
298 	return 0;
299 }
300 
301 static int elf_collect(struct object *obj)
302 {
303 	Elf_Scn *scn = NULL;
304 	size_t shdrstrndx;
305 	int idx = 0;
306 	Elf *elf;
307 	int fd;
308 
309 	fd = open(obj->path, O_RDWR, 0666);
310 	if (fd == -1) {
311 		pr_err("FAILED cannot open %s: %s\n",
312 			obj->path, strerror(errno));
313 		return -1;
314 	}
315 
316 	elf_version(EV_CURRENT);
317 
318 	elf = elf_begin(fd, ELF_C_RDWR_MMAP, NULL);
319 	if (!elf) {
320 		close(fd);
321 		pr_err("FAILED cannot create ELF descriptor: %s\n",
322 			elf_errmsg(-1));
323 		return -1;
324 	}
325 
326 	obj->efile.fd  = fd;
327 	obj->efile.elf = elf;
328 
329 	elf_flagelf(elf, ELF_C_SET, ELF_F_LAYOUT);
330 
331 	if (elf_getshdrstrndx(elf, &shdrstrndx) != 0) {
332 		pr_err("FAILED cannot get shdr str ndx\n");
333 		return -1;
334 	}
335 
336 	/*
337 	 * Scan all the elf sections and look for save data
338 	 * from .BTF_ids section and symbols.
339 	 */
340 	while ((scn = elf_nextscn(elf, scn)) != NULL) {
341 		Elf_Data *data;
342 		GElf_Shdr sh;
343 		char *name;
344 
345 		idx++;
346 		if (gelf_getshdr(scn, &sh) != &sh) {
347 			pr_err("FAILED get section(%d) header\n", idx);
348 			return -1;
349 		}
350 
351 		name = elf_strptr(elf, shdrstrndx, sh.sh_name);
352 		if (!name) {
353 			pr_err("FAILED get section(%d) name\n", idx);
354 			return -1;
355 		}
356 
357 		data = elf_getdata(scn, 0);
358 		if (!data) {
359 			pr_err("FAILED to get section(%d) data from %s\n",
360 				idx, name);
361 			return -1;
362 		}
363 
364 		pr_debug2("section(%d) %s, size %ld, link %d, flags %lx, type=%d\n",
365 			  idx, name, (unsigned long) data->d_size,
366 			  (int) sh.sh_link, (unsigned long) sh.sh_flags,
367 			  (int) sh.sh_type);
368 
369 		if (sh.sh_type == SHT_SYMTAB) {
370 			obj->efile.symbols       = data;
371 			obj->efile.symbols_shndx = idx;
372 			obj->efile.strtabidx     = sh.sh_link;
373 		} else if (!strcmp(name, BTF_IDS_SECTION)) {
374 			obj->efile.idlist       = data;
375 			obj->efile.idlist_shndx = idx;
376 			obj->efile.idlist_addr  = sh.sh_addr;
377 		}
378 
379 		if (compressed_section_fix(elf, scn, &sh))
380 			return -1;
381 	}
382 
383 	return 0;
384 }
385 
386 static int symbols_collect(struct object *obj)
387 {
388 	Elf_Scn *scn = NULL;
389 	int n, i;
390 	GElf_Shdr sh;
391 	char *name;
392 
393 	scn = elf_getscn(obj->efile.elf, obj->efile.symbols_shndx);
394 	if (!scn)
395 		return -1;
396 
397 	if (gelf_getshdr(scn, &sh) != &sh)
398 		return -1;
399 
400 	n = sh.sh_size / sh.sh_entsize;
401 
402 	/*
403 	 * Scan symbols and look for the ones starting with
404 	 * __BTF_ID__* over .BTF_ids section.
405 	 */
406 	for (i = 0; i < n; i++) {
407 		char *prefix;
408 		struct btf_id *id;
409 		GElf_Sym sym;
410 
411 		if (!gelf_getsym(obj->efile.symbols, i, &sym))
412 			return -1;
413 
414 		if (sym.st_shndx != obj->efile.idlist_shndx)
415 			continue;
416 
417 		name = elf_strptr(obj->efile.elf, obj->efile.strtabidx,
418 				  sym.st_name);
419 
420 		if (!is_btf_id(name))
421 			continue;
422 
423 		/*
424 		 * __BTF_ID__TYPE__vfs_truncate__0
425 		 * prefix =  ^
426 		 */
427 		prefix = name + sizeof(BTF_ID) - 1;
428 
429 		/* struct */
430 		if (!strncmp(prefix, BTF_STRUCT, sizeof(BTF_STRUCT) - 1)) {
431 			obj->nr_structs++;
432 			id = add_symbol(&obj->structs, prefix, sizeof(BTF_STRUCT) - 1);
433 		/* union  */
434 		} else if (!strncmp(prefix, BTF_UNION, sizeof(BTF_UNION) - 1)) {
435 			obj->nr_unions++;
436 			id = add_symbol(&obj->unions, prefix, sizeof(BTF_UNION) - 1);
437 		/* typedef */
438 		} else if (!strncmp(prefix, BTF_TYPEDEF, sizeof(BTF_TYPEDEF) - 1)) {
439 			obj->nr_typedefs++;
440 			id = add_symbol(&obj->typedefs, prefix, sizeof(BTF_TYPEDEF) - 1);
441 		/* func */
442 		} else if (!strncmp(prefix, BTF_FUNC, sizeof(BTF_FUNC) - 1)) {
443 			obj->nr_funcs++;
444 			id = add_symbol(&obj->funcs, prefix, sizeof(BTF_FUNC) - 1);
445 		/* set */
446 		} else if (!strncmp(prefix, BTF_SET, sizeof(BTF_SET) - 1)) {
447 			id = add_set(obj, prefix);
448 			/*
449 			 * SET objects store list's count, which is encoded
450 			 * in symbol's size, together with 'cnt' field hence
451 			 * that - 1.
452 			 */
453 			if (id)
454 				id->cnt = sym.st_size / sizeof(int) - 1;
455 		} else {
456 			pr_err("FAILED unsupported prefix %s\n", prefix);
457 			return -1;
458 		}
459 
460 		if (!id)
461 			return -ENOMEM;
462 
463 		if (id->addr_cnt >= ADDR_CNT) {
464 			pr_err("FAILED symbol %s crossed the number of allowed lists\n",
465 				id->name);
466 			return -1;
467 		}
468 		id->addr[id->addr_cnt++] = sym.st_value;
469 	}
470 
471 	return 0;
472 }
473 
474 static int symbols_resolve(struct object *obj)
475 {
476 	int nr_typedefs = obj->nr_typedefs;
477 	int nr_structs  = obj->nr_structs;
478 	int nr_unions   = obj->nr_unions;
479 	int nr_funcs    = obj->nr_funcs;
480 	int err, type_id;
481 	struct btf *btf;
482 	__u32 nr_types;
483 
484 	btf = btf__parse(obj->btf ?: obj->path, NULL);
485 	err = libbpf_get_error(btf);
486 	if (err) {
487 		pr_err("FAILED: load BTF from %s: %s\n",
488 			obj->btf ?: obj->path, strerror(-err));
489 		return -1;
490 	}
491 
492 	err = -1;
493 	nr_types = btf__get_nr_types(btf);
494 
495 	/*
496 	 * Iterate all the BTF types and search for collected symbol IDs.
497 	 */
498 	for (type_id = 1; type_id <= nr_types; type_id++) {
499 		const struct btf_type *type;
500 		struct rb_root *root;
501 		struct btf_id *id;
502 		const char *str;
503 		int *nr;
504 
505 		type = btf__type_by_id(btf, type_id);
506 		if (!type) {
507 			pr_err("FAILED: malformed BTF, can't resolve type for ID %d\n",
508 				type_id);
509 			goto out;
510 		}
511 
512 		if (btf_is_func(type) && nr_funcs) {
513 			nr   = &nr_funcs;
514 			root = &obj->funcs;
515 		} else if (btf_is_struct(type) && nr_structs) {
516 			nr   = &nr_structs;
517 			root = &obj->structs;
518 		} else if (btf_is_union(type) && nr_unions) {
519 			nr   = &nr_unions;
520 			root = &obj->unions;
521 		} else if (btf_is_typedef(type) && nr_typedefs) {
522 			nr   = &nr_typedefs;
523 			root = &obj->typedefs;
524 		} else
525 			continue;
526 
527 		str = btf__name_by_offset(btf, type->name_off);
528 		if (!str) {
529 			pr_err("FAILED: malformed BTF, can't resolve name for ID %d\n",
530 				type_id);
531 			goto out;
532 		}
533 
534 		id = btf_id__find(root, str);
535 		if (id) {
536 			if (id->id) {
537 				pr_info("WARN: multiple IDs found for '%s': %d, %d - using %d\n",
538 					str, id->id, type_id, id->id);
539 			} else {
540 				id->id = type_id;
541 				(*nr)--;
542 			}
543 		}
544 	}
545 
546 	err = 0;
547 out:
548 	btf__free(btf);
549 	return err;
550 }
551 
552 static int id_patch(struct object *obj, struct btf_id *id)
553 {
554 	Elf_Data *data = obj->efile.idlist;
555 	int *ptr = data->d_buf;
556 	int i;
557 
558 	if (!id->id) {
559 		pr_err("WARN: resolve_btfids: unresolved symbol %s\n", id->name);
560 	}
561 
562 	for (i = 0; i < id->addr_cnt; i++) {
563 		unsigned long addr = id->addr[i];
564 		unsigned long idx = addr - obj->efile.idlist_addr;
565 
566 		pr_debug("patching addr %5lu: ID %7d [%s]\n",
567 			 idx, id->id, id->name);
568 
569 		if (idx >= data->d_size) {
570 			pr_err("FAILED patching index %lu out of bounds %lu\n",
571 				idx, data->d_size);
572 			return -1;
573 		}
574 
575 		idx = idx / sizeof(int);
576 		ptr[idx] = id->id;
577 	}
578 
579 	return 0;
580 }
581 
582 static int __symbols_patch(struct object *obj, struct rb_root *root)
583 {
584 	struct rb_node *next;
585 	struct btf_id *id;
586 
587 	next = rb_first(root);
588 	while (next) {
589 		id = rb_entry(next, struct btf_id, rb_node);
590 
591 		if (id_patch(obj, id))
592 			return -1;
593 
594 		next = rb_next(next);
595 	}
596 	return 0;
597 }
598 
/*
 * qsort() comparator ordering ints ascending.
 *
 * Compares instead of subtracting, so the result is correct for the
 * whole int range (a subtraction could overflow).
 */
static int cmp_id(const void *pa, const void *pb)
{
	const int *a = pa, *b = pb;

	return (*a > *b) - (*a < *b);
}
605 
606 static int sets_patch(struct object *obj)
607 {
608 	Elf_Data *data = obj->efile.idlist;
609 	int *ptr = data->d_buf;
610 	struct rb_node *next;
611 
612 	next = rb_first(&obj->sets);
613 	while (next) {
614 		unsigned long addr, idx;
615 		struct btf_id *id;
616 		int *base;
617 		int cnt;
618 
619 		id   = rb_entry(next, struct btf_id, rb_node);
620 		addr = id->addr[0];
621 		idx  = addr - obj->efile.idlist_addr;
622 
623 		/* sets are unique */
624 		if (id->addr_cnt != 1) {
625 			pr_err("FAILED malformed data for set '%s'\n",
626 				id->name);
627 			return -1;
628 		}
629 
630 		idx = idx / sizeof(int);
631 		base = &ptr[idx] + 1;
632 		cnt = ptr[idx];
633 
634 		pr_debug("sorting  addr %5lu: cnt %6d [%s]\n",
635 			 (idx + 1) * sizeof(int), cnt, id->name);
636 
637 		qsort(base, cnt, sizeof(int), cmp_id);
638 
639 		next = rb_next(next);
640 	}
641 	return 0;
642 }
643 
644 static int symbols_patch(struct object *obj)
645 {
646 	int err;
647 
648 	if (__symbols_patch(obj, &obj->structs)  ||
649 	    __symbols_patch(obj, &obj->unions)   ||
650 	    __symbols_patch(obj, &obj->typedefs) ||
651 	    __symbols_patch(obj, &obj->funcs)    ||
652 	    __symbols_patch(obj, &obj->sets))
653 		return -1;
654 
655 	if (sets_patch(obj))
656 		return -1;
657 
658 	/* Set type to ensure endian translation occurs. */
659 	obj->efile.idlist->d_type = ELF_T_WORD;
660 
661 	elf_flagdata(obj->efile.idlist, ELF_C_SET, ELF_F_DIRTY);
662 
663 	err = elf_update(obj->efile.elf, ELF_C_WRITE);
664 	if (err < 0) {
665 		pr_err("FAILED elf_update(WRITE): %s\n",
666 			elf_errmsg(-1));
667 	}
668 
669 	pr_debug("update %s for %s\n",
670 		 err >= 0 ? "ok" : "failed", obj->path);
671 	return err < 0 ? -1 : 0;
672 }
673 
/* NULL-terminated usage lines handed to the option parser. */
static const char * const resolve_btfids_usage[] = {
	"resolve_btfids [<options>] <ELF object>",
	NULL
};
678 
679 int main(int argc, const char **argv)
680 {
681 	bool no_fail = false;
682 	struct object obj = {
683 		.efile = {
684 			.idlist_shndx  = -1,
685 			.symbols_shndx = -1,
686 		},
687 		.structs  = RB_ROOT,
688 		.unions   = RB_ROOT,
689 		.typedefs = RB_ROOT,
690 		.funcs    = RB_ROOT,
691 		.sets     = RB_ROOT,
692 	};
693 	struct option btfid_options[] = {
694 		OPT_INCR('v', "verbose", &verbose,
695 			 "be more verbose (show errors, etc)"),
696 		OPT_STRING(0, "btf", &obj.btf, "BTF data",
697 			   "BTF data"),
698 		OPT_BOOLEAN(0, "no-fail", &no_fail,
699 			   "do not fail if " BTF_IDS_SECTION " section is not found"),
700 		OPT_END()
701 	};
702 	int err = -1;
703 
704 	argc = parse_options(argc, argv, btfid_options, resolve_btfids_usage,
705 			     PARSE_OPT_STOP_AT_NON_OPTION);
706 	if (argc != 1)
707 		usage_with_options(resolve_btfids_usage, btfid_options);
708 
709 	obj.path = argv[0];
710 
711 	if (elf_collect(&obj))
712 		goto out;
713 
714 	/*
715 	 * We did not find .BTF_ids section or symbols section,
716 	 * nothing to do..
717 	 */
718 	if (obj.efile.idlist_shndx == -1 ||
719 	    obj.efile.symbols_shndx == -1) {
720 		if (no_fail)
721 			return 0;
722 		pr_err("FAILED to find needed sections\n");
723 		return -1;
724 	}
725 
726 	if (symbols_collect(&obj))
727 		goto out;
728 
729 	if (symbols_resolve(&obj))
730 		goto out;
731 
732 	if (symbols_patch(&obj))
733 		goto out;
734 
735 	err = 0;
736 out:
737 	if (obj.efile.elf) {
738 		elf_end(obj.efile.elf);
739 		close(obj.efile.fd);
740 	}
741 	return err;
742 }
743