xref: /linux/tools/perf/builtin-annotate.c (revision 273b281fa22c293963ee3e6eec418f5dda2dbc83)
1 /*
2  * builtin-annotate.c
3  *
4  * Builtin annotate command: Analyze the perf.data input file,
5  * look up and read DSOs and symbol information and display
6  * a histogram of results, along various sorting keys.
7  */
8 #include "builtin.h"
9 
10 #include "util/util.h"
11 
12 #include "util/color.h"
13 #include <linux/list.h>
14 #include "util/cache.h"
15 #include <linux/rbtree.h>
16 #include "util/symbol.h"
17 #include "util/string.h"
18 
19 #include "perf.h"
20 #include "util/debug.h"
21 
22 #include "util/event.h"
23 #include "util/parse-options.h"
24 #include "util/parse-events.h"
25 #include "util/thread.h"
26 #include "util/sort.h"
27 #include "util/hist.h"
28 #include "util/data_map.h"
29 
/* Path of the perf data file to analyze; replaced by -i/--input. */
static const char *input_name = "perf.data";

/* Set by -f/--force. */
static int force;
/* Set by -P/--full-paths: show the DSO's full path instead of its basename. */
static int full_paths;
/* Set by -l/--print-line: look up and print source lines for hot addresses. */
static int print_line;
37 
38 struct sym_hist {
39 	u64		sum;
40 	u64		ip[0];
41 };
42 
43 struct sym_ext {
44 	struct rb_node	node;
45 	double		percent;
46 	char		*path;
47 };
48 
/* Private data attached to each symbol and reached through symbol__priv(). */
struct sym_priv {
	struct sym_hist	*hist;	/* sample histogram; NULL once annotated or if never allocated */
	struct sym_ext	*ext;	/* per-address source lines, filled by get_source_line() */
};
53 
54 static struct symbol_conf symbol_conf = {
55 	.priv_size	  = sizeof(struct sym_priv),
56 	.try_vmlinux_path = true,
57 };
58 
59 static const char *sym_hist_filter;
60 
61 static int symbol_filter(struct map *map __used, struct symbol *sym)
62 {
63 	if (sym_hist_filter == NULL ||
64 	    strcmp(sym->name, sym_hist_filter) == 0) {
65 		struct sym_priv *priv = symbol__priv(sym);
66 		const int size = (sizeof(*priv->hist) +
67 				  (sym->end - sym->start) * sizeof(u64));
68 
69 		priv->hist = malloc(size);
70 		if (priv->hist)
71 			memset(priv->hist, 0, size);
72 		return 0;
73 	}
74 	/*
75 	 * FIXME: We should really filter it out, as we don't want to go thru symbols
76 	 * we're not interested, and if a DSO ends up with no symbols, delete it too,
77 	 * but right now the kernel loading routines in symbol.c bail out if no symbols
78 	 * are found, fix it later.
79 	 */
80 	return 0;
81 }
82 
83 /*
84  * collect histogram counts
85  */
86 static void hist_hit(struct hist_entry *he, u64 ip)
87 {
88 	unsigned int sym_size, offset;
89 	struct symbol *sym = he->sym;
90 	struct sym_priv *priv;
91 	struct sym_hist *h;
92 
93 	he->count++;
94 
95 	if (!sym || !he->map)
96 		return;
97 
98 	priv = symbol__priv(sym);
99 	if (!priv->hist)
100 		return;
101 
102 	sym_size = sym->end - sym->start;
103 	offset = ip - sym->start;
104 
105 	if (verbose)
106 		fprintf(stderr, "%s: ip=%Lx\n", __func__,
107 			he->map->unmap_ip(he->map, ip));
108 
109 	if (offset >= sym_size)
110 		return;
111 
112 	h = priv->hist;
113 	h->sum++;
114 	h->ip[offset]++;
115 
116 	if (verbose >= 3)
117 		printf("%p %s: count++ [ip: %p, %08Lx] => %Ld\n",
118 			(void *)(unsigned long)he->sym->start,
119 			he->sym->name,
120 			(void *)(unsigned long)ip, ip - he->sym->start,
121 			h->ip[offset]);
122 }
123 
124 static int hist_entry__add(struct addr_location *al, u64 count)
125 {
126 	bool hit;
127 	struct hist_entry *he = __hist_entry__add(al, NULL, count, &hit);
128 	if (he == NULL)
129 		return -ENOMEM;
130 	hist_hit(he, al->addr);
131 	return 0;
132 }
133 
134 static int process_sample_event(event_t *event)
135 {
136 	struct addr_location al;
137 
138 	dump_printf("(IP, %d): %d: %p\n", event->header.misc,
139 		    event->ip.pid, (void *)(long)event->ip.ip);
140 
141 	if (event__preprocess_sample(event, &al, symbol_filter) < 0) {
142 		fprintf(stderr, "problem processing %d event, skipping it.\n",
143 			event->header.type);
144 		return -1;
145 	}
146 
147 	if (hist_entry__add(&al, 1)) {
148 		fprintf(stderr, "problem incrementing symbol count, "
149 				"skipping event\n");
150 		return -1;
151 	}
152 
153 	return 0;
154 }
155 
156 static int parse_line(FILE *file, struct hist_entry *he, u64 len)
157 {
158 	struct symbol *sym = he->sym;
159 	char *line = NULL, *tmp, *tmp2;
160 	static const char *prev_line;
161 	static const char *prev_color;
162 	unsigned int offset;
163 	size_t line_len;
164 	u64 start;
165 	s64 line_ip;
166 	int ret;
167 	char *c;
168 
169 	if (getline(&line, &line_len, file) < 0)
170 		return -1;
171 	if (!line)
172 		return -1;
173 
174 	c = strchr(line, '\n');
175 	if (c)
176 		*c = 0;
177 
178 	line_ip = -1;
179 	offset = 0;
180 	ret = -2;
181 
182 	/*
183 	 * Strip leading spaces:
184 	 */
185 	tmp = line;
186 	while (*tmp) {
187 		if (*tmp != ' ')
188 			break;
189 		tmp++;
190 	}
191 
192 	if (*tmp) {
193 		/*
194 		 * Parse hexa addresses followed by ':'
195 		 */
196 		line_ip = strtoull(tmp, &tmp2, 16);
197 		if (*tmp2 != ':')
198 			line_ip = -1;
199 	}
200 
201 	start = he->map->unmap_ip(he->map, sym->start);
202 
203 	if (line_ip != -1) {
204 		const char *path = NULL;
205 		unsigned int hits = 0;
206 		double percent = 0.0;
207 		const char *color;
208 		struct sym_priv *priv = symbol__priv(sym);
209 		struct sym_ext *sym_ext = priv->ext;
210 		struct sym_hist *h = priv->hist;
211 
212 		offset = line_ip - start;
213 		if (offset < len)
214 			hits = h->ip[offset];
215 
216 		if (offset < len && sym_ext) {
217 			path = sym_ext[offset].path;
218 			percent = sym_ext[offset].percent;
219 		} else if (h->sum)
220 			percent = 100.0 * hits / h->sum;
221 
222 		color = get_percent_color(percent);
223 
224 		/*
225 		 * Also color the filename and line if needed, with
226 		 * the same color than the percentage. Don't print it
227 		 * twice for close colored ip with the same filename:line
228 		 */
229 		if (path) {
230 			if (!prev_line || strcmp(prev_line, path)
231 				       || color != prev_color) {
232 				color_fprintf(stdout, color, " %s", path);
233 				prev_line = path;
234 				prev_color = color;
235 			}
236 		}
237 
238 		color_fprintf(stdout, color, " %7.2f", percent);
239 		printf(" :	");
240 		color_fprintf(stdout, PERF_COLOR_BLUE, "%s\n", line);
241 	} else {
242 		if (!*line)
243 			printf("         :\n");
244 		else
245 			printf("         :	%s\n", line);
246 	}
247 
248 	return 0;
249 }
250 
251 static struct rb_root root_sym_ext;
252 
253 static void insert_source_line(struct sym_ext *sym_ext)
254 {
255 	struct sym_ext *iter;
256 	struct rb_node **p = &root_sym_ext.rb_node;
257 	struct rb_node *parent = NULL;
258 
259 	while (*p != NULL) {
260 		parent = *p;
261 		iter = rb_entry(parent, struct sym_ext, node);
262 
263 		if (sym_ext->percent > iter->percent)
264 			p = &(*p)->rb_left;
265 		else
266 			p = &(*p)->rb_right;
267 	}
268 
269 	rb_link_node(&sym_ext->node, parent, p);
270 	rb_insert_color(&sym_ext->node, &root_sym_ext);
271 }
272 
273 static void free_source_line(struct hist_entry *he, int len)
274 {
275 	struct sym_priv *priv = symbol__priv(he->sym);
276 	struct sym_ext *sym_ext = priv->ext;
277 	int i;
278 
279 	if (!sym_ext)
280 		return;
281 
282 	for (i = 0; i < len; i++)
283 		free(sym_ext[i].path);
284 	free(sym_ext);
285 
286 	priv->ext = NULL;
287 	root_sym_ext = RB_ROOT;
288 }
289 
290 /* Get the filename:line for the colored entries */
291 static void
292 get_source_line(struct hist_entry *he, int len, const char *filename)
293 {
294 	struct symbol *sym = he->sym;
295 	u64 start;
296 	int i;
297 	char cmd[PATH_MAX * 2];
298 	struct sym_ext *sym_ext;
299 	struct sym_priv *priv = symbol__priv(sym);
300 	struct sym_hist *h = priv->hist;
301 
302 	if (!h->sum)
303 		return;
304 
305 	sym_ext = priv->ext = calloc(len, sizeof(struct sym_ext));
306 	if (!priv->ext)
307 		return;
308 
309 	start = he->map->unmap_ip(he->map, sym->start);
310 
311 	for (i = 0; i < len; i++) {
312 		char *path = NULL;
313 		size_t line_len;
314 		u64 offset;
315 		FILE *fp;
316 
317 		sym_ext[i].percent = 100.0 * h->ip[i] / h->sum;
318 		if (sym_ext[i].percent <= 0.5)
319 			continue;
320 
321 		offset = start + i;
322 		sprintf(cmd, "addr2line -e %s %016llx", filename, offset);
323 		fp = popen(cmd, "r");
324 		if (!fp)
325 			continue;
326 
327 		if (getline(&path, &line_len, fp) < 0 || !line_len)
328 			goto next;
329 
330 		sym_ext[i].path = malloc(sizeof(char) * line_len + 1);
331 		if (!sym_ext[i].path)
332 			goto next;
333 
334 		strcpy(sym_ext[i].path, path);
335 		insert_source_line(&sym_ext[i]);
336 
337 	next:
338 		pclose(fp);
339 	}
340 }
341 
342 static void print_summary(const char *filename)
343 {
344 	struct sym_ext *sym_ext;
345 	struct rb_node *node;
346 
347 	printf("\nSorted summary for file %s\n", filename);
348 	printf("----------------------------------------------\n\n");
349 
350 	if (RB_EMPTY_ROOT(&root_sym_ext)) {
351 		printf(" Nothing higher than %1.1f%%\n", MIN_GREEN);
352 		return;
353 	}
354 
355 	node = rb_first(&root_sym_ext);
356 	while (node) {
357 		double percent;
358 		const char *color;
359 		char *path;
360 
361 		sym_ext = rb_entry(node, struct sym_ext, node);
362 		percent = sym_ext->percent;
363 		color = get_percent_color(percent);
364 		path = sym_ext->path;
365 
366 		color_fprintf(stdout, color, " %7.2f %s", percent, path);
367 		node = rb_next(node);
368 	}
369 }
370 
371 static void annotate_sym(struct hist_entry *he)
372 {
373 	struct map *map = he->map;
374 	struct dso *dso = map->dso;
375 	struct symbol *sym = he->sym;
376 	const char *filename = dso->long_name, *d_filename;
377 	u64 len;
378 	char command[PATH_MAX*2];
379 	FILE *file;
380 
381 	if (!filename)
382 		return;
383 
384 	if (verbose)
385 		fprintf(stderr, "%s: filename=%s, sym=%s, start=%Lx, end=%Lx\n",
386 			__func__, filename, sym->name,
387 			map->unmap_ip(map, sym->start),
388 			map->unmap_ip(map, sym->end));
389 
390 	if (full_paths)
391 		d_filename = filename;
392 	else
393 		d_filename = basename(filename);
394 
395 	len = sym->end - sym->start;
396 
397 	if (print_line) {
398 		get_source_line(he, len, filename);
399 		print_summary(filename);
400 	}
401 
402 	printf("\n\n------------------------------------------------\n");
403 	printf(" Percent |	Source code & Disassembly of %s\n", d_filename);
404 	printf("------------------------------------------------\n");
405 
406 	if (verbose >= 2)
407 		printf("annotating [%p] %30s : [%p] %30s\n",
408 		       dso, dso->long_name, sym, sym->name);
409 
410 	sprintf(command, "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s",
411 		map->unmap_ip(map, sym->start), map->unmap_ip(map, sym->end),
412 		filename, filename);
413 
414 	if (verbose >= 3)
415 		printf("doing: %s\n", command);
416 
417 	file = popen(command, "r");
418 	if (!file)
419 		return;
420 
421 	while (!feof(file)) {
422 		if (parse_line(file, he, len) < 0)
423 			break;
424 	}
425 
426 	pclose(file);
427 	if (print_line)
428 		free_source_line(he, len);
429 }
430 
431 static void find_annotations(void)
432 {
433 	struct rb_node *nd;
434 
435 	for (nd = rb_first(&output_hists); nd; nd = rb_next(nd)) {
436 		struct hist_entry *he = rb_entry(nd, struct hist_entry, rb_node);
437 		struct sym_priv *priv;
438 
439 		if (he->sym == NULL)
440 			continue;
441 
442 		priv = symbol__priv(he->sym);
443 		if (priv->hist == NULL)
444 			continue;
445 
446 		annotate_sym(he);
447 		/*
448 		 * Since we have a hist_entry per IP for the same symbol, free
449 		 * he->sym->hist to signal we already processed this symbol.
450 		 */
451 		free(priv->hist);
452 		priv->hist = NULL;
453 	}
454 }
455 
456 static struct perf_file_handler file_handler = {
457 	.process_sample_event	= process_sample_event,
458 	.process_mmap_event	= event__process_mmap,
459 	.process_comm_event	= event__process_comm,
460 	.process_fork_event	= event__process_task,
461 };
462 
463 static int __cmd_annotate(void)
464 {
465 	struct perf_header *header;
466 	struct thread *idle;
467 	int ret;
468 
469 	idle = register_idle_thread();
470 	register_perf_file_handler(&file_handler);
471 
472 	ret = mmap_dispatch_perf_file(&header, input_name, 0, 0,
473 				      &event__cwdlen, &event__cwd);
474 	if (ret)
475 		return ret;
476 
477 	if (dump_trace) {
478 		event__print_totals();
479 		return 0;
480 	}
481 
482 	if (verbose > 3)
483 		threads__fprintf(stdout);
484 
485 	if (verbose > 2)
486 		dsos__fprintf(stdout);
487 
488 	collapse__resort();
489 	output__resort(event__total[0]);
490 
491 	find_annotations();
492 
493 	return ret;
494 }
495 
/* NULL-terminated usage lines passed to parse_options() and usage_with_options(). */
static const char * const annotate_usage[] = {
	"perf annotate [<options>] <command>",
	NULL,
};
500 
501 static const struct option options[] = {
502 	OPT_STRING('i', "input", &input_name, "file",
503 		    "input file name"),
504 	OPT_STRING('s', "symbol", &sym_hist_filter, "symbol",
505 		    "symbol to annotate"),
506 	OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
507 	OPT_BOOLEAN('v', "verbose", &verbose,
508 		    "be more verbose (show symbol address, etc)"),
509 	OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
510 		    "dump raw trace in ASCII"),
511 	OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name,
512 		   "file", "vmlinux pathname"),
513 	OPT_BOOLEAN('m', "modules", &symbol_conf.use_modules,
514 		    "load module symbols - WARNING: use only with -k and LIVE kernel"),
515 	OPT_BOOLEAN('l', "print-line", &print_line,
516 		    "print matching source lines (may be slow)"),
517 	OPT_BOOLEAN('P', "full-paths", &full_paths,
518 		    "Don't shorten the displayed pathnames"),
519 	OPT_END()
520 };
521 
522 static void setup_sorting(void)
523 {
524 	char *tmp, *tok, *str = strdup(sort_order);
525 
526 	for (tok = strtok_r(str, ", ", &tmp);
527 			tok; tok = strtok_r(NULL, ", ", &tmp)) {
528 		if (sort_dimension__add(tok) < 0) {
529 			error("Unknown --sort key: `%s'", tok);
530 			usage_with_options(annotate_usage, options);
531 		}
532 	}
533 
534 	free(str);
535 }
536 
537 int cmd_annotate(int argc, const char **argv, const char *prefix __used)
538 {
539 	if (symbol__init(&symbol_conf) < 0)
540 		return -1;
541 
542 	argc = parse_options(argc, argv, options, annotate_usage, 0);
543 
544 	setup_sorting();
545 
546 	if (argc) {
547 		/*
548 		 * Special case: if there's an argument left then assume tha
549 		 * it's a symbol filter:
550 		 */
551 		if (argc > 1)
552 			usage_with_options(annotate_usage, options);
553 
554 		sym_hist_filter = argv[0];
555 	}
556 
557 	setup_pager();
558 
559 	if (field_sep && *field_sep == '.') {
560 		fputs("'.' is the only non valid --field-separator argument\n",
561 				stderr);
562 		exit(129);
563 	}
564 
565 	return __cmd_annotate();
566 }
567