xref: /linux/tools/perf/builtin-annotate.c (revision ac6a0cf6716bb46813d0161024c66c2af66e53d1)
1 /*
2  * builtin-annotate.c
3  *
4  * Builtin annotate command: Analyze the perf.data input file,
5  * look up and read DSOs and symbol information and display
6  * a histogram of results, along various sorting keys.
7  */
8 #include "builtin.h"
9 
10 #include "util/util.h"
11 
12 #include "util/color.h"
13 #include <linux/list.h>
14 #include "util/cache.h"
15 #include <linux/rbtree.h>
16 #include "util/symbol.h"
17 #include "util/string.h"
18 
19 #include "perf.h"
20 
21 #include "util/parse-options.h"
22 #include "util/parse-events.h"
23 
/* Bits for show_mask: which sample origins get accounted. */
#define SHOW_KERNEL	1
#define SHOW_USER	2
#define SHOW_HV		4

/* Input file and kernel image names; both are settable via the option table. */
static const char	*input_name = "perf.data";
static char		*vmlinux = "vmlinux";

/* Comma separated list of sort keys, parsed by setup_sorting(). */
static char		default_sort_order[] = "comm,symbol";
static char		*sort_order = default_sort_order;

/* File descriptor of the opened input file. */
static int		input;

/* By default samples of every origin are shown. */
static int		show_mask = SHOW_KERNEL | SHOW_USER | SHOW_HV;

/* dprintf() output is emitted only while dump_trace is non-zero. */
static int		dump_trace = 0;
#define dprintf(x...)	do { if (dump_trace) printf(x); } while (0)

/* Flags filled in by the option parser. */
static int		verbose;
static int		modules;
static int		full_paths;
static int		print_line;

/* The input file is mapped in windows of mmap_window pages. */
static unsigned long	page_size;
static unsigned long	mmap_window = 32;
50 
51 struct ip_event {
52 	struct perf_event_header header;
53 	u64 ip;
54 	u32 pid, tid;
55 };
56 
57 struct mmap_event {
58 	struct perf_event_header header;
59 	u32 pid, tid;
60 	u64 start;
61 	u64 len;
62 	u64 pgoff;
63 	char filename[PATH_MAX];
64 };
65 
66 struct comm_event {
67 	struct perf_event_header header;
68 	u32 pid, tid;
69 	char comm[16];
70 };
71 
72 struct fork_event {
73 	struct perf_event_header header;
74 	u32 pid, ppid;
75 };
76 
77 typedef union event_union {
78 	struct perf_event_header	header;
79 	struct ip_event			ip;
80 	struct mmap_event		mmap;
81 	struct comm_event		comm;
82 	struct fork_event		fork;
83 } event_t;
84 
85 
86 struct sym_ext {
87 	struct rb_node	node;
88 	double		percent;
89 	char		*path;
90 };
91 
/* All registered DSOs, in registration order. */
static LIST_HEAD(dsos);

/* Both are set up by load_kernel(); kernel_dso is reset to NULL when loading fails. */
static struct dso *kernel_dso, *vdso;
95 
96 
97 static void dsos__add(struct dso *dso)
98 {
99 	list_add_tail(&dso->node, &dsos);
100 }
101 
102 static struct dso *dsos__find(const char *name)
103 {
104 	struct dso *pos;
105 
106 	list_for_each_entry(pos, &dsos, node)
107 		if (strcmp(pos->name, name) == 0)
108 			return pos;
109 	return NULL;
110 }
111 
112 static struct dso *dsos__findnew(const char *name)
113 {
114 	struct dso *dso = dsos__find(name);
115 	int nr;
116 
117 	if (dso)
118 		return dso;
119 
120 	dso = dso__new(name, 0);
121 	if (!dso)
122 		goto out_delete_dso;
123 
124 	nr = dso__load(dso, NULL, verbose);
125 	if (nr < 0) {
126 		if (verbose)
127 			fprintf(stderr, "Failed to open: %s\n", name);
128 		goto out_delete_dso;
129 	}
130 	if (!nr && verbose) {
131 		fprintf(stderr,
132 		"No symbols found in: %s, maybe install a debug package?\n",
133 				name);
134 	}
135 
136 	dsos__add(dso);
137 
138 	return dso;
139 
140 out_delete_dso:
141 	dso__delete(dso);
142 	return NULL;
143 }
144 
145 static void dsos__fprintf(FILE *fp)
146 {
147 	struct dso *pos;
148 
149 	list_for_each_entry(pos, &dsos, node)
150 		dso__fprintf(pos, fp);
151 }
152 
153 static struct symbol *vdso__find_symbol(struct dso *dso, u64 ip)
154 {
155 	return dso__find_symbol(dso, ip);
156 }
157 
158 static int load_kernel(void)
159 {
160 	int err;
161 
162 	kernel_dso = dso__new("[kernel]", 0);
163 	if (!kernel_dso)
164 		return -1;
165 
166 	err = dso__load_kernel(kernel_dso, vmlinux, NULL, verbose, modules);
167 	if (err <= 0) {
168 		dso__delete(kernel_dso);
169 		kernel_dso = NULL;
170 	} else
171 		dsos__add(kernel_dso);
172 
173 	vdso = dso__new("[vdso]", 0);
174 	if (!vdso)
175 		return -1;
176 
177 	vdso->find_symbol = vdso__find_symbol;
178 
179 	dsos__add(vdso);
180 
181 	return err;
182 }
183 
184 struct map {
185 	struct list_head node;
186 	u64	 start;
187 	u64	 end;
188 	u64	 pgoff;
189 	u64	 (*map_ip)(struct map *, u64);
190 	struct dso	 *dso;
191 };
192 
193 static u64 map__map_ip(struct map *map, u64 ip)
194 {
195 	return ip - map->start + map->pgoff;
196 }
197 
198 static u64 vdso__map_ip(struct map *map __used, u64 ip)
199 {
200 	return ip;
201 }
202 
203 static struct map *map__new(struct mmap_event *event)
204 {
205 	struct map *self = malloc(sizeof(*self));
206 
207 	if (self != NULL) {
208 		const char *filename = event->filename;
209 
210 		self->start = event->start;
211 		self->end   = event->start + event->len;
212 		self->pgoff = event->pgoff;
213 
214 		self->dso = dsos__findnew(filename);
215 		if (self->dso == NULL)
216 			goto out_delete;
217 
218 		if (self->dso == vdso)
219 			self->map_ip = vdso__map_ip;
220 		else
221 			self->map_ip = map__map_ip;
222 	}
223 	return self;
224 out_delete:
225 	free(self);
226 	return NULL;
227 }
228 
229 static struct map *map__clone(struct map *self)
230 {
231 	struct map *map = malloc(sizeof(*self));
232 
233 	if (!map)
234 		return NULL;
235 
236 	memcpy(map, self, sizeof(*self));
237 
238 	return map;
239 }
240 
241 static int map__overlap(struct map *l, struct map *r)
242 {
243 	if (l->start > r->start) {
244 		struct map *t = l;
245 		l = r;
246 		r = t;
247 	}
248 
249 	if (l->end > r->start)
250 		return 1;
251 
252 	return 0;
253 }
254 
255 static size_t map__fprintf(struct map *self, FILE *fp)
256 {
257 	return fprintf(fp, " %Lx-%Lx %Lx %s\n",
258 		       self->start, self->end, self->pgoff, self->dso->name);
259 }
260 
261 
262 struct thread {
263 	struct rb_node	 rb_node;
264 	struct list_head maps;
265 	pid_t		 pid;
266 	char		 *comm;
267 };
268 
269 static struct thread *thread__new(pid_t pid)
270 {
271 	struct thread *self = malloc(sizeof(*self));
272 
273 	if (self != NULL) {
274 		self->pid = pid;
275 		self->comm = malloc(32);
276 		if (self->comm)
277 			snprintf(self->comm, 32, ":%d", self->pid);
278 		INIT_LIST_HEAD(&self->maps);
279 	}
280 
281 	return self;
282 }
283 
284 static int thread__set_comm(struct thread *self, const char *comm)
285 {
286 	if (self->comm)
287 		free(self->comm);
288 	self->comm = strdup(comm);
289 	return self->comm ? 0 : -ENOMEM;
290 }
291 
292 static size_t thread__fprintf(struct thread *self, FILE *fp)
293 {
294 	struct map *pos;
295 	size_t ret = fprintf(fp, "Thread %d %s\n", self->pid, self->comm);
296 
297 	list_for_each_entry(pos, &self->maps, node)
298 		ret += map__fprintf(pos, fp);
299 
300 	return ret;
301 }
302 
303 
304 static struct rb_root threads;
305 static struct thread *last_match;
306 
307 static struct thread *threads__findnew(pid_t pid)
308 {
309 	struct rb_node **p = &threads.rb_node;
310 	struct rb_node *parent = NULL;
311 	struct thread *th;
312 
313 	/*
314 	 * Font-end cache - PID lookups come in blocks,
315 	 * so most of the time we dont have to look up
316 	 * the full rbtree:
317 	 */
318 	if (last_match && last_match->pid == pid)
319 		return last_match;
320 
321 	while (*p != NULL) {
322 		parent = *p;
323 		th = rb_entry(parent, struct thread, rb_node);
324 
325 		if (th->pid == pid) {
326 			last_match = th;
327 			return th;
328 		}
329 
330 		if (pid < th->pid)
331 			p = &(*p)->rb_left;
332 		else
333 			p = &(*p)->rb_right;
334 	}
335 
336 	th = thread__new(pid);
337 	if (th != NULL) {
338 		rb_link_node(&th->rb_node, parent, p);
339 		rb_insert_color(&th->rb_node, &threads);
340 		last_match = th;
341 	}
342 
343 	return th;
344 }
345 
346 static void thread__insert_map(struct thread *self, struct map *map)
347 {
348 	struct map *pos, *tmp;
349 
350 	list_for_each_entry_safe(pos, tmp, &self->maps, node) {
351 		if (map__overlap(pos, map)) {
352 			list_del_init(&pos->node);
353 			/* XXX leaks dsos */
354 			free(pos);
355 		}
356 	}
357 
358 	list_add_tail(&map->node, &self->maps);
359 }
360 
361 static int thread__fork(struct thread *self, struct thread *parent)
362 {
363 	struct map *map;
364 
365 	if (self->comm)
366 		free(self->comm);
367 	self->comm = strdup(parent->comm);
368 	if (!self->comm)
369 		return -ENOMEM;
370 
371 	list_for_each_entry(map, &parent->maps, node) {
372 		struct map *new = map__clone(map);
373 		if (!new)
374 			return -ENOMEM;
375 		thread__insert_map(self, new);
376 	}
377 
378 	return 0;
379 }
380 
381 static struct map *thread__find_map(struct thread *self, u64 ip)
382 {
383 	struct map *pos;
384 
385 	if (self == NULL)
386 		return NULL;
387 
388 	list_for_each_entry(pos, &self->maps, node)
389 		if (ip >= pos->start && ip <= pos->end)
390 			return pos;
391 
392 	return NULL;
393 }
394 
395 static size_t threads__fprintf(FILE *fp)
396 {
397 	size_t ret = 0;
398 	struct rb_node *nd;
399 
400 	for (nd = rb_first(&threads); nd; nd = rb_next(nd)) {
401 		struct thread *pos = rb_entry(nd, struct thread, rb_node);
402 
403 		ret += thread__fprintf(pos, fp);
404 	}
405 
406 	return ret;
407 }
408 
409 /*
410  * histogram, sorted on item, collects counts
411  */
412 
413 static struct rb_root hist;
414 
415 struct hist_entry {
416 	struct rb_node	 rb_node;
417 
418 	struct thread	 *thread;
419 	struct map	 *map;
420 	struct dso	 *dso;
421 	struct symbol	 *sym;
422 	u64	 ip;
423 	char		 level;
424 
425 	uint32_t	 count;
426 };
427 
428 /*
429  * configurable sorting bits
430  */
431 
432 struct sort_entry {
433 	struct list_head list;
434 
435 	char *header;
436 
437 	int64_t (*cmp)(struct hist_entry *, struct hist_entry *);
438 	int64_t (*collapse)(struct hist_entry *, struct hist_entry *);
439 	size_t	(*print)(FILE *fp, struct hist_entry *);
440 };
441 
442 /* --sort pid */
443 
444 static int64_t
445 sort__thread_cmp(struct hist_entry *left, struct hist_entry *right)
446 {
447 	return right->thread->pid - left->thread->pid;
448 }
449 
450 static size_t
451 sort__thread_print(FILE *fp, struct hist_entry *self)
452 {
453 	return fprintf(fp, "%16s:%5d", self->thread->comm ?: "", self->thread->pid);
454 }
455 
456 static struct sort_entry sort_thread = {
457 	.header = "         Command:  Pid",
458 	.cmp	= sort__thread_cmp,
459 	.print	= sort__thread_print,
460 };
461 
462 /* --sort comm */
463 
464 static int64_t
465 sort__comm_cmp(struct hist_entry *left, struct hist_entry *right)
466 {
467 	return right->thread->pid - left->thread->pid;
468 }
469 
470 static int64_t
471 sort__comm_collapse(struct hist_entry *left, struct hist_entry *right)
472 {
473 	char *comm_l = left->thread->comm;
474 	char *comm_r = right->thread->comm;
475 
476 	if (!comm_l || !comm_r) {
477 		if (!comm_l && !comm_r)
478 			return 0;
479 		else if (!comm_l)
480 			return -1;
481 		else
482 			return 1;
483 	}
484 
485 	return strcmp(comm_l, comm_r);
486 }
487 
488 static size_t
489 sort__comm_print(FILE *fp, struct hist_entry *self)
490 {
491 	return fprintf(fp, "%16s", self->thread->comm);
492 }
493 
494 static struct sort_entry sort_comm = {
495 	.header		= "         Command",
496 	.cmp		= sort__comm_cmp,
497 	.collapse	= sort__comm_collapse,
498 	.print		= sort__comm_print,
499 };
500 
501 /* --sort dso */
502 
503 static int64_t
504 sort__dso_cmp(struct hist_entry *left, struct hist_entry *right)
505 {
506 	struct dso *dso_l = left->dso;
507 	struct dso *dso_r = right->dso;
508 
509 	if (!dso_l || !dso_r) {
510 		if (!dso_l && !dso_r)
511 			return 0;
512 		else if (!dso_l)
513 			return -1;
514 		else
515 			return 1;
516 	}
517 
518 	return strcmp(dso_l->name, dso_r->name);
519 }
520 
521 static size_t
522 sort__dso_print(FILE *fp, struct hist_entry *self)
523 {
524 	if (self->dso)
525 		return fprintf(fp, "%-25s", self->dso->name);
526 
527 	return fprintf(fp, "%016llx         ", (u64)self->ip);
528 }
529 
530 static struct sort_entry sort_dso = {
531 	.header = "Shared Object            ",
532 	.cmp	= sort__dso_cmp,
533 	.print	= sort__dso_print,
534 };
535 
536 /* --sort symbol */
537 
538 static int64_t
539 sort__sym_cmp(struct hist_entry *left, struct hist_entry *right)
540 {
541 	u64 ip_l, ip_r;
542 
543 	if (left->sym == right->sym)
544 		return 0;
545 
546 	ip_l = left->sym ? left->sym->start : left->ip;
547 	ip_r = right->sym ? right->sym->start : right->ip;
548 
549 	return (int64_t)(ip_r - ip_l);
550 }
551 
552 static size_t
553 sort__sym_print(FILE *fp, struct hist_entry *self)
554 {
555 	size_t ret = 0;
556 
557 	if (verbose)
558 		ret += fprintf(fp, "%#018llx  ", (u64)self->ip);
559 
560 	if (self->sym) {
561 		ret += fprintf(fp, "[%c] %s",
562 			self->dso == kernel_dso ? 'k' : '.', self->sym->name);
563 	} else {
564 		ret += fprintf(fp, "%#016llx", (u64)self->ip);
565 	}
566 
567 	return ret;
568 }
569 
570 static struct sort_entry sort_sym = {
571 	.header = "Symbol",
572 	.cmp	= sort__sym_cmp,
573 	.print	= sort__sym_print,
574 };
575 
576 static int sort__need_collapse = 0;
577 
578 struct sort_dimension {
579 	char			*name;
580 	struct sort_entry	*entry;
581 	int			taken;
582 };
583 
584 static struct sort_dimension sort_dimensions[] = {
585 	{ .name = "pid",	.entry = &sort_thread,	},
586 	{ .name = "comm",	.entry = &sort_comm,	},
587 	{ .name = "dso",	.entry = &sort_dso,	},
588 	{ .name = "symbol",	.entry = &sort_sym,	},
589 };
590 
591 static LIST_HEAD(hist_entry__sort_list);
592 
593 static int sort_dimension__add(char *tok)
594 {
595 	unsigned int i;
596 
597 	for (i = 0; i < ARRAY_SIZE(sort_dimensions); i++) {
598 		struct sort_dimension *sd = &sort_dimensions[i];
599 
600 		if (sd->taken)
601 			continue;
602 
603 		if (strncasecmp(tok, sd->name, strlen(tok)))
604 			continue;
605 
606 		if (sd->entry->collapse)
607 			sort__need_collapse = 1;
608 
609 		list_add_tail(&sd->entry->list, &hist_entry__sort_list);
610 		sd->taken = 1;
611 
612 		return 0;
613 	}
614 
615 	return -ESRCH;
616 }
617 
618 static int64_t
619 hist_entry__cmp(struct hist_entry *left, struct hist_entry *right)
620 {
621 	struct sort_entry *se;
622 	int64_t cmp = 0;
623 
624 	list_for_each_entry(se, &hist_entry__sort_list, list) {
625 		cmp = se->cmp(left, right);
626 		if (cmp)
627 			break;
628 	}
629 
630 	return cmp;
631 }
632 
633 static int64_t
634 hist_entry__collapse(struct hist_entry *left, struct hist_entry *right)
635 {
636 	struct sort_entry *se;
637 	int64_t cmp = 0;
638 
639 	list_for_each_entry(se, &hist_entry__sort_list, list) {
640 		int64_t (*f)(struct hist_entry *, struct hist_entry *);
641 
642 		f = se->collapse ?: se->cmp;
643 
644 		cmp = f(left, right);
645 		if (cmp)
646 			break;
647 	}
648 
649 	return cmp;
650 }
651 
652 /*
653  * collect histogram counts
654  */
655 static void hist_hit(struct hist_entry *he, u64 ip)
656 {
657 	unsigned int sym_size, offset;
658 	struct symbol *sym = he->sym;
659 
660 	he->count++;
661 
662 	if (!sym || !sym->hist)
663 		return;
664 
665 	sym_size = sym->end - sym->start;
666 	offset = ip - sym->start;
667 
668 	if (offset >= sym_size)
669 		return;
670 
671 	sym->hist_sum++;
672 	sym->hist[offset]++;
673 
674 	if (verbose >= 3)
675 		printf("%p %s: count++ [ip: %p, %08Lx] => %Ld\n",
676 			(void *)(unsigned long)he->sym->start,
677 			he->sym->name,
678 			(void *)(unsigned long)ip, ip - he->sym->start,
679 			sym->hist[offset]);
680 }
681 
682 static int
683 hist_entry__add(struct thread *thread, struct map *map, struct dso *dso,
684 		struct symbol *sym, u64 ip, char level)
685 {
686 	struct rb_node **p = &hist.rb_node;
687 	struct rb_node *parent = NULL;
688 	struct hist_entry *he;
689 	struct hist_entry entry = {
690 		.thread	= thread,
691 		.map	= map,
692 		.dso	= dso,
693 		.sym	= sym,
694 		.ip	= ip,
695 		.level	= level,
696 		.count	= 1,
697 	};
698 	int cmp;
699 
700 	while (*p != NULL) {
701 		parent = *p;
702 		he = rb_entry(parent, struct hist_entry, rb_node);
703 
704 		cmp = hist_entry__cmp(&entry, he);
705 
706 		if (!cmp) {
707 			hist_hit(he, ip);
708 
709 			return 0;
710 		}
711 
712 		if (cmp < 0)
713 			p = &(*p)->rb_left;
714 		else
715 			p = &(*p)->rb_right;
716 	}
717 
718 	he = malloc(sizeof(*he));
719 	if (!he)
720 		return -ENOMEM;
721 	*he = entry;
722 	rb_link_node(&he->rb_node, parent, p);
723 	rb_insert_color(&he->rb_node, &hist);
724 
725 	return 0;
726 }
727 
/* Release an entry; only the entry itself is freed, not what it points to. */
static void hist_entry__free(struct hist_entry *he)
{
	struct hist_entry *victim = he;

	free(victim);
}
732 
733 /*
734  * collapse the histogram
735  */
736 
737 static struct rb_root collapse_hists;
738 
739 static void collapse__insert_entry(struct hist_entry *he)
740 {
741 	struct rb_node **p = &collapse_hists.rb_node;
742 	struct rb_node *parent = NULL;
743 	struct hist_entry *iter;
744 	int64_t cmp;
745 
746 	while (*p != NULL) {
747 		parent = *p;
748 		iter = rb_entry(parent, struct hist_entry, rb_node);
749 
750 		cmp = hist_entry__collapse(iter, he);
751 
752 		if (!cmp) {
753 			iter->count += he->count;
754 			hist_entry__free(he);
755 			return;
756 		}
757 
758 		if (cmp < 0)
759 			p = &(*p)->rb_left;
760 		else
761 			p = &(*p)->rb_right;
762 	}
763 
764 	rb_link_node(&he->rb_node, parent, p);
765 	rb_insert_color(&he->rb_node, &collapse_hists);
766 }
767 
768 static void collapse__resort(void)
769 {
770 	struct rb_node *next;
771 	struct hist_entry *n;
772 
773 	if (!sort__need_collapse)
774 		return;
775 
776 	next = rb_first(&hist);
777 	while (next) {
778 		n = rb_entry(next, struct hist_entry, rb_node);
779 		next = rb_next(&n->rb_node);
780 
781 		rb_erase(&n->rb_node, &hist);
782 		collapse__insert_entry(n);
783 	}
784 }
785 
786 /*
787  * reverse the map, sort on count.
788  */
789 
790 static struct rb_root output_hists;
791 
792 static void output__insert_entry(struct hist_entry *he)
793 {
794 	struct rb_node **p = &output_hists.rb_node;
795 	struct rb_node *parent = NULL;
796 	struct hist_entry *iter;
797 
798 	while (*p != NULL) {
799 		parent = *p;
800 		iter = rb_entry(parent, struct hist_entry, rb_node);
801 
802 		if (he->count > iter->count)
803 			p = &(*p)->rb_left;
804 		else
805 			p = &(*p)->rb_right;
806 	}
807 
808 	rb_link_node(&he->rb_node, parent, p);
809 	rb_insert_color(&he->rb_node, &output_hists);
810 }
811 
812 static void output__resort(void)
813 {
814 	struct rb_node *next;
815 	struct hist_entry *n;
816 	struct rb_root *tree = &hist;
817 
818 	if (sort__need_collapse)
819 		tree = &collapse_hists;
820 
821 	next = rb_first(tree);
822 
823 	while (next) {
824 		n = rb_entry(next, struct hist_entry, rb_node);
825 		next = rb_next(&n->rb_node);
826 
827 		rb_erase(&n->rb_node, tree);
828 		output__insert_entry(n);
829 	}
830 }
831 
/* Create the thread for pid 0 and name it "[idle]"; exits the program on failure. */
static void register_idle_thread(void)
{
	struct thread *idle = threads__findnew(0);

	if (idle != NULL && thread__set_comm(idle, "[idle]") == 0)
		return;

	fprintf(stderr, "problem inserting idle task.\n");
	exit(-1);
}
842 
/* Event counters, reported at the end of a raw trace dump. */
static unsigned long total = 0;
static unsigned long total_mmap = 0;
static unsigned long total_comm = 0;
static unsigned long total_fork = 0;
static unsigned long total_unknown = 0;
848 
849 static int
850 process_sample_event(event_t *event, unsigned long offset, unsigned long head)
851 {
852 	char level;
853 	int show = 0;
854 	struct dso *dso = NULL;
855 	struct thread *thread = threads__findnew(event->ip.pid);
856 	u64 ip = event->ip.ip;
857 	struct map *map = NULL;
858 
859 	dprintf("%p [%p]: PERF_EVENT (IP, %d): %d: %p\n",
860 		(void *)(offset + head),
861 		(void *)(long)(event->header.size),
862 		event->header.misc,
863 		event->ip.pid,
864 		(void *)(long)ip);
865 
866 	dprintf(" ... thread: %s:%d\n", thread->comm, thread->pid);
867 
868 	if (thread == NULL) {
869 		fprintf(stderr, "problem processing %d event, skipping it.\n",
870 			event->header.type);
871 		return -1;
872 	}
873 
874 	if (event->header.misc & PERF_EVENT_MISC_KERNEL) {
875 		show = SHOW_KERNEL;
876 		level = 'k';
877 
878 		dso = kernel_dso;
879 
880 		dprintf(" ...... dso: %s\n", dso->name);
881 
882 	} else if (event->header.misc & PERF_EVENT_MISC_USER) {
883 
884 		show = SHOW_USER;
885 		level = '.';
886 
887 		map = thread__find_map(thread, ip);
888 		if (map != NULL) {
889 			ip = map->map_ip(map, ip);
890 			dso = map->dso;
891 		} else {
892 			/*
893 			 * If this is outside of all known maps,
894 			 * and is a negative address, try to look it
895 			 * up in the kernel dso, as it might be a
896 			 * vsyscall (which executes in user-mode):
897 			 */
898 			if ((long long)ip < 0)
899 				dso = kernel_dso;
900 		}
901 		dprintf(" ...... dso: %s\n", dso ? dso->name : "<not found>");
902 
903 	} else {
904 		show = SHOW_HV;
905 		level = 'H';
906 		dprintf(" ...... dso: [hypervisor]\n");
907 	}
908 
909 	if (show & show_mask) {
910 		struct symbol *sym = NULL;
911 
912 		if (dso)
913 			sym = dso->find_symbol(dso, ip);
914 
915 		if (hist_entry__add(thread, map, dso, sym, ip, level)) {
916 			fprintf(stderr,
917 		"problem incrementing symbol count, skipping event\n");
918 			return -1;
919 		}
920 	}
921 	total++;
922 
923 	return 0;
924 }
925 
926 static int
927 process_mmap_event(event_t *event, unsigned long offset, unsigned long head)
928 {
929 	struct thread *thread = threads__findnew(event->mmap.pid);
930 	struct map *map = map__new(&event->mmap);
931 
932 	dprintf("%p [%p]: PERF_EVENT_MMAP %d: [%p(%p) @ %p]: %s\n",
933 		(void *)(offset + head),
934 		(void *)(long)(event->header.size),
935 		event->mmap.pid,
936 		(void *)(long)event->mmap.start,
937 		(void *)(long)event->mmap.len,
938 		(void *)(long)event->mmap.pgoff,
939 		event->mmap.filename);
940 
941 	if (thread == NULL || map == NULL) {
942 		dprintf("problem processing PERF_EVENT_MMAP, skipping event.\n");
943 		return 0;
944 	}
945 
946 	thread__insert_map(thread, map);
947 	total_mmap++;
948 
949 	return 0;
950 }
951 
952 static int
953 process_comm_event(event_t *event, unsigned long offset, unsigned long head)
954 {
955 	struct thread *thread = threads__findnew(event->comm.pid);
956 
957 	dprintf("%p [%p]: PERF_EVENT_COMM: %s:%d\n",
958 		(void *)(offset + head),
959 		(void *)(long)(event->header.size),
960 		event->comm.comm, event->comm.pid);
961 
962 	if (thread == NULL ||
963 	    thread__set_comm(thread, event->comm.comm)) {
964 		dprintf("problem processing PERF_EVENT_COMM, skipping event.\n");
965 		return -1;
966 	}
967 	total_comm++;
968 
969 	return 0;
970 }
971 
972 static int
973 process_fork_event(event_t *event, unsigned long offset, unsigned long head)
974 {
975 	struct thread *thread = threads__findnew(event->fork.pid);
976 	struct thread *parent = threads__findnew(event->fork.ppid);
977 
978 	dprintf("%p [%p]: PERF_EVENT_FORK: %d:%d\n",
979 		(void *)(offset + head),
980 		(void *)(long)(event->header.size),
981 		event->fork.pid, event->fork.ppid);
982 
983 	/*
984 	 * A thread clone will have the same PID for both
985 	 * parent and child.
986 	 */
987 	if (thread == parent)
988 		return 0;
989 
990 	if (!thread || !parent || thread__fork(thread, parent)) {
991 		dprintf("problem processing PERF_EVENT_FORK, skipping event.\n");
992 		return -1;
993 	}
994 	total_fork++;
995 
996 	return 0;
997 }
998 
999 static int
1000 process_event(event_t *event, unsigned long offset, unsigned long head)
1001 {
1002 	switch (event->header.type) {
1003 	case PERF_EVENT_SAMPLE:
1004 		return process_sample_event(event, offset, head);
1005 
1006 	case PERF_EVENT_MMAP:
1007 		return process_mmap_event(event, offset, head);
1008 
1009 	case PERF_EVENT_COMM:
1010 		return process_comm_event(event, offset, head);
1011 
1012 	case PERF_EVENT_FORK:
1013 		return process_fork_event(event, offset, head);
1014 	/*
1015 	 * We dont process them right now but they are fine:
1016 	 */
1017 
1018 	case PERF_EVENT_THROTTLE:
1019 	case PERF_EVENT_UNTHROTTLE:
1020 		return 0;
1021 
1022 	default:
1023 		return -1;
1024 	}
1025 
1026 	return 0;
1027 }
1028 
1029 static int
1030 parse_line(FILE *file, struct symbol *sym, u64 start, u64 len)
1031 {
1032 	char *line = NULL, *tmp, *tmp2;
1033 	static const char *prev_line;
1034 	static const char *prev_color;
1035 	unsigned int offset;
1036 	size_t line_len;
1037 	s64 line_ip;
1038 	int ret;
1039 	char *c;
1040 
1041 	if (getline(&line, &line_len, file) < 0)
1042 		return -1;
1043 	if (!line)
1044 		return -1;
1045 
1046 	c = strchr(line, '\n');
1047 	if (c)
1048 		*c = 0;
1049 
1050 	line_ip = -1;
1051 	offset = 0;
1052 	ret = -2;
1053 
1054 	/*
1055 	 * Strip leading spaces:
1056 	 */
1057 	tmp = line;
1058 	while (*tmp) {
1059 		if (*tmp != ' ')
1060 			break;
1061 		tmp++;
1062 	}
1063 
1064 	if (*tmp) {
1065 		/*
1066 		 * Parse hexa addresses followed by ':'
1067 		 */
1068 		line_ip = strtoull(tmp, &tmp2, 16);
1069 		if (*tmp2 != ':')
1070 			line_ip = -1;
1071 	}
1072 
1073 	if (line_ip != -1) {
1074 		const char *path = NULL;
1075 		unsigned int hits = 0;
1076 		double percent = 0.0;
1077 		char *color;
1078 		struct sym_ext *sym_ext = sym->priv;
1079 
1080 		offset = line_ip - start;
1081 		if (offset < len)
1082 			hits = sym->hist[offset];
1083 
1084 		if (offset < len && sym_ext) {
1085 			path = sym_ext[offset].path;
1086 			percent = sym_ext[offset].percent;
1087 		} else if (sym->hist_sum)
1088 			percent = 100.0 * hits / sym->hist_sum;
1089 
1090 		color = get_percent_color(percent);
1091 
1092 		/*
1093 		 * Also color the filename and line if needed, with
1094 		 * the same color than the percentage. Don't print it
1095 		 * twice for close colored ip with the same filename:line
1096 		 */
1097 		if (path) {
1098 			if (!prev_line || strcmp(prev_line, path)
1099 				       || color != prev_color) {
1100 				color_fprintf(stdout, color, " %s", path);
1101 				prev_line = path;
1102 				prev_color = color;
1103 			}
1104 		}
1105 
1106 		color_fprintf(stdout, color, " %7.2f", percent);
1107 		printf(" :	");
1108 		color_fprintf(stdout, PERF_COLOR_BLUE, "%s\n", line);
1109 	} else {
1110 		if (!*line)
1111 			printf("         :\n");
1112 		else
1113 			printf("         :	%s\n", line);
1114 	}
1115 
1116 	return 0;
1117 }
1118 
1119 static struct rb_root root_sym_ext;
1120 
1121 static void insert_source_line(struct sym_ext *sym_ext)
1122 {
1123 	struct sym_ext *iter;
1124 	struct rb_node **p = &root_sym_ext.rb_node;
1125 	struct rb_node *parent = NULL;
1126 
1127 	while (*p != NULL) {
1128 		parent = *p;
1129 		iter = rb_entry(parent, struct sym_ext, node);
1130 
1131 		if (sym_ext->percent > iter->percent)
1132 			p = &(*p)->rb_left;
1133 		else
1134 			p = &(*p)->rb_right;
1135 	}
1136 
1137 	rb_link_node(&sym_ext->node, parent, p);
1138 	rb_insert_color(&sym_ext->node, &root_sym_ext);
1139 }
1140 
1141 static void free_source_line(struct symbol *sym, int len)
1142 {
1143 	struct sym_ext *sym_ext = sym->priv;
1144 	int i;
1145 
1146 	if (!sym_ext)
1147 		return;
1148 
1149 	for (i = 0; i < len; i++)
1150 		free(sym_ext[i].path);
1151 	free(sym_ext);
1152 
1153 	sym->priv = NULL;
1154 	root_sym_ext = RB_ROOT;
1155 }
1156 
1157 /* Get the filename:line for the colored entries */
1158 static void
1159 get_source_line(struct symbol *sym, u64 start, int len, char *filename)
1160 {
1161 	int i;
1162 	char cmd[PATH_MAX * 2];
1163 	struct sym_ext *sym_ext;
1164 
1165 	if (!sym->hist_sum)
1166 		return;
1167 
1168 	sym->priv = calloc(len, sizeof(struct sym_ext));
1169 	if (!sym->priv)
1170 		return;
1171 
1172 	sym_ext = sym->priv;
1173 
1174 	for (i = 0; i < len; i++) {
1175 		char *path = NULL;
1176 		size_t line_len;
1177 		u64 offset;
1178 		FILE *fp;
1179 
1180 		sym_ext[i].percent = 100.0 * sym->hist[i] / sym->hist_sum;
1181 		if (sym_ext[i].percent <= 0.5)
1182 			continue;
1183 
1184 		offset = start + i;
1185 		sprintf(cmd, "addr2line -e %s %016llx", filename, offset);
1186 		fp = popen(cmd, "r");
1187 		if (!fp)
1188 			continue;
1189 
1190 		if (getline(&path, &line_len, fp) < 0 || !line_len)
1191 			goto next;
1192 
1193 		sym_ext[i].path = malloc(sizeof(char) * line_len + 1);
1194 		if (!sym_ext[i].path)
1195 			goto next;
1196 
1197 		strcpy(sym_ext[i].path, path);
1198 		insert_source_line(&sym_ext[i]);
1199 
1200 	next:
1201 		pclose(fp);
1202 	}
1203 }
1204 
1205 static void print_summary(char *filename)
1206 {
1207 	struct sym_ext *sym_ext;
1208 	struct rb_node *node;
1209 
1210 	printf("\nSorted summary for file %s\n", filename);
1211 	printf("----------------------------------------------\n\n");
1212 
1213 	if (RB_EMPTY_ROOT(&root_sym_ext)) {
1214 		printf(" Nothing higher than %1.1f%%\n", MIN_GREEN);
1215 		return;
1216 	}
1217 
1218 	node = rb_first(&root_sym_ext);
1219 	while (node) {
1220 		double percent;
1221 		char *color;
1222 		char *path;
1223 
1224 		sym_ext = rb_entry(node, struct sym_ext, node);
1225 		percent = sym_ext->percent;
1226 		color = get_percent_color(percent);
1227 		path = sym_ext->path;
1228 
1229 		color_fprintf(stdout, color, " %7.2f %s", percent, path);
1230 		node = rb_next(node);
1231 	}
1232 }
1233 
1234 static void annotate_sym(struct dso *dso, struct symbol *sym)
1235 {
1236 	char *filename = dso->name, *d_filename;
1237 	u64 start, end, len;
1238 	char command[PATH_MAX*2];
1239 	FILE *file;
1240 
1241 	if (!filename)
1242 		return;
1243 	if (sym->module)
1244 		filename = sym->module->path;
1245 	else if (dso == kernel_dso)
1246 		filename = vmlinux;
1247 
1248 	start = sym->obj_start;
1249 	if (!start)
1250 		start = sym->start;
1251 	if (full_paths)
1252 		d_filename = filename;
1253 	else
1254 		d_filename = basename(filename);
1255 
1256 	end = start + sym->end - sym->start + 1;
1257 	len = sym->end - sym->start;
1258 
1259 	if (print_line) {
1260 		get_source_line(sym, start, len, filename);
1261 		print_summary(filename);
1262 	}
1263 
1264 	printf("\n\n------------------------------------------------\n");
1265 	printf(" Percent |	Source code & Disassembly of %s\n", d_filename);
1266 	printf("------------------------------------------------\n");
1267 
1268 	if (verbose >= 2)
1269 		printf("annotating [%p] %30s : [%p] %30s\n", dso, dso->name, sym, sym->name);
1270 
1271 	sprintf(command, "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s",
1272 			(u64)start, (u64)end, filename, filename);
1273 
1274 	if (verbose >= 3)
1275 		printf("doing: %s\n", command);
1276 
1277 	file = popen(command, "r");
1278 	if (!file)
1279 		return;
1280 
1281 	while (!feof(file)) {
1282 		if (parse_line(file, sym, start, len) < 0)
1283 			break;
1284 	}
1285 
1286 	pclose(file);
1287 	if (print_line)
1288 		free_source_line(sym, len);
1289 }
1290 
1291 static void find_annotations(void)
1292 {
1293 	struct rb_node *nd;
1294 	struct dso *dso;
1295 	int count = 0;
1296 
1297 	list_for_each_entry(dso, &dsos, node) {
1298 
1299 		for (nd = rb_first(&dso->syms); nd; nd = rb_next(nd)) {
1300 			struct symbol *sym = rb_entry(nd, struct symbol, rb_node);
1301 
1302 			if (sym->hist) {
1303 				annotate_sym(dso, sym);
1304 				count++;
1305 			}
1306 		}
1307 	}
1308 
1309 	if (!count)
1310 		printf(" Error: symbol '%s' not present amongst the samples.\n", sym_hist_filter);
1311 }
1312 
1313 static int __cmd_annotate(void)
1314 {
1315 	int ret, rc = EXIT_FAILURE;
1316 	unsigned long offset = 0;
1317 	unsigned long head = 0;
1318 	struct stat stat;
1319 	event_t *event;
1320 	uint32_t size;
1321 	char *buf;
1322 
1323 	register_idle_thread();
1324 
1325 	input = open(input_name, O_RDONLY);
1326 	if (input < 0) {
1327 		perror("failed to open file");
1328 		exit(-1);
1329 	}
1330 
1331 	ret = fstat(input, &stat);
1332 	if (ret < 0) {
1333 		perror("failed to stat file");
1334 		exit(-1);
1335 	}
1336 
1337 	if (!stat.st_size) {
1338 		fprintf(stderr, "zero-sized file, nothing to do!\n");
1339 		exit(0);
1340 	}
1341 
1342 	if (load_kernel() < 0) {
1343 		perror("failed to load kernel symbols");
1344 		return EXIT_FAILURE;
1345 	}
1346 
1347 remap:
1348 	buf = (char *)mmap(NULL, page_size * mmap_window, PROT_READ,
1349 			   MAP_SHARED, input, offset);
1350 	if (buf == MAP_FAILED) {
1351 		perror("failed to mmap file");
1352 		exit(-1);
1353 	}
1354 
1355 more:
1356 	event = (event_t *)(buf + head);
1357 
1358 	size = event->header.size;
1359 	if (!size)
1360 		size = 8;
1361 
1362 	if (head + event->header.size >= page_size * mmap_window) {
1363 		unsigned long shift = page_size * (head / page_size);
1364 		int ret;
1365 
1366 		ret = munmap(buf, page_size * mmap_window);
1367 		assert(ret == 0);
1368 
1369 		offset += shift;
1370 		head -= shift;
1371 		goto remap;
1372 	}
1373 
1374 	size = event->header.size;
1375 
1376 	dprintf("%p [%p]: event: %d\n",
1377 			(void *)(offset + head),
1378 			(void *)(long)event->header.size,
1379 			event->header.type);
1380 
1381 	if (!size || process_event(event, offset, head) < 0) {
1382 
1383 		dprintf("%p [%p]: skipping unknown header type: %d\n",
1384 			(void *)(offset + head),
1385 			(void *)(long)(event->header.size),
1386 			event->header.type);
1387 
1388 		total_unknown++;
1389 
1390 		/*
1391 		 * assume we lost track of the stream, check alignment, and
1392 		 * increment a single u64 in the hope to catch on again 'soon'.
1393 		 */
1394 
1395 		if (unlikely(head & 7))
1396 			head &= ~7ULL;
1397 
1398 		size = 8;
1399 	}
1400 
1401 	head += size;
1402 
1403 	if (offset + head < (unsigned long)stat.st_size)
1404 		goto more;
1405 
1406 	rc = EXIT_SUCCESS;
1407 	close(input);
1408 
1409 	dprintf("      IP events: %10ld\n", total);
1410 	dprintf("    mmap events: %10ld\n", total_mmap);
1411 	dprintf("    comm events: %10ld\n", total_comm);
1412 	dprintf("    fork events: %10ld\n", total_fork);
1413 	dprintf(" unknown events: %10ld\n", total_unknown);
1414 
1415 	if (dump_trace)
1416 		return 0;
1417 
1418 	if (verbose >= 3)
1419 		threads__fprintf(stdout);
1420 
1421 	if (verbose >= 2)
1422 		dsos__fprintf(stdout);
1423 
1424 	collapse__resort();
1425 	output__resort();
1426 
1427 	find_annotations();
1428 
1429 	return rc;
1430 }
1431 
1432 static const char * const annotate_usage[] = {
1433 	"perf annotate [<options>] <command>",
1434 	NULL
1435 };
1436 
1437 static const struct option options[] = {
1438 	OPT_STRING('i', "input", &input_name, "file",
1439 		    "input file name"),
1440 	OPT_STRING('s', "symbol", &sym_hist_filter, "symbol",
1441 		    "symbol to annotate"),
1442 	OPT_BOOLEAN('v', "verbose", &verbose,
1443 		    "be more verbose (show symbol address, etc)"),
1444 	OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
1445 		    "dump raw trace in ASCII"),
1446 	OPT_STRING('k', "vmlinux", &vmlinux, "file", "vmlinux pathname"),
1447 	OPT_BOOLEAN('m', "modules", &modules,
1448 		    "load module symbols - WARNING: use only with -k and LIVE kernel"),
1449 	OPT_BOOLEAN('l', "print-line", &print_line,
1450 		    "print matching source lines (may be slow)"),
1451 	OPT_BOOLEAN('P', "full-paths", &full_paths,
1452 		    "Don't shorten the displayed pathnames"),
1453 	OPT_END()
1454 };
1455 
1456 static void setup_sorting(void)
1457 {
1458 	char *tmp, *tok, *str = strdup(sort_order);
1459 
1460 	for (tok = strtok_r(str, ", ", &tmp);
1461 			tok; tok = strtok_r(NULL, ", ", &tmp)) {
1462 		if (sort_dimension__add(tok) < 0) {
1463 			error("Unknown --sort key: `%s'", tok);
1464 			usage_with_options(annotate_usage, options);
1465 		}
1466 	}
1467 
1468 	free(str);
1469 }
1470 
1471 int cmd_annotate(int argc, const char **argv, const char *prefix __used)
1472 {
1473 	symbol__init();
1474 
1475 	page_size = getpagesize();
1476 
1477 	argc = parse_options(argc, argv, options, annotate_usage, 0);
1478 
1479 	setup_sorting();
1480 
1481 	if (argc) {
1482 		/*
1483 		 * Special case: if there's an argument left then assume tha
1484 		 * it's a symbol filter:
1485 		 */
1486 		if (argc > 1)
1487 			usage_with_options(annotate_usage, options);
1488 
1489 		sym_hist_filter = argv[0];
1490 	}
1491 
1492 	if (!sym_hist_filter)
1493 		usage_with_options(annotate_usage, options);
1494 
1495 	setup_pager();
1496 
1497 	return __cmd_annotate();
1498 }
1499