1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3 * Copyright (C) 2011, Red Hat Inc, Arnaldo Carvalho de Melo <acme@redhat.com>
4 *
5 * Parts came from builtin-annotate.c, see those files for further
6 * copyright notes.
7 */
8
9 #include <errno.h>
10 #include <inttypes.h>
11 #include <libgen.h>
12 #include <stdlib.h>
13 #include "util.h" // hex_width()
14 #include "ui/ui.h"
15 #include "sort.h"
16 #include "build-id.h"
17 #include "color.h"
18 #include "config.h"
19 #include "disasm.h"
20 #include "dso.h"
21 #include "env.h"
22 #include "map.h"
23 #include "maps.h"
24 #include "symbol.h"
25 #include "srcline.h"
26 #include "units.h"
27 #include "debug.h"
28 #include "debuginfo.h"
29 #include "annotate.h"
30 #include "annotate-data.h"
31 #include "evsel.h"
32 #include "evlist.h"
33 #include "bpf-event.h"
34 #include "bpf-utils.h"
35 #include "block-range.h"
36 #include "string2.h"
37 #include "dwarf-regs.h"
38 #include "util/event.h"
39 #include "util/sharded_mutex.h"
40 #include "arch/common.h"
41 #include "namespaces.h"
42 #include "thread.h"
43 #include "hashmap.h"
44 #include "strbuf.h"
45 #include <regex.h>
46 #include <linux/bitops.h>
47 #include <linux/kernel.h>
48 #include <linux/string.h>
49 #include <linux/zalloc.h>
50 #include <subcmd/parse-options.h>
51 #include <subcmd/run-command.h>
52 #include <math.h>
53
54 /* FIXME: For the HE_COLORSET */
55 #include "ui/browser.h"
56
/*
 * FIXME: Using the same values as slang.h,
 * but that header may not be available everywhere
 *
 * Each macro is a single byte standing in for an arrow glyph (left, right,
 * down, up, going by the names).
 * NOTE(review): the users of these macros are not visible here; confirm
 * which renderer interprets these bytes.
 */
#define LARROW_CHAR	((unsigned char)',')
#define RARROW_CHAR	((unsigned char)'+')
#define DARROW_CHAR	((unsigned char)'.')
#define UARROW_CHAR	((unsigned char)'-')
65
66 #include <linux/ctype.h>
67
/*
 * global annotation options
 *
 * symbol__annotate() hands a pointer to this object to the disassembler
 * through annotate_args.options, and insert_source_line() reads
 * annotate_opts.percent_type from it.
 */
struct annotation_options annotate_opts;

/* Data type collection debug statistics */
struct annotated_data_stat ann_data_stat;
/* List head defined here; NOTE(review): presumably per-instruction stats, confirm with users. */
LIST_HEAD(ann_insn_stat);
74
/*
 * Pseudo data types
 *
 * These two objects are recognised by address: annotation_line__print()
 * compares a returned type against &stackop_type and &canary_type and
 * skips printing the "+offset" part for them.
 */
struct annotated_data_type stackop_type = {
	.self = {
		.type_name = (char *)"(stack operation)",
		/* empty, self-referencing child list */
		.children = LIST_HEAD_INIT(stackop_type.self.children),
	},
};

struct annotated_data_type canary_type = {
	.self = {
		.type_name = (char *)"(stack canary)",
		/* empty, self-referencing child list */
		.children = LIST_HEAD_INIT(canary_type.self.children),
	},
};

/*
 * Sentinel pointer distinct from NULL; annotation_line__print() treats
 * both NULL and NO_TYPE as "no data type to print".
 */
#define NO_TYPE ((struct annotated_data_type *)-1UL)
91
/*
 * Hash callback for the per-symbol sample map.
 *
 * Keys are packed as (offset << 16 | evsel->core.idx); the hash simply adds
 * the two halves back together.  @ctx is unused.
 */
static size_t sym_hist_hash(long key, void *ctx __maybe_unused)
{
	const long offset_part = key >> 16;
	const long evidx_part = key & 0xffff;

	return offset_part + evidx_part;
}
97
/*
 * Equality callback for the per-symbol sample map: two packed keys match
 * only when they are numerically identical.  @ctx is unused.
 */
static bool sym_hist_equal(long key1, long key2, void *ctx __maybe_unused)
{
	if (key1 != key2)
		return false;

	return true;
}
102
annotated_source__new(void)103 static struct annotated_source *annotated_source__new(void)
104 {
105 struct annotated_source *src = zalloc(sizeof(*src));
106
107 if (src != NULL)
108 INIT_LIST_HEAD(&src->source);
109
110 return src;
111 }
112
annotated_source__delete(struct annotated_source * src)113 static __maybe_unused void annotated_source__delete(struct annotated_source *src)
114 {
115 struct hashmap_entry *cur;
116 size_t bkt;
117
118 if (src == NULL)
119 return;
120
121 if (src->samples) {
122 hashmap__for_each_entry(src->samples, cur, bkt)
123 zfree(&cur->pvalue);
124 hashmap__free(src->samples);
125 }
126 zfree(&src->histograms);
127 free(src);
128 }
129
annotated_source__alloc_histograms(struct annotated_source * src,int nr_hists)130 static int annotated_source__alloc_histograms(struct annotated_source *src,
131 int nr_hists)
132 {
133 src->nr_histograms = nr_hists;
134 src->histograms = calloc(nr_hists, sizeof(*src->histograms));
135
136 if (src->histograms == NULL)
137 return -1;
138
139 src->samples = hashmap__new(sym_hist_hash, sym_hist_equal, NULL);
140 if (src->samples == NULL)
141 zfree(&src->histograms);
142
143 return src->histograms ? 0 : -1;
144 }
145
symbol__annotate_zero_histograms(struct symbol * sym)146 void symbol__annotate_zero_histograms(struct symbol *sym)
147 {
148 struct annotation *notes = symbol__annotation(sym);
149
150 annotation__lock(notes);
151 if (notes->src != NULL) {
152 memset(notes->src->histograms, 0,
153 notes->src->nr_histograms * sizeof(*notes->src->histograms));
154 hashmap__clear(notes->src->samples);
155 }
156 if (notes->branch && notes->branch->cycles_hist) {
157 memset(notes->branch->cycles_hist, 0,
158 symbol__size(sym) * sizeof(struct cyc_hist));
159 }
160 annotation__unlock(notes);
161 }
162
/*
 * Account one cycle measurement to the histogram slot ch[@offset].
 *
 * @ch:         cycle histogram array, indexed by @offset
 * @start:      start of the basic block that ends at @offset; only
 *              meaningful when @have_start is non-zero
 * @offset:     slot to update
 * @cycles:     cycle count of this measurement
 * @have_start: non-zero when @start is valid
 *
 * Always returns 0.
 */
static int __symbol__account_cycles(struct cyc_hist *ch,
				    u64 start,
				    unsigned offset, unsigned cycles,
				    unsigned have_start)
{
	/*
	 * For now we can only account one basic block per
	 * final jump. But multiple could be overlapping.
	 * Always account the longest one. So when
	 * a shorter one has been already seen throw it away.
	 *
	 * We separately always account the full cycles.
	 */
	ch[offset].num_aggr++;
	ch[offset].cycles_aggr += cycles;

	if (cycles > ch[offset].cycles_max)
		ch[offset].cycles_max = cycles;

	/* Track the smallest non-zero value once a minimum has been set. */
	if (ch[offset].cycles_min) {
		if (cycles && cycles < ch[offset].cycles_min)
			ch[offset].cycles_min = cycles;
	} else
		ch[offset].cycles_min = cycles;

	/* A block with a known start is never replaced by one without. */
	if (!have_start && ch[offset].have_start)
		return 0;
	if (ch[offset].num) {
		if (have_start && (!ch[offset].have_start ||
				   ch[offset].start > start)) {
			/*
			 * The new block starts earlier (is longer) or is the
			 * first one with a start: drop what was recorded and
			 * count the reset, saturating at 0xffff.
			 */
			ch[offset].have_start = 0;
			ch[offset].cycles = 0;
			ch[offset].num = 0;
			if (ch[offset].reset < 0xffff)
				ch[offset].reset++;
		} else if (have_start &&
			   ch[offset].start < start)
			/* The new block is shorter than the recorded one: ignore it. */
			return 0;
	}

	/* Keep the first NUM_SPARKS individual measurements. */
	if (ch[offset].num < NUM_SPARKS)
		ch[offset].cycles_spark[ch[offset].num] = cycles;

	ch[offset].have_start = have_start;
	ch[offset].start = start;
	ch[offset].cycles += cycles;
	ch[offset].num++;
	return 0;
}
212
/*
 * Account one sample hitting @addr to the histogram of @ms->sym for @evsel.
 *
 * @ms:     map/symbol pair; @ms->sym must not be NULL
 * @src:    annotated source of the symbol, holding histograms and sample map
 * @evsel:  event the sample belongs to; evsel->core.idx is part of the map key
 * @addr:   sample address, compared against sym->start / sym->end
 * @sample: sample whose period is added
 *
 * Returns 0 on success, -ERANGE when @addr lies outside the symbol and
 * -ENOMEM when the histogram is missing or a map entry cannot be
 * allocated or inserted.
 */
static int __symbol__inc_addr_samples(struct map_symbol *ms,
				      struct annotated_source *src, struct evsel *evsel, u64 addr,
				      struct perf_sample *sample)
{
	struct symbol *sym = ms->sym;
	long hash_key;
	u64 offset;
	struct sym_hist *h;
	struct sym_hist_entry *entry;

	pr_debug3("%s: addr=%#" PRIx64 "\n", __func__, map__unmap_ip(ms->map, addr));

	/*
	 * Reject addresses outside [start, end); the second clause lets
	 * addr == start == end through for zero-sized symbols.
	 */
	if ((addr < sym->start || addr >= sym->end) &&
	    (addr != sym->end || sym->start != sym->end)) {
		pr_debug("%s(%d): ERANGE! sym->name=%s, start=%#" PRIx64 ", addr=%#" PRIx64 ", end=%#" PRIx64 "\n",
			 __func__, __LINE__, sym->name, sym->start, addr, sym->end);
		return -ERANGE;
	}

	offset = addr - sym->start;
	h = annotated_source__histogram(src, evsel);
	if (h == NULL) {
		pr_debug("%s(%d): ENOMEM! sym->name=%s, start=%#" PRIx64 ", addr=%#" PRIx64 ", end=%#" PRIx64 ", func: %d\n",
			 __func__, __LINE__, sym->name, sym->start, addr, sym->end, sym->type == STT_FUNC);
		return -ENOMEM;
	}

	/* Same packing as documented for sym_hist_hash(): offset << 16 | evidx */
	hash_key = offset << 16 | evsel->core.idx;
	if (!hashmap__find(src->samples, hash_key, &entry)) {
		entry = zalloc(sizeof(*entry));
		if (entry == NULL)
			return -ENOMEM;

		if (hashmap__add(src->samples, hash_key, entry) < 0) {
			/* Not stored in the map, so nobody else will free it. */
			free(entry);
			return -ENOMEM;
		}
	}

	/* Update both the per-event totals and the per-offset entry. */
	h->nr_samples++;
	h->period += sample->period;
	entry->nr_samples++;
	entry->period += sample->period;

	pr_debug3("%#" PRIx64 " %s: period++ [addr: %#" PRIx64 ", %#" PRIx64
		  ", evidx=%d] => nr_samples: %" PRIu64 ", period: %" PRIu64 "\n",
		  sym->start, sym->name, addr, addr - sym->start, evsel->core.idx,
		  entry->nr_samples, entry->period);
	return 0;
}
261
annotation__get_branch(struct annotation * notes)262 struct annotated_branch *annotation__get_branch(struct annotation *notes)
263 {
264 if (notes == NULL)
265 return NULL;
266
267 if (notes->branch == NULL)
268 notes->branch = zalloc(sizeof(*notes->branch));
269
270 return notes->branch;
271 }
272
symbol__find_branch_hist(struct symbol * sym,unsigned int br_cntr_nr)273 static struct annotated_branch *symbol__find_branch_hist(struct symbol *sym,
274 unsigned int br_cntr_nr)
275 {
276 struct annotation *notes = symbol__annotation(sym);
277 struct annotated_branch *branch;
278 const size_t size = symbol__size(sym);
279
280 branch = annotation__get_branch(notes);
281 if (branch == NULL)
282 return NULL;
283
284 if (branch->cycles_hist == NULL) {
285 branch->cycles_hist = calloc(size, sizeof(struct cyc_hist));
286 if (!branch->cycles_hist)
287 return NULL;
288 }
289
290 if (br_cntr_nr && branch->br_cntr == NULL) {
291 branch->br_cntr = calloc(br_cntr_nr * size, sizeof(u64));
292 if (!branch->br_cntr)
293 return NULL;
294 }
295
296 return branch;
297 }
298
symbol__hists(struct symbol * sym,int nr_hists)299 struct annotated_source *symbol__hists(struct symbol *sym, int nr_hists)
300 {
301 struct annotation *notes = symbol__annotation(sym);
302
303 if (notes->src == NULL) {
304 notes->src = annotated_source__new();
305 if (notes->src == NULL)
306 return NULL;
307 goto alloc_histograms;
308 }
309
310 if (notes->src->histograms == NULL) {
311 alloc_histograms:
312 annotated_source__alloc_histograms(notes->src, nr_hists);
313 }
314
315 return notes->src;
316 }
317
/*
 * Account @sample at @addr to @ms->sym, setting up the symbol's histograms
 * (one per evlist entry) if needed.
 *
 * Returns 0 when there is no symbol or no annotated source could be
 * obtained; otherwise the result of __symbol__inc_addr_samples().
 */
static int symbol__inc_addr_samples(struct map_symbol *ms,
				    struct evsel *evsel, u64 addr,
				    struct perf_sample *sample)
{
	struct annotated_source *src;

	if (ms->sym == NULL)
		return 0;

	src = symbol__hists(ms->sym, evsel->evlist->core.nr_entries);
	if (src == NULL)
		return 0;

	return __symbol__inc_addr_samples(ms, src, evsel, addr, sample);
}
330
/*
 * Add the branch counter values packed in @br_cntr to the counters kept
 * for @offset.
 *
 * @br_cntr holds the leader's br_cntr_nr fields of 'width' bits each
 * (width comes from perf_env__find_br_cntr_info()).  Each field is added
 * to its slot; a field equal to the all-ones mask additionally sets
 * ANNOTATION__BR_CNTR_SATURATED_FLAG on the slot.
 *
 * Always returns 0; nothing is done when @br_cntr is 0 or no counter
 * array has been allocated.
 */
static int symbol__account_br_cntr(struct annotated_branch *branch,
				   struct evsel *evsel,
				   unsigned offset,
				   u64 br_cntr)
{
	unsigned int br_cntr_nr = evsel__leader(evsel)->br_cntr_nr;
	unsigned int base = evsel__leader(evsel)->br_cntr_idx;
	unsigned int off = offset * evsel->evlist->nr_br_cntr;
	u64 *counters = branch->br_cntr;
	unsigned int idx, mask, width;

	if (br_cntr == 0 || counters == NULL)
		return 0;

	perf_env__find_br_cntr_info(evsel__env(evsel), NULL, &width);
	mask = (1L << width) - 1;

	for (idx = 0; idx < br_cntr_nr; idx++) {
		u64 *slot = &counters[off + idx + base];
		u64 cntr = (br_cntr >> idx * width) & mask;

		*slot += cntr;
		if (cntr == mask)
			*slot |= ANNOTATION__BR_CNTR_SATURATED_FLAG;
	}

	return 0;
}
357
/*
 * Account @cycles (and branch counters) for a branch at @addr within @sym.
 *
 * @addr:    address of the branch; must lie in [sym->start, sym->end)
 * @start:   start of the basic block, or 0 if unknown; a start at or
 *           beyond @addr is treated as unknown
 * @sym:     symbol being accounted; NULL is accepted and ignored
 * @cycles:  cycle count to account
 * @evsel:   event providing the branch counter layout
 * @br_cntr: packed branch counter values
 *
 * Returns 0 on success or when @sym is NULL, -ENOMEM when the branch
 * histogram cannot be allocated, -ERANGE when @addr or a non-zero @start
 * lies outside the symbol.
 */
static int symbol__account_cycles(u64 addr, u64 start, struct symbol *sym,
				  unsigned cycles, struct evsel *evsel,
				  u64 br_cntr)
{
	struct annotated_branch *branch;
	unsigned offset;
	u64 rel_start;
	int ret;

	if (!sym)
		return 0;

	branch = symbol__find_branch_hist(sym, evsel->evlist->nr_br_cntr);
	if (branch == NULL)
		return -ENOMEM;

	if (addr < sym->start || addr >= sym->end)
		return -ERANGE;

	if (start != 0) {
		if (start < sym->start || start >= sym->end)
			return -ERANGE;
		if (start >= addr)
			start = 0;
	}

	/* Everything below works on offsets relative to the symbol start. */
	offset = addr - sym->start;
	rel_start = start ? start - sym->start : 0;

	ret = __symbol__account_cycles(branch->cycles_hist, rel_start,
				       offset, cycles, !!start);
	if (ret != 0)
		return ret;

	return symbol__account_br_cntr(branch, evsel, offset, br_cntr);
}
391
/*
 * Account @cycles for the branch described by @ams, with @start (may be
 * NULL) describing where the basic block began.
 *
 * Returns 0 when @cycles is 0, otherwise the result of
 * symbol__account_cycles().
 */
int addr_map_symbol__account_cycles(struct addr_map_symbol *ams,
				    struct addr_map_symbol *start,
				    unsigned cycles,
				    struct evsel *evsel,
				    u64 br_cntr)
{
	struct symbol *sym;
	u64 saddr = 0;
	int err;

	if (cycles == 0)
		return 0;

	sym = ams->ms.sym;

	/*
	 * Only set start when IPC can be computed. We can only
	 * compute it when the basic block is completely in a single
	 * function.
	 * Special case the case when the jump is elsewhere, but
	 * it starts on the function start.
	 */
	if (start != NULL) {
		if (start->ms.sym == sym ||
		    (sym != NULL &&
		     start->addr == sym->start + map__start(ams->ms.map)))
			saddr = start->al_addr;
	}

	if (saddr == 0)
		pr_debug2("BB with bad start: addr %"PRIx64" start %"PRIx64" sym %"PRIx64" saddr %"PRIx64"\n",
			  ams->addr,
			  start ? start->addr : 0,
			  ams->ms.sym ? ams->ms.sym->start + map__start(ams->ms.map) : 0,
			  saddr);

	err = symbol__account_cycles(ams->al_addr, saddr, ams->ms.sym, cycles, evsel, br_cntr);
	if (err != 0)
		pr_debug2("account_cycles failed %d\n", err);

	return err;
}
427
/*
 * Linear search of src->source for the line whose ->offset equals @offset.
 *
 * Returns the first matching line, or NULL when there is none.
 */
struct annotation_line *annotated_source__get_line(struct annotated_source *src,
						   s64 offset)
{
	struct annotation_line *line;

	list_for_each_entry(line, &src->source, node) {
		if (line->offset != offset)
			continue;
		return line;
	}

	return NULL;
}
439
/*
 * Count the lines with a valid offset in [@start, @end], starting from the
 * line located exactly at @start.  Lines with offset -1 are skipped.
 *
 * Returns the count, or 0 when no line sits at @start.
 */
static unsigned annotation__count_insn(struct annotation *notes, u64 start, u64 end)
{
	struct annotation_line *al = annotated_source__get_line(notes->src, start);
	unsigned count = 0;

	if (!al)
		return 0;

	list_for_each_entry_from(al, &notes->src->source, node) {
		if (al->offset != -1) {
			if ((u64)al->offset > end)
				break;
			count++;
		}
	}

	return count;
}
458
annotated_branch__delete(struct annotated_branch * branch)459 static void annotated_branch__delete(struct annotated_branch *branch)
460 {
461 if (branch) {
462 zfree(&branch->cycles_hist);
463 free(branch->br_cntr);
464 free(branch);
465 }
466 }
467
/*
 * Compute the IPC of the basic block [@start, @end] from @ch and store it
 * in every line of the block that has cycle data but no IPC yet.  When at
 * least one line was filled, the block is also added to the branch
 * coverage totals (hit_cycles, hit_insn, cover_insn).
 *
 * Nothing is done when the block has no instructions or no cycle data,
 * when it was reset too often (ch->reset >= 0x7fff), or when no line sits
 * at @start.
 */
static void annotation__count_and_fill(struct annotation *notes, u64 start, u64 end, struct cyc_hist *ch)
{
	unsigned int cover_insn = 0;
	struct annotated_branch *branch;
	struct annotation_line *al;
	unsigned n_insn;
	float ipc;

	n_insn = annotation__count_insn(notes, start, end);
	if (!n_insn || !ch->num || !ch->cycles)
		return;

	/* Hide data when there are too many overlaps. */
	if (ch->reset >= 0x7fff)
		return;

	al = annotated_source__get_line(notes->src, start);
	if (al == NULL)
		return;

	/* instructions / average cycles per execution of the block */
	ipc = n_insn / ((double)ch->cycles / (double)ch->num);

	list_for_each_entry_from(al, &notes->src->source, node) {
		if (al->offset == -1)
			continue;
		if ((u64)al->offset > end)
			break;
		if (al->cycles && al->cycles->ipc == 0.0) {
			al->cycles->ipc = ipc;
			cover_insn++;
		}
	}

	branch = annotation__get_branch(notes);
	if (cover_insn && branch) {
		branch->hit_cycles += ch->cycles;
		branch->hit_insn += n_insn * ch->num;
		branch->cover_insn += cover_insn;
	}
}
506
/*
 * Transfer the per-offset cycle histogram of @notes->branch into the
 * annotation lines: per-line cycle statistics (avg/max/min), IPC for basic
 * blocks with a known start, and a copy of the branch counters.
 *
 * @notes: annotation whose lines are updated
 * @size:  number of slots in the cycles histogram (offsets 0..size-1)
 * @evsel: event recorded in each line; also provides nr_br_cntr
 *
 * Always returns 0.
 * NOTE(review): 'err' is set to ENOMEM on allocation failure but is only
 * used to trigger the cleanup loop; it is never returned, so callers
 * cannot see the failure — confirm this is intended.
 */
static int annotation__compute_ipc(struct annotation *notes, size_t size,
				   struct evsel *evsel)
{
	unsigned int br_cntr_nr = evsel->evlist->nr_br_cntr;
	int err = 0;
	s64 offset;

	if (!notes->branch || !notes->branch->cycles_hist)
		return 0;

	/* Restart the coverage totals; count_and_fill() accumulates into them. */
	notes->branch->total_insn = annotation__count_insn(notes, 0, size - 1);
	notes->branch->hit_cycles = 0;
	notes->branch->hit_insn = 0;
	notes->branch->cover_insn = 0;

	annotation__lock(notes);
	/* Walk the histogram from the last offset down to 0. */
	for (offset = size - 1; offset >= 0; --offset) {
		struct cyc_hist *ch;

		ch = &notes->branch->cycles_hist[offset];
		if (ch && ch->cycles) {
			struct annotation_line *al;

			al = annotated_source__get_line(notes->src, offset);
			if (al && al->cycles == NULL) {
				al->cycles = zalloc(sizeof(*al->cycles));
				if (al->cycles == NULL) {
					err = ENOMEM;
					break;
				}
			}
			if (ch->have_start)
				annotation__count_and_fill(notes, ch->start, offset, ch);
			if (al && ch->num_aggr) {
				al->cycles->avg = ch->cycles_aggr / ch->num_aggr;
				al->cycles->max = ch->cycles_max;
				al->cycles->min = ch->cycles_min;
			}
			if (al && notes->branch->br_cntr) {
				if (!al->br_cntr) {
					al->br_cntr = calloc(br_cntr_nr, sizeof(u64));
					if (!al->br_cntr) {
						err = ENOMEM;
						break;
					}
				}
				al->num_aggr = ch->num_aggr;
				al->br_cntr_nr = br_cntr_nr;
				al->evsel = evsel;
				/* Copy this offset's br_cntr_nr counters into the line. */
				memcpy(al->br_cntr, &notes->branch->br_cntr[offset * br_cntr_nr],
				       br_cntr_nr * sizeof(u64));
			}
		}
	}

	if (err) {
		/*
		 * Undo what was set up for the offsets already processed.
		 * The pre-increment starts one past the offset where the
		 * allocation failed.
		 * NOTE(review): the failing offset itself is skipped, so an
		 * al->cycles allocated there just before a failed br_cntr
		 * allocation is left in place — confirm this is acceptable.
		 */
		while (++offset < (s64)size) {
			struct cyc_hist *ch = &notes->branch->cycles_hist[offset];

			if (ch && ch->cycles) {
				struct annotation_line *al;

				al = annotated_source__get_line(notes->src, offset);
				if (al) {
					zfree(&al->cycles);
					zfree(&al->br_cntr);
				}
			}
		}
	}

	annotation__unlock(notes);
	return 0;
}
581
addr_map_symbol__inc_samples(struct addr_map_symbol * ams,struct perf_sample * sample,struct evsel * evsel)582 int addr_map_symbol__inc_samples(struct addr_map_symbol *ams, struct perf_sample *sample,
583 struct evsel *evsel)
584 {
585 return symbol__inc_addr_samples(&ams->ms, evsel, ams->al_addr, sample);
586 }
587
/*
 * Account @sample for @evsel at address @ip against the symbol of the
 * hist entry @he (he->ms).
 *
 * Returns the result of symbol__inc_addr_samples().
 */
int hist_entry__inc_addr_samples(struct hist_entry *he, struct perf_sample *sample,
				 struct evsel *evsel, u64 ip)
{
	struct map_symbol *ms = &he->ms;

	return symbol__inc_addr_samples(ms, evsel, ip, sample);
}
593
594
annotation__exit(struct annotation * notes)595 void annotation__exit(struct annotation *notes)
596 {
597 annotated_source__delete(notes->src);
598 annotated_branch__delete(notes->branch);
599 }
600
601 static struct sharded_mutex *sharded_mutex;
602
annotation__init_sharded_mutex(void)603 static void annotation__init_sharded_mutex(void)
604 {
605 /* As many mutexes as there are CPUs. */
606 sharded_mutex = sharded_mutex__new(cpu__max_present_cpu().cpu);
607 }
608
/* Hash an annotation by its address; used to pick a mutex shard. */
static size_t annotation__hash(const struct annotation *notes)
{
	const size_t hash = (size_t)notes;

	return hash;
}
613
annotation__get_mutex(const struct annotation * notes)614 static struct mutex *annotation__get_mutex(const struct annotation *notes)
615 {
616 static pthread_once_t once = PTHREAD_ONCE_INIT;
617
618 pthread_once(&once, annotation__init_sharded_mutex);
619 if (!sharded_mutex)
620 return NULL;
621
622 return sharded_mutex__get_mutex(sharded_mutex, annotation__hash(notes));
623 }
624
annotation__lock(struct annotation * notes)625 void annotation__lock(struct annotation *notes)
626 NO_THREAD_SAFETY_ANALYSIS
627 {
628 struct mutex *mutex = annotation__get_mutex(notes);
629
630 if (mutex)
631 mutex_lock(mutex);
632 }
633
annotation__unlock(struct annotation * notes)634 void annotation__unlock(struct annotation *notes)
635 NO_THREAD_SAFETY_ANALYSIS
636 {
637 struct mutex *mutex = annotation__get_mutex(notes);
638
639 if (mutex)
640 mutex_unlock(mutex);
641 }
642
/*
 * Try to take the mutex that guards @notes without blocking.
 *
 * Returns the result of mutex_trylock(), or false when no mutex is
 * available.
 */
bool annotation__trylock(struct annotation *notes)
{
	struct mutex *mutex = annotation__get_mutex(notes);

	return mutex ? mutex_trylock(mutex) : false;
}
652
annotation_line__add(struct annotation_line * al,struct list_head * head)653 void annotation_line__add(struct annotation_line *al, struct list_head *head)
654 {
655 list_add_tail(&al->node, head);
656 }
657
658 struct annotation_line *
annotation_line__next(struct annotation_line * pos,struct list_head * head)659 annotation_line__next(struct annotation_line *pos, struct list_head *head)
660 {
661 list_for_each_entry_continue(pos, head, node)
662 if (pos->offset >= 0)
663 return pos;
664
665 return NULL;
666 }
667
annotate__address_color(struct block_range * br)668 static const char *annotate__address_color(struct block_range *br)
669 {
670 double cov = block_range__coverage(br);
671
672 if (cov >= 0) {
673 /* mark red for >75% coverage */
674 if (cov > 0.75)
675 return PERF_COLOR_RED;
676
677 /* mark dull for <1% coverage */
678 if (cov < 0.01)
679 return PERF_COLOR_NORMAL;
680 }
681
682 return PERF_COLOR_MAGENTA;
683 }
684
annotate__asm_color(struct block_range * br)685 static const char *annotate__asm_color(struct block_range *br)
686 {
687 double cov = block_range__coverage(br);
688
689 if (cov >= 0) {
690 /* mark dull for <1% coverage */
691 if (cov < 0.01)
692 return PERF_COLOR_NORMAL;
693 }
694
695 return PERF_COLOR_BLUE;
696 }
697
/*
 * Print branch statistics for @addr as a trailing "\t# ..." comment.
 *
 * When @addr is the start of a branch-target range, print the share of
 * coverage entering here relative to the next branch range.  When @addr is
 * the end of a branch range, print the share of coverage leaving through
 * it together with its prediction ratio.  Values of 0.1% or less are
 * omitted, and the "\t#" prefix is printed at most once.
 *
 * NOTE(review): the search for the matching branch does not check the
 * result of block_range__next(); if that can return NULL before a branch
 * range is found, this dereferences NULL — confirm against block-range.h.
 */
static void annotate__branch_printf(struct block_range *br, u64 addr)
{
	bool need_prefix = true;

	if (br == NULL)
		return;

#if 1
	if (br->is_target && br->start == addr) {
		struct block_range *branch;
		double pct;

		/*
		 * Find matching branch to our target.
		 */
		for (branch = br; !branch->is_branch; )
			branch = block_range__next(branch);

		pct = 100 * (double)br->entry / branch->coverage;
		if (pct > 0.1) {
			if (need_prefix) {
				need_prefix = false;
				printf("\t#");
			}

			/*
			 * The percentage of coverage joined at this target in relation
			 * to the next branch.
			 */
			printf(" +%.2f%%", pct);
		}
	}
#endif
	if (br->is_branch && br->end == addr) {
		const double pct = 100 * (double)br->taken / br->coverage;

		if (pct > 0.1) {
			if (need_prefix) {
				need_prefix = false;
				printf("\t#");
			}

			/*
			 * The percentage of coverage leaving at this branch, and
			 * its prediction ratio.
			 */
			printf(" -%.2f%% (p:%.2f%%)", pct, 100 * (double)br->pred / br->taken);
		}
	}
}
749
/*
 * Print the address and text of one disassembly line to stdout, coloured
 * by the coverage of the block range containing it, followed by any
 * branch statistics.
 *
 * @dl:             line to print
 * @start:          base address added to the line's offset
 * @addr_fmt_width: field width used for the address
 *
 * Always returns 0.
 */
static int disasm_line__print(struct disasm_line *dl, u64 start, int addr_fmt_width)
{
	const u64 addr = start + dl->al.offset;
	struct block_range *br = block_range__find(addr);
	const char *addr_color = annotate__address_color(br);

	color_fprintf(stdout, addr_color, " %*" PRIx64 ":", addr_fmt_width, addr);
	color_fprintf(stdout, annotate__asm_color(br), "%s", dl->al.line);
	annotate__branch_printf(br, addr);

	return 0;
}
762
/*
 * Forward declaration: annotation_line__print() calls this before its
 * definition.  It yields the data type for a disassembly line (or NULL /
 * NO_TYPE, both of which the caller treats as "nothing to print") and
 * stores an offset within that type through @type_offset.
 */
static struct annotated_data_type *
__hist_entry__get_data_type(struct hist_entry *he, struct arch *arch,
			    struct debuginfo *dbg, struct disasm_line *dl,
			    int *type_offset);
767
/* Per-symbol context handed to annotation_line__print(). */
struct annotation_print_data {
	struct hist_entry *he;		/* entry being annotated; he->ms.sym is the symbol */
	struct evsel *evsel;		/* NOTE(review): not read by the visible code; presumably the event being printed */
	struct arch *arch;		/* passed on to __hist_entry__get_data_type() */
	struct debuginfo *dbg;		/* data-type output is skipped when NULL */
	u64 start;			/* base address added to each line offset */
	int addr_fmt_width;		/* field width for addresses and line numbers */
};
776
/*
 * Print one annotation line to stdout.
 *
 * @al:      line to print
 * @apd:     per-symbol print context
 * @opts:    options; min_pcnt, max_lines, percent_type and code_with_type
 *           are read here
 * @printed: number of lines printed so far, checked against max_lines
 * @queue:   when non-NULL, first line of a run of pending lines that is
 *           printed ahead of @al
 *
 * Returns 0 when the line was printed, 1 when max_lines has been reached,
 * and -1 when the line was skipped (its highest percentage is below
 * min_pcnt, or it has no offset while @queue is set).
 */
static int
annotation_line__print(struct annotation_line *al, struct annotation_print_data *apd,
		       struct annotation_options *opts, int printed,
		       struct annotation_line *queue)
{
	struct symbol *sym = apd->he->ms.sym;
	struct disasm_line *dl = container_of(al, struct disasm_line, al);
	struct annotation *notes = symbol__annotation(sym);
	/* Last path printed; kept across calls to avoid repeating it. */
	static const char *prev_line;
	int max_lines = opts->max_lines;
	int percent_type = opts->percent_type;

	if (al->offset != -1) {
		double max_percent = 0.0;
		int i, nr_percent = 1;
		const char *color;

		/* The highest percentage over all events decides filtering. */
		for (i = 0; i < al->data_nr; i++) {
			double percent;

			percent = annotation_data__percent(&al->data[i],
							   percent_type);

			if (percent > max_percent)
				max_percent = percent;
		}

		/* At least one percentage column is always printed. */
		if (al->data_nr > nr_percent)
			nr_percent = al->data_nr;

		if (max_percent < opts->min_pcnt)
			return -1;

		if (max_lines && printed >= max_lines)
			return 1;

		if (queue != NULL) {
			/*
			 * Print the pending lines up to (not including) @al,
			 * each with its own one-line limit and no queue.
			 */
			struct annotation_options queue_opts = {
				.max_lines = 1,
				.percent_type = percent_type,
			};

			list_for_each_entry_from(queue, &notes->src->source, node) {
				if (queue == al)
					break;
				annotation_line__print(queue, apd, &queue_opts,
						       /*printed=*/0, /*queue=*/NULL);
			}
		}

		color = get_percent_color(max_percent);

		for (i = 0; i < nr_percent; i++) {
			struct annotation_data *data = &al->data[i];
			double percent;

			percent = annotation_data__percent(data, percent_type);
			/* Each column uses its own colour; the last one is reused for the path below. */
			color = get_percent_color(percent);

			if (symbol_conf.show_total_period)
				color_fprintf(stdout, color, " %11" PRIu64,
					      data->he.period);
			else if (symbol_conf.show_nr_samples)
				color_fprintf(stdout, color, " %7" PRIu64,
					      data->he.nr_samples);
			else
				color_fprintf(stdout, color, " %7.2f", percent);
		}

		printf(" : ");

		disasm_line__print(dl, apd->start, apd->addr_fmt_width);

		if (opts->code_with_type && apd->dbg) {
			struct annotated_data_type *data_type;
			int offset = 0;

			data_type = __hist_entry__get_data_type(apd->he, apd->arch,
								apd->dbg, dl, &offset);
			if (data_type && data_type != NO_TYPE) {
				char buf[4096];

				printf("\t\t# data-type: %s",
				       data_type->self.type_name);

				/* No offset is printed for the pseudo types. */
				if (data_type != &stackop_type &&
				    data_type != &canary_type)
					printf(" +%#x", offset);

				if (annotated_data_type__get_member_name(data_type,
									 buf,
									 sizeof(buf),
									 offset))
					printf(" (%s)", buf);
			}
		}

		/*
		 * Also color the filename and line if needed, with
		 * the same color than the percentage. Don't print it
		 * twice for close colored addr with the same filename:line
		 */
		if (al->path) {
			if (!prev_line || strcmp(prev_line, al->path)) {
				color_fprintf(stdout, color, " // %s", al->path);
				prev_line = al->path;
			}
		}

		printf("\n");
	} else if (max_lines && printed >= max_lines)
		return 1;
	else {
		/* Line without an offset: print its line number and text only. */
		int width = annotation__pcnt_width(notes);

		/* Such lines are never printed while a queue is pending. */
		if (queue)
			return -1;

		if (!*al->line)
			printf(" %*s:\n", width, " ");
		else
			printf(" %*s: %-*d %s\n", width, " ", apd->addr_fmt_width,
			       al->line_nr, al->line);
	}

	return 0;
}
904
/*
 * Sum the samples and period recorded for @evsel at offsets
 * [@offset, @end) and turn them into the four percentages kept in @data
 * (hits/period, each relative to the symbol and to the whole event).
 *
 * A percentage is only written when its denominator is non-zero;
 * data->he is only written when the symbol histogram has samples.
 */
static void calc_percent(struct annotation *notes,
			 struct evsel *evsel,
			 struct annotation_data *data,
			 s64 offset, s64 end)
{
	struct hists *hists = evsel__hists(evsel);
	struct sym_hist *sym_hist = annotation__histogram(notes, evsel);
	unsigned int hits = 0;
	u64 period = 0;

	for (; offset < end; ++offset) {
		struct sym_hist_entry *entry;

		entry = annotated_source__hist_entry(notes->src, evsel, offset);
		if (entry == NULL)
			continue;

		hits += entry->nr_samples;
		period += entry->period;
	}

	if (sym_hist->nr_samples) {
		data->he.period = period;
		data->he.nr_samples = hits;
		data->percent[PERCENT_HITS_LOCAL] = 100.0 * hits / sym_hist->nr_samples;
	}

	if (hists->stats.nr_non_filtered_samples)
		data->percent[PERCENT_HITS_GLOBAL] = 100.0 * hits / hists->stats.nr_non_filtered_samples;

	if (sym_hist->period)
		data->percent[PERCENT_PERIOD_LOCAL] = 100.0 * period / sym_hist->period;

	if (hists->stats.total_period)
		data->percent[PERCENT_PERIOD_GLOBAL] = 100.0 * period / hists->stats.total_period;
}
941
/*
 * Fill in the percentages of every line that has an offset, for each
 * event of @leader's group.
 *
 * A line covers the offsets from its own up to the next line with a valid
 * offset, or up to @len for the last one.  Events without samples are
 * skipped when symbol_conf.skip_empty is set and do not consume a data
 * slot.
 */
static void annotation__calc_percent(struct annotation *notes,
				     struct evsel *leader, s64 len)
{
	struct annotation_line *al;

	list_for_each_entry(al, &notes->src->source, node) {
		struct annotation_line *next;
		struct evsel *evsel;
		int slot = 0;
		s64 end;

		if (al->offset == -1)
			continue;

		next = annotation_line__next(al, &notes->src->source);
		end = next ? next->offset : len;

		for_each_group_evsel(evsel, leader) {
			BUG_ON(slot >= al->data_nr);

			if (symbol_conf.skip_empty &&
			    evsel__hists(evsel)->stats.nr_samples == 0)
				continue;

			calc_percent(notes, evsel, &al->data[slot++], al->offset, end);
		}
	}
}
973
symbol__calc_percent(struct symbol * sym,struct evsel * evsel)974 void symbol__calc_percent(struct symbol *sym, struct evsel *evsel)
975 {
976 struct annotation *notes = symbol__annotation(sym);
977
978 annotation__calc_percent(notes, evsel, symbol__size(sym));
979 }
980
evsel__get_arch(struct evsel * evsel,struct arch ** parch)981 static int evsel__get_arch(struct evsel *evsel, struct arch **parch)
982 {
983 struct perf_env *env = evsel__env(evsel);
984 const char *arch_name = perf_env__arch(env);
985 struct arch *arch;
986 int err;
987
988 if (!arch_name) {
989 *parch = NULL;
990 return errno;
991 }
992
993 *parch = arch = arch__find(arch_name);
994 if (arch == NULL) {
995 pr_err("%s: unsupported arch %s\n", __func__, arch_name);
996 return ENOTSUP;
997 }
998
999 if (arch->init) {
1000 err = arch->init(arch, env ? env->cpuid : NULL);
1001 if (err) {
1002 pr_err("%s: failed to initialize %s arch priv area\n",
1003 __func__, arch->name);
1004 return err;
1005 }
1006 }
1007 return 0;
1008 }
1009
symbol__annotate(struct map_symbol * ms,struct evsel * evsel,struct arch ** parch)1010 int symbol__annotate(struct map_symbol *ms, struct evsel *evsel,
1011 struct arch **parch)
1012 {
1013 struct symbol *sym = ms->sym;
1014 struct annotation *notes = symbol__annotation(sym);
1015 struct annotate_args args = {
1016 .evsel = evsel,
1017 .options = &annotate_opts,
1018 };
1019 struct arch *arch = NULL;
1020 int err, nr;
1021
1022 err = evsel__get_arch(evsel, &arch);
1023 if (err < 0)
1024 return err;
1025
1026 if (parch)
1027 *parch = arch;
1028
1029 if (notes->src && !list_empty(¬es->src->source))
1030 return 0;
1031
1032 args.arch = arch;
1033 args.ms = *ms;
1034
1035 if (notes->src == NULL) {
1036 notes->src = annotated_source__new();
1037 if (notes->src == NULL)
1038 return -1;
1039 }
1040
1041 nr = 0;
1042 if (evsel__is_group_event(evsel)) {
1043 struct evsel *pos;
1044
1045 for_each_group_evsel(pos, evsel) {
1046 if (symbol_conf.skip_empty &&
1047 evsel__hists(pos)->stats.nr_samples == 0)
1048 continue;
1049 nr++;
1050 }
1051 }
1052 notes->src->nr_events = nr ? nr : 1;
1053
1054 if (annotate_opts.full_addr)
1055 notes->src->start = map__objdump_2mem(ms->map, ms->sym->start);
1056 else
1057 notes->src->start = map__rip_2objdump(ms->map, ms->sym->start);
1058
1059 return symbol__disassemble(sym, &args);
1060 }
1061
insert_source_line(struct rb_root * root,struct annotation_line * al)1062 static void insert_source_line(struct rb_root *root, struct annotation_line *al)
1063 {
1064 struct annotation_line *iter;
1065 struct rb_node **p = &root->rb_node;
1066 struct rb_node *parent = NULL;
1067 unsigned int percent_type = annotate_opts.percent_type;
1068 int i, ret;
1069
1070 while (*p != NULL) {
1071 parent = *p;
1072 iter = rb_entry(parent, struct annotation_line, rb_node);
1073
1074 ret = strcmp(iter->path, al->path);
1075 if (ret == 0) {
1076 for (i = 0; i < al->data_nr; i++) {
1077 iter->data[i].percent_sum += annotation_data__percent(&al->data[i],
1078 percent_type);
1079 }
1080 return;
1081 }
1082
1083 if (ret < 0)
1084 p = &(*p)->rb_left;
1085 else
1086 p = &(*p)->rb_right;
1087 }
1088
1089 for (i = 0; i < al->data_nr; i++) {
1090 al->data[i].percent_sum = annotation_data__percent(&al->data[i],
1091 percent_type);
1092 }
1093
1094 rb_link_node(&al->rb_node, parent, p);
1095 rb_insert_color(&al->rb_node, root);
1096 }
1097
cmp_source_line(struct annotation_line * a,struct annotation_line * b)1098 static int cmp_source_line(struct annotation_line *a, struct annotation_line *b)
1099 {
1100 int i;
1101
1102 for (i = 0; i < a->data_nr; i++) {
1103 if (a->data[i].percent_sum == b->data[i].percent_sum)
1104 continue;
1105 return a->data[i].percent_sum > b->data[i].percent_sum;
1106 }
1107
1108 return 0;
1109 }
1110
__resort_source_line(struct rb_root * root,struct annotation_line * al)1111 static void __resort_source_line(struct rb_root *root, struct annotation_line *al)
1112 {
1113 struct annotation_line *iter;
1114 struct rb_node **p = &root->rb_node;
1115 struct rb_node *parent = NULL;
1116
1117 while (*p != NULL) {
1118 parent = *p;
1119 iter = rb_entry(parent, struct annotation_line, rb_node);
1120
1121 if (cmp_source_line(al, iter))
1122 p = &(*p)->rb_left;
1123 else
1124 p = &(*p)->rb_right;
1125 }
1126
1127 rb_link_node(&al->rb_node, parent, p);
1128 rb_insert_color(&al->rb_node, root);
1129 }
1130
resort_source_line(struct rb_root * dest_root,struct rb_root * src_root)1131 static void resort_source_line(struct rb_root *dest_root, struct rb_root *src_root)
1132 {
1133 struct annotation_line *al;
1134 struct rb_node *node;
1135
1136 node = rb_first(src_root);
1137 while (node) {
1138 struct rb_node *next;
1139
1140 al = rb_entry(node, struct annotation_line, rb_node);
1141 next = rb_next(node);
1142 rb_erase(node, src_root);
1143
1144 __resort_source_line(dest_root, al);
1145 node = next;
1146 }
1147 }
1148
print_summary(struct rb_root * root,const char * filename)1149 static void print_summary(struct rb_root *root, const char *filename)
1150 {
1151 struct annotation_line *al;
1152 struct rb_node *node;
1153
1154 printf("\nSorted summary for file %s\n", filename);
1155 printf("----------------------------------------------\n\n");
1156
1157 if (RB_EMPTY_ROOT(root)) {
1158 printf(" Nothing higher than %1.1f%%\n", MIN_GREEN);
1159 return;
1160 }
1161
1162 node = rb_first(root);
1163 while (node) {
1164 double percent, percent_max = 0.0;
1165 const char *color;
1166 char *path;
1167 int i;
1168
1169 al = rb_entry(node, struct annotation_line, rb_node);
1170 for (i = 0; i < al->data_nr; i++) {
1171 percent = al->data[i].percent_sum;
1172 color = get_percent_color(percent);
1173 color_fprintf(stdout, color, " %7.2f", percent);
1174
1175 if (percent > percent_max)
1176 percent_max = percent;
1177 }
1178
1179 path = al->path;
1180 color = get_percent_color(percent_max);
1181 color_fprintf(stdout, color, " %s\n", path);
1182
1183 node = rb_next(node);
1184 }
1185 }
1186
symbol__annotate_hits(struct symbol * sym,struct evsel * evsel)1187 static void symbol__annotate_hits(struct symbol *sym, struct evsel *evsel)
1188 {
1189 struct annotation *notes = symbol__annotation(sym);
1190 struct sym_hist *h = annotation__histogram(notes, evsel);
1191 u64 len = symbol__size(sym), offset;
1192
1193 for (offset = 0; offset < len; ++offset) {
1194 struct sym_hist_entry *entry;
1195
1196 entry = annotated_source__hist_entry(notes->src, evsel, offset);
1197 if (entry && entry->nr_samples != 0)
1198 printf("%*" PRIx64 ": %" PRIu64 "\n", BITS_PER_LONG / 2,
1199 sym->start + offset, entry->nr_samples);
1200 }
1201 printf("%*s: %" PRIu64 "\n", BITS_PER_LONG / 2, "h->nr_samples", h->nr_samples);
1202 }
1203
/*
 * Return the number of hex digits needed to print the address of the last
 * line in @lines that has an offset (offset != -1), i.e. @start plus that
 * offset.  Returns 0 when no line has an offset.
 */
static int annotated_source__addr_fmt_width(struct list_head *lines, u64 start)
{
	struct annotation_line *al;
	char scratch[32];

	list_for_each_entry_reverse(al, lines, node) {
		if (al->offset == -1)
			continue;

		/* Only the formatted length matters, the text is discarded. */
		return scnprintf(scratch, sizeof(scratch), "%" PRIx64,
				 start + al->offset);
	}

	return 0;
}
1216
hist_entry__annotate_printf(struct hist_entry * he,struct evsel * evsel)1217 int hist_entry__annotate_printf(struct hist_entry *he, struct evsel *evsel)
1218 {
1219 struct map_symbol *ms = &he->ms;
1220 struct map *map = ms->map;
1221 struct symbol *sym = ms->sym;
1222 struct dso *dso = map__dso(map);
1223 char *filename;
1224 const char *d_filename;
1225 const char *evsel_name = evsel__name(evsel);
1226 struct annotation *notes = symbol__annotation(sym);
1227 struct sym_hist *h = annotation__histogram(notes, evsel);
1228 struct annotation_line *pos, *queue = NULL;
1229 struct annotation_options *opts = &annotate_opts;
1230 struct annotation_print_data apd = {
1231 .he = he,
1232 .evsel = evsel,
1233 .start = map__rip_2objdump(map, sym->start),
1234 };
1235 int printed = 2, queue_len = 0;
1236 int more = 0;
1237 bool context = opts->context;
1238 int width = annotation__pcnt_width(notes);
1239 int graph_dotted_len;
1240 char buf[512];
1241
1242 filename = strdup(dso__long_name(dso));
1243 if (!filename)
1244 return -ENOMEM;
1245
1246 if (opts->full_path)
1247 d_filename = filename;
1248 else
1249 d_filename = basename(filename);
1250
1251 if (evsel__is_group_event(evsel)) {
1252 evsel__group_desc(evsel, buf, sizeof(buf));
1253 evsel_name = buf;
1254 }
1255
1256 graph_dotted_len = printf(" %-*.*s| Source code & Disassembly of %s for %s (%" PRIu64 " samples, "
1257 "percent: %s)\n",
1258 width, width, symbol_conf.show_total_period ? "Period" :
1259 symbol_conf.show_nr_samples ? "Samples" : "Percent",
1260 d_filename, evsel_name, h->nr_samples,
1261 percent_type_str(opts->percent_type));
1262
1263 printf("%-*.*s----\n",
1264 graph_dotted_len, graph_dotted_len, graph_dotted_line);
1265
1266 if (verbose > 0)
1267 symbol__annotate_hits(sym, evsel);
1268
1269 apd.addr_fmt_width = annotated_source__addr_fmt_width(¬es->src->source,
1270 apd.start);
1271 evsel__get_arch(evsel, &apd.arch);
1272 apd.dbg = debuginfo__new(filename);
1273
1274 list_for_each_entry(pos, ¬es->src->source, node) {
1275 int err;
1276
1277 if (context && queue == NULL) {
1278 queue = pos;
1279 queue_len = 0;
1280 }
1281
1282 err = annotation_line__print(pos, &apd, opts, printed, queue);
1283
1284 switch (err) {
1285 case 0:
1286 ++printed;
1287 if (context) {
1288 printed += queue_len;
1289 queue = NULL;
1290 queue_len = 0;
1291 }
1292 break;
1293 case 1:
1294 /* filtered by max_lines */
1295 ++more;
1296 break;
1297 case -1:
1298 default:
1299 /*
1300 * Filtered by min_pcnt or non IP lines when
1301 * context != 0
1302 */
1303 if (!context)
1304 break;
1305 if (queue_len == context)
1306 queue = list_entry(queue->node.next, typeof(*queue), node);
1307 else
1308 ++queue_len;
1309 break;
1310 }
1311 }
1312
1313 debuginfo__delete(apd.dbg);
1314 free(filename);
1315
1316 return more;
1317 }
1318
/* Percent-color hook of the FILE writer: intentionally does nothing. */
static void FILE__set_percent_color(void *fp __maybe_unused,
				    double percent __maybe_unused,
				    bool current __maybe_unused)
{
	/* nothing to do */
}
1324
/*
 * Jump-count color hook of the FILE writer: ignores its arguments and
 * always reports 0 as the previous color.
 */
static int FILE__set_jumps_percent_color(void *fp __maybe_unused,
					 int nr __maybe_unused,
					 bool current __maybe_unused)
{
	return 0;
}
1330
/*
 * Color hook of the FILE writer: ignores its arguments and always reports
 * 0 as the previous color.
 */
static int FILE__set_color(void *fp __maybe_unused,
			   int color __maybe_unused)
{
	return 0;
}
1335
/*
 * printf hook of the FILE writer: formats @fmt and its arguments onto the
 * stdio stream passed as @fp.
 */
static void FILE__printf(void *fp, const char *fmt, ...)
{
	FILE *stream = fp;
	va_list ap;

	va_start(ap, fmt);
	vfprintf(stream, fmt, ap);
	va_end(ap);
}
1344
FILE__write_graph(void * fp,int graph)1345 static void FILE__write_graph(void *fp, int graph)
1346 {
1347 const char *s;
1348 switch (graph) {
1349
1350 case DARROW_CHAR: s = "↓"; break;
1351 case UARROW_CHAR: s = "↑"; break;
1352 case LARROW_CHAR: s = "←"; break;
1353 case RARROW_CHAR: s = "→"; break;
1354 default: s = "?"; break;
1355 }
1356
1357 fputs(s, fp);
1358 }
1359
symbol__annotate_fprintf2(struct symbol * sym,FILE * fp)1360 static int symbol__annotate_fprintf2(struct symbol *sym, FILE *fp)
1361 {
1362 struct annotation *notes = symbol__annotation(sym);
1363 struct annotation_write_ops wops = {
1364 .first_line = true,
1365 .obj = fp,
1366 .set_color = FILE__set_color,
1367 .set_percent_color = FILE__set_percent_color,
1368 .set_jumps_percent_color = FILE__set_jumps_percent_color,
1369 .printf = FILE__printf,
1370 .write_graph = FILE__write_graph,
1371 };
1372 struct annotation_line *al;
1373
1374 list_for_each_entry(al, ¬es->src->source, node) {
1375 if (annotation_line__filter(al))
1376 continue;
1377 annotation_line__write(al, notes, &wops);
1378 fputc('\n', fp);
1379 wops.first_line = false;
1380 }
1381
1382 return 0;
1383 }
1384
map_symbol__annotation_dump(struct map_symbol * ms,struct evsel * evsel)1385 int map_symbol__annotation_dump(struct map_symbol *ms, struct evsel *evsel)
1386 {
1387 const char *ev_name = evsel__name(evsel);
1388 char buf[1024];
1389 char *filename;
1390 int err = -1;
1391 FILE *fp;
1392
1393 if (asprintf(&filename, "%s.annotation", ms->sym->name) < 0)
1394 return -1;
1395
1396 fp = fopen(filename, "w");
1397 if (fp == NULL)
1398 goto out_free_filename;
1399
1400 if (evsel__is_group_event(evsel)) {
1401 evsel__group_desc(evsel, buf, sizeof(buf));
1402 ev_name = buf;
1403 }
1404
1405 fprintf(fp, "%s() %s\nEvent: %s\n\n",
1406 ms->sym->name, dso__long_name(map__dso(ms->map)), ev_name);
1407 symbol__annotate_fprintf2(ms->sym, fp);
1408
1409 fclose(fp);
1410 err = 0;
1411 out_free_filename:
1412 free(filename);
1413 return err;
1414 }
1415
symbol__annotate_zero_histogram(struct symbol * sym,struct evsel * evsel)1416 void symbol__annotate_zero_histogram(struct symbol *sym, struct evsel *evsel)
1417 {
1418 struct annotation *notes = symbol__annotation(sym);
1419 struct sym_hist *h = annotation__histogram(notes, evsel);
1420
1421 memset(h, 0, sizeof(*notes->src->histograms) * notes->src->nr_histograms);
1422 }
1423
symbol__annotate_decay_histogram(struct symbol * sym,struct evsel * evsel)1424 void symbol__annotate_decay_histogram(struct symbol *sym, struct evsel *evsel)
1425 {
1426 struct annotation *notes = symbol__annotation(sym);
1427 struct sym_hist *h = annotation__histogram(notes, evsel);
1428 struct annotation_line *al;
1429
1430 h->nr_samples = 0;
1431 list_for_each_entry(al, ¬es->src->source, node) {
1432 struct sym_hist_entry *entry;
1433
1434 if (al->offset == -1)
1435 continue;
1436
1437 entry = annotated_source__hist_entry(notes->src, evsel, al->offset);
1438 if (entry == NULL)
1439 continue;
1440
1441 entry->nr_samples = entry->nr_samples * 7 / 8;
1442 h->nr_samples += entry->nr_samples;
1443 }
1444 }
1445
annotated_source__purge(struct annotated_source * as)1446 void annotated_source__purge(struct annotated_source *as)
1447 {
1448 struct annotation_line *al, *n;
1449
1450 list_for_each_entry_safe(al, n, &as->source, node) {
1451 list_del_init(&al->node);
1452 disasm_line__free(disasm_line(al));
1453 }
1454 as->tried_source = false;
1455 }
1456
disasm_line__fprintf(struct disasm_line * dl,FILE * fp)1457 static size_t disasm_line__fprintf(struct disasm_line *dl, FILE *fp)
1458 {
1459 size_t printed;
1460
1461 if (dl->al.offset == -1)
1462 return fprintf(fp, "%s\n", dl->al.line);
1463
1464 printed = fprintf(fp, "%#" PRIx64 " %s", dl->al.offset, dl->ins.name);
1465
1466 if (dl->ops.raw[0] != '\0') {
1467 printed += fprintf(fp, "%.*s %s\n", 6 - (int)printed, " ",
1468 dl->ops.raw);
1469 }
1470
1471 return printed + fprintf(fp, "\n");
1472 }
1473
disasm__fprintf(struct list_head * head,FILE * fp)1474 size_t disasm__fprintf(struct list_head *head, FILE *fp)
1475 {
1476 struct disasm_line *pos;
1477 size_t printed = 0;
1478
1479 list_for_each_entry(pos, head, al.node)
1480 printed += disasm_line__fprintf(pos, fp);
1481
1482 return printed;
1483 }
1484
disasm_line__is_valid_local_jump(struct disasm_line * dl,struct symbol * sym)1485 bool disasm_line__is_valid_local_jump(struct disasm_line *dl, struct symbol *sym)
1486 {
1487 if (!dl || !dl->ins.ops || !ins__is_jump(&dl->ins) ||
1488 !disasm_line__has_local_offset(dl) || dl->ops.target.offset < 0 ||
1489 dl->ops.target.offset >= (s64)symbol__size(sym))
1490 return false;
1491
1492 return true;
1493 }
1494
1495 static void
annotation__mark_jump_targets(struct annotation * notes,struct symbol * sym)1496 annotation__mark_jump_targets(struct annotation *notes, struct symbol *sym)
1497 {
1498 struct annotation_line *al;
1499
1500 /* PLT symbols contain external offsets */
1501 if (strstr(sym->name, "@plt"))
1502 return;
1503
1504 list_for_each_entry(al, ¬es->src->source, node) {
1505 struct disasm_line *dl;
1506 struct annotation_line *target;
1507
1508 dl = disasm_line(al);
1509
1510 if (!disasm_line__is_valid_local_jump(dl, sym))
1511 continue;
1512
1513 target = annotated_source__get_line(notes->src,
1514 dl->ops.target.offset);
1515 /*
1516 * FIXME: Oops, no jump target? Buggy disassembler? Or do we
1517 * have to adjust to the previous offset?
1518 */
1519 if (target == NULL)
1520 continue;
1521
1522 if (++target->jump_sources > notes->src->max_jump_sources)
1523 notes->src->max_jump_sources = target->jump_sources;
1524 }
1525 }
1526
annotation__set_index(struct annotation * notes)1527 static void annotation__set_index(struct annotation *notes)
1528 {
1529 struct annotation_line *al;
1530 struct annotated_source *src = notes->src;
1531
1532 src->widths.max_line_len = 0;
1533 src->nr_entries = 0;
1534 src->nr_asm_entries = 0;
1535
1536 list_for_each_entry(al, &src->source, node) {
1537 size_t line_len = strlen(al->line);
1538
1539 if (src->widths.max_line_len < line_len)
1540 src->widths.max_line_len = line_len;
1541 al->idx = src->nr_entries++;
1542 if (al->offset != -1)
1543 al->idx_asm = src->nr_asm_entries++;
1544 else
1545 al->idx_asm = -1;
1546 }
1547 }
1548
/*
 * Column width used for the jump-sources count @n: 5 once @n reaches 100,
 * 2 when @n / 10 is non-zero, 1 otherwise.
 */
static inline int width_jumps(int n)
{
	if (n >= 100)
		return 5;

	return (n / 10) != 0 ? 2 : 1;
}
1557
annotation__max_ins_name(struct annotation * notes)1558 static int annotation__max_ins_name(struct annotation *notes)
1559 {
1560 int max_name = 0, len;
1561 struct annotation_line *al;
1562
1563 list_for_each_entry(al, ¬es->src->source, node) {
1564 if (al->offset == -1)
1565 continue;
1566
1567 len = strlen(disasm_line(al)->ins.name);
1568 if (max_name < len)
1569 max_name = len;
1570 }
1571
1572 return max_name;
1573 }
1574
1575 static void
annotation__init_column_widths(struct annotation * notes,struct symbol * sym)1576 annotation__init_column_widths(struct annotation *notes, struct symbol *sym)
1577 {
1578 notes->src->widths.addr = notes->src->widths.target =
1579 notes->src->widths.min_addr = hex_width(symbol__size(sym));
1580 notes->src->widths.max_addr = hex_width(sym->end);
1581 notes->src->widths.jumps = width_jumps(notes->src->max_jump_sources);
1582 notes->src->widths.max_ins_name = annotation__max_ins_name(notes);
1583 }
1584
annotation__update_column_widths(struct annotation * notes)1585 void annotation__update_column_widths(struct annotation *notes)
1586 {
1587 if (annotate_opts.use_offset)
1588 notes->src->widths.target = notes->src->widths.min_addr;
1589 else if (annotate_opts.full_addr)
1590 notes->src->widths.target = BITS_PER_LONG / 4;
1591 else
1592 notes->src->widths.target = notes->src->widths.max_addr;
1593
1594 notes->src->widths.addr = notes->src->widths.target;
1595
1596 if (annotate_opts.show_nr_jumps)
1597 notes->src->widths.addr += notes->src->widths.jumps + 1;
1598 }
1599
annotation__toggle_full_addr(struct annotation * notes,struct map_symbol * ms)1600 void annotation__toggle_full_addr(struct annotation *notes, struct map_symbol *ms)
1601 {
1602 annotate_opts.full_addr = !annotate_opts.full_addr;
1603
1604 if (annotate_opts.full_addr)
1605 notes->src->start = map__objdump_2mem(ms->map, ms->sym->start);
1606 else
1607 notes->src->start = map__rip_2objdump(ms->map, ms->sym->start);
1608
1609 annotation__update_column_widths(notes);
1610 }
1611
annotation__calc_lines(struct annotation * notes,struct map_symbol * ms,struct rb_root * root)1612 static void annotation__calc_lines(struct annotation *notes, struct map_symbol *ms,
1613 struct rb_root *root)
1614 {
1615 struct annotation_line *al;
1616 struct rb_root tmp_root = RB_ROOT;
1617
1618 list_for_each_entry(al, ¬es->src->source, node) {
1619 double percent_max = 0.0;
1620 u64 addr;
1621 int i;
1622
1623 for (i = 0; i < al->data_nr; i++) {
1624 double percent;
1625
1626 percent = annotation_data__percent(&al->data[i],
1627 annotate_opts.percent_type);
1628
1629 if (percent > percent_max)
1630 percent_max = percent;
1631 }
1632
1633 if (percent_max <= 0.5)
1634 continue;
1635
1636 addr = map__rip_2objdump(ms->map, ms->sym->start);
1637 al->path = get_srcline(map__dso(ms->map), addr + al->offset, NULL,
1638 false, true, ms->sym->start + al->offset);
1639 insert_source_line(&tmp_root, al);
1640 }
1641
1642 resort_source_line(root, &tmp_root);
1643 }
1644
symbol__calc_lines(struct map_symbol * ms,struct rb_root * root)1645 static void symbol__calc_lines(struct map_symbol *ms, struct rb_root *root)
1646 {
1647 struct annotation *notes = symbol__annotation(ms->sym);
1648
1649 annotation__calc_lines(notes, ms, root);
1650 }
1651
hist_entry__tty_annotate2(struct hist_entry * he,struct evsel * evsel)1652 int hist_entry__tty_annotate2(struct hist_entry *he, struct evsel *evsel)
1653 {
1654 struct map_symbol *ms = &he->ms;
1655 struct dso *dso = map__dso(ms->map);
1656 struct symbol *sym = ms->sym;
1657 struct rb_root source_line = RB_ROOT;
1658 struct hists *hists = evsel__hists(evsel);
1659 char buf[1024];
1660 int err;
1661
1662 err = symbol__annotate2(ms, evsel, NULL);
1663 if (err) {
1664 char msg[BUFSIZ];
1665
1666 dso__set_annotate_warned(dso);
1667 symbol__strerror_disassemble(ms, err, msg, sizeof(msg));
1668 ui__error("Couldn't annotate %s:\n%s", sym->name, msg);
1669 return -1;
1670 }
1671
1672 if (annotate_opts.print_lines) {
1673 srcline_full_filename = annotate_opts.full_path;
1674 symbol__calc_lines(ms, &source_line);
1675 print_summary(&source_line, dso__long_name(dso));
1676 }
1677
1678 hists__scnprintf_title(hists, buf, sizeof(buf));
1679 fprintf(stdout, "%s, [percent: %s]\n%s() %s\n",
1680 buf, percent_type_str(annotate_opts.percent_type), sym->name, dso__long_name(dso));
1681 symbol__annotate_fprintf2(sym, stdout);
1682
1683 annotated_source__purge(symbol__annotation(sym)->src);
1684
1685 return 0;
1686 }
1687
hist_entry__tty_annotate(struct hist_entry * he,struct evsel * evsel)1688 int hist_entry__tty_annotate(struct hist_entry *he, struct evsel *evsel)
1689 {
1690 struct map_symbol *ms = &he->ms;
1691 struct dso *dso = map__dso(ms->map);
1692 struct symbol *sym = ms->sym;
1693 struct rb_root source_line = RB_ROOT;
1694 int err;
1695
1696 err = symbol__annotate(ms, evsel, NULL);
1697 if (err) {
1698 char msg[BUFSIZ];
1699
1700 dso__set_annotate_warned(dso);
1701 symbol__strerror_disassemble(ms, err, msg, sizeof(msg));
1702 ui__error("Couldn't annotate %s:\n%s", sym->name, msg);
1703 return -1;
1704 }
1705
1706 symbol__calc_percent(sym, evsel);
1707
1708 if (annotate_opts.print_lines) {
1709 srcline_full_filename = annotate_opts.full_path;
1710 symbol__calc_lines(ms, &source_line);
1711 print_summary(&source_line, dso__long_name(dso));
1712 }
1713
1714 hist_entry__annotate_printf(he, evsel);
1715
1716 annotated_source__purge(symbol__annotation(sym)->src);
1717
1718 return 0;
1719 }
1720
ui__has_annotation(void)1721 bool ui__has_annotation(void)
1722 {
1723 return use_browser == 1 && perf_hpp_list.sym;
1724 }
1725
1726
annotation_line__max_percent(struct annotation_line * al,unsigned int percent_type)1727 static double annotation_line__max_percent(struct annotation_line *al,
1728 unsigned int percent_type)
1729 {
1730 double percent_max = 0.0;
1731 int i;
1732
1733 for (i = 0; i < al->data_nr; i++) {
1734 double percent;
1735
1736 percent = annotation_data__percent(&al->data[i],
1737 percent_type);
1738
1739 if (percent > percent_max)
1740 percent_max = percent;
1741 }
1742
1743 return percent_max;
1744 }
1745
disasm_line__write(struct disasm_line * dl,struct annotation * notes,void * obj,char * bf,size_t size,void (* obj__printf)(void * obj,const char * fmt,...),void (* obj__write_graph)(void * obj,int graph))1746 static void disasm_line__write(struct disasm_line *dl, struct annotation *notes,
1747 void *obj, char *bf, size_t size,
1748 void (*obj__printf)(void *obj, const char *fmt, ...),
1749 void (*obj__write_graph)(void *obj, int graph))
1750 {
1751 if (dl->ins.ops && dl->ins.ops->scnprintf) {
1752 if (ins__is_jump(&dl->ins)) {
1753 bool fwd;
1754
1755 if (dl->ops.target.outside)
1756 goto call_like;
1757 fwd = dl->ops.target.offset > dl->al.offset;
1758 obj__write_graph(obj, fwd ? DARROW_CHAR : UARROW_CHAR);
1759 obj__printf(obj, " ");
1760 } else if (ins__is_call(&dl->ins)) {
1761 call_like:
1762 obj__write_graph(obj, RARROW_CHAR);
1763 obj__printf(obj, " ");
1764 } else if (ins__is_ret(&dl->ins)) {
1765 obj__write_graph(obj, LARROW_CHAR);
1766 obj__printf(obj, " ");
1767 } else {
1768 obj__printf(obj, " ");
1769 }
1770 } else {
1771 obj__printf(obj, " ");
1772 }
1773
1774 disasm_line__scnprintf(dl, bf, size, !annotate_opts.use_offset,
1775 notes->src->widths.max_ins_name);
1776 }
1777
ipc_coverage_string(char * bf,int size,struct annotation * notes)1778 static void ipc_coverage_string(char *bf, int size, struct annotation *notes)
1779 {
1780 double ipc = 0.0, coverage = 0.0;
1781 struct annotated_branch *branch = annotation__get_branch(notes);
1782
1783 if (branch && branch->hit_cycles)
1784 ipc = branch->hit_insn / ((double)branch->hit_cycles);
1785
1786 if (branch && branch->total_insn) {
1787 coverage = branch->cover_insn * 100.0 /
1788 ((double)branch->total_insn);
1789 }
1790
1791 scnprintf(bf, size, "(Average IPC: %.2f, IPC Coverage: %.1f%%)",
1792 ipc, coverage);
1793 }
1794
annotation_br_cntr_abbr_list(char ** str,struct evsel * evsel,bool header)1795 int annotation_br_cntr_abbr_list(char **str, struct evsel *evsel, bool header)
1796 {
1797 struct evsel *pos;
1798 struct strbuf sb;
1799
1800 if (evsel->evlist->nr_br_cntr <= 0)
1801 return -ENOTSUP;
1802
1803 strbuf_init(&sb, /*hint=*/ 0);
1804
1805 if (header && strbuf_addf(&sb, "# Branch counter abbr list:\n"))
1806 goto err;
1807
1808 evlist__for_each_entry(evsel->evlist, pos) {
1809 if (!(pos->core.attr.branch_sample_type & PERF_SAMPLE_BRANCH_COUNTERS))
1810 continue;
1811 if (header && strbuf_addf(&sb, "#"))
1812 goto err;
1813
1814 if (strbuf_addf(&sb, " %s = %s\n", pos->name, pos->abbr_name))
1815 goto err;
1816 }
1817
1818 if (header && strbuf_addf(&sb, "#"))
1819 goto err;
1820 if (strbuf_addf(&sb, " '-' No event occurs\n"))
1821 goto err;
1822
1823 if (header && strbuf_addf(&sb, "#"))
1824 goto err;
1825 if (strbuf_addf(&sb, " '+' Event occurrences may be lost due to branch counter saturated\n"))
1826 goto err;
1827
1828 *str = strbuf_detach(&sb, NULL);
1829
1830 return 0;
1831 err:
1832 strbuf_release(&sb);
1833 return -ENOMEM;
1834 }
1835
1836 /* Assume the branch counter saturated at 3 */
1837 #define ANNOTATION_BR_CNTR_SATURATION 3
1838
annotation_br_cntr_entry(char ** str,int br_cntr_nr,u64 * br_cntr,int num_aggr,struct evsel * evsel)1839 int annotation_br_cntr_entry(char **str, int br_cntr_nr,
1840 u64 *br_cntr, int num_aggr,
1841 struct evsel *evsel)
1842 {
1843 struct evsel *pos = evsel ? evlist__first(evsel->evlist) : NULL;
1844 bool saturated = false;
1845 int i, j, avg, used;
1846 struct strbuf sb;
1847
1848 strbuf_init(&sb, /*hint=*/ 0);
1849 for (i = 0; i < br_cntr_nr; i++) {
1850 used = 0;
1851 avg = ceil((double)(br_cntr[i] & ~ANNOTATION__BR_CNTR_SATURATED_FLAG) /
1852 (double)num_aggr);
1853
1854 /*
1855 * A histogram with the abbr name is displayed by default.
1856 * With -v, the exact number of branch counter is displayed.
1857 */
1858 if (verbose) {
1859 evlist__for_each_entry_from(evsel->evlist, pos) {
1860 if ((pos->core.attr.branch_sample_type & PERF_SAMPLE_BRANCH_COUNTERS) &&
1861 (pos->br_cntr_idx == i))
1862 break;
1863 }
1864 if (strbuf_addstr(&sb, pos->abbr_name))
1865 goto err;
1866
1867 if (!br_cntr[i]) {
1868 if (strbuf_addstr(&sb, "=-"))
1869 goto err;
1870 } else {
1871 if (strbuf_addf(&sb, "=%d", avg))
1872 goto err;
1873 }
1874 if (br_cntr[i] & ANNOTATION__BR_CNTR_SATURATED_FLAG) {
1875 if (strbuf_addch(&sb, '+'))
1876 goto err;
1877 } else {
1878 if (strbuf_addch(&sb, ' '))
1879 goto err;
1880 }
1881
1882 if ((i < br_cntr_nr - 1) && strbuf_addch(&sb, ','))
1883 goto err;
1884 continue;
1885 }
1886
1887 if (strbuf_addch(&sb, '|'))
1888 goto err;
1889
1890 if (!br_cntr[i]) {
1891 if (strbuf_addch(&sb, '-'))
1892 goto err;
1893 used++;
1894 } else {
1895 evlist__for_each_entry_from(evsel->evlist, pos) {
1896 if ((pos->core.attr.branch_sample_type & PERF_SAMPLE_BRANCH_COUNTERS) &&
1897 (pos->br_cntr_idx == i))
1898 break;
1899 }
1900 if (br_cntr[i] & ANNOTATION__BR_CNTR_SATURATED_FLAG)
1901 saturated = true;
1902
1903 for (j = 0; j < avg; j++, used++) {
1904 /* Print + if the number of logged events > 3 */
1905 if (j >= ANNOTATION_BR_CNTR_SATURATION) {
1906 saturated = true;
1907 break;
1908 }
1909 if (strbuf_addstr(&sb, pos->abbr_name))
1910 goto err;
1911 }
1912
1913 if (saturated) {
1914 if (strbuf_addch(&sb, '+'))
1915 goto err;
1916 used++;
1917 }
1918 pos = list_next_entry(pos, core.node);
1919 }
1920
1921 for (j = used; j < ANNOTATION_BR_CNTR_SATURATION + 1; j++) {
1922 if (strbuf_addch(&sb, ' '))
1923 goto err;
1924 }
1925 }
1926
1927 if (!verbose && strbuf_addch(&sb, br_cntr_nr ? '|' : ' '))
1928 goto err;
1929
1930 *str = strbuf_detach(&sb, NULL);
1931
1932 return 0;
1933 err:
1934 strbuf_release(&sb);
1935 return -ENOMEM;
1936 }
1937
__annotation_line__write(struct annotation_line * al,struct annotation * notes,bool first_line,bool current_entry,bool change_color,int width,void * obj,unsigned int percent_type,int (* obj__set_color)(void * obj,int color),void (* obj__set_percent_color)(void * obj,double percent,bool current),int (* obj__set_jumps_percent_color)(void * obj,int nr,bool current),void (* obj__printf)(void * obj,const char * fmt,...),void (* obj__write_graph)(void * obj,int graph))1938 static void __annotation_line__write(struct annotation_line *al, struct annotation *notes,
1939 bool first_line, bool current_entry, bool change_color, int width,
1940 void *obj, unsigned int percent_type,
1941 int (*obj__set_color)(void *obj, int color),
1942 void (*obj__set_percent_color)(void *obj, double percent, bool current),
1943 int (*obj__set_jumps_percent_color)(void *obj, int nr, bool current),
1944 void (*obj__printf)(void *obj, const char *fmt, ...),
1945 void (*obj__write_graph)(void *obj, int graph))
1946
1947 {
1948 double percent_max = annotation_line__max_percent(al, percent_type);
1949 int pcnt_width = annotation__pcnt_width(notes),
1950 cycles_width = annotation__cycles_width(notes);
1951 bool show_title = false;
1952 char bf[256];
1953 int printed;
1954
1955 if (first_line && (al->offset == -1 || percent_max == 0.0)) {
1956 if (notes->branch && al->cycles) {
1957 if (al->cycles->ipc == 0.0 && al->cycles->avg == 0)
1958 show_title = true;
1959 } else
1960 show_title = true;
1961 }
1962
1963 if (al->offset != -1 && percent_max != 0.0) {
1964 int i;
1965
1966 for (i = 0; i < al->data_nr; i++) {
1967 double percent;
1968
1969 percent = annotation_data__percent(&al->data[i], percent_type);
1970
1971 obj__set_percent_color(obj, percent, current_entry);
1972 if (symbol_conf.show_total_period) {
1973 obj__printf(obj, "%11" PRIu64 " ", al->data[i].he.period);
1974 } else if (symbol_conf.show_nr_samples) {
1975 obj__printf(obj, "%7" PRIu64 " ",
1976 al->data[i].he.nr_samples);
1977 } else {
1978 obj__printf(obj, "%7.2f ", percent);
1979 }
1980 }
1981 } else {
1982 obj__set_percent_color(obj, 0, current_entry);
1983
1984 if (!show_title)
1985 obj__printf(obj, "%-*s", pcnt_width, " ");
1986 else {
1987 obj__printf(obj, "%-*s", pcnt_width,
1988 symbol_conf.show_total_period ? "Period" :
1989 symbol_conf.show_nr_samples ? "Samples" : "Percent");
1990 }
1991 }
1992
1993 if (notes->branch) {
1994 if (al->cycles && al->cycles->ipc)
1995 obj__printf(obj, "%*.2f ", ANNOTATION__IPC_WIDTH - 1, al->cycles->ipc);
1996 else if (!show_title)
1997 obj__printf(obj, "%*s", ANNOTATION__IPC_WIDTH, " ");
1998 else
1999 obj__printf(obj, "%*s ", ANNOTATION__IPC_WIDTH - 1, "IPC");
2000
2001 if (!annotate_opts.show_minmax_cycle) {
2002 if (al->cycles && al->cycles->avg)
2003 obj__printf(obj, "%*" PRIu64 " ",
2004 ANNOTATION__CYCLES_WIDTH - 1, al->cycles->avg);
2005 else if (!show_title)
2006 obj__printf(obj, "%*s",
2007 ANNOTATION__CYCLES_WIDTH, " ");
2008 else
2009 obj__printf(obj, "%*s ",
2010 ANNOTATION__CYCLES_WIDTH - 1,
2011 "Cycle");
2012 } else {
2013 if (al->cycles) {
2014 char str[32];
2015
2016 scnprintf(str, sizeof(str),
2017 "%" PRIu64 "(%" PRIu64 "/%" PRIu64 ")",
2018 al->cycles->avg, al->cycles->min,
2019 al->cycles->max);
2020
2021 obj__printf(obj, "%*s ",
2022 ANNOTATION__MINMAX_CYCLES_WIDTH - 1,
2023 str);
2024 } else if (!show_title)
2025 obj__printf(obj, "%*s",
2026 ANNOTATION__MINMAX_CYCLES_WIDTH,
2027 " ");
2028 else
2029 obj__printf(obj, "%*s ",
2030 ANNOTATION__MINMAX_CYCLES_WIDTH - 1,
2031 "Cycle(min/max)");
2032 }
2033
2034 if (annotate_opts.show_br_cntr) {
2035 if (show_title) {
2036 obj__printf(obj, "%*s ",
2037 ANNOTATION__BR_CNTR_WIDTH,
2038 "Branch Counter");
2039 } else {
2040 char *buf;
2041
2042 if (!annotation_br_cntr_entry(&buf, al->br_cntr_nr, al->br_cntr,
2043 al->num_aggr, al->evsel)) {
2044 obj__printf(obj, "%*s ", ANNOTATION__BR_CNTR_WIDTH, buf);
2045 free(buf);
2046 }
2047 }
2048 }
2049
2050 if (show_title && !*al->line) {
2051 ipc_coverage_string(bf, sizeof(bf), notes);
2052 obj__printf(obj, "%*s", ANNOTATION__AVG_IPC_WIDTH, bf);
2053 }
2054 }
2055
2056 obj__printf(obj, " ");
2057
2058 if (!*al->line)
2059 obj__printf(obj, "%-*s", width - pcnt_width - cycles_width, " ");
2060 else if (al->offset == -1) {
2061 if (al->line_nr && annotate_opts.show_linenr)
2062 printed = scnprintf(bf, sizeof(bf), "%-*d ",
2063 notes->src->widths.addr + 1, al->line_nr);
2064 else
2065 printed = scnprintf(bf, sizeof(bf), "%-*s ",
2066 notes->src->widths.addr, " ");
2067 obj__printf(obj, bf);
2068 obj__printf(obj, "%-*s", width - printed - pcnt_width - cycles_width + 1, al->line);
2069 } else {
2070 u64 addr = al->offset;
2071 int color = -1;
2072
2073 if (!annotate_opts.use_offset)
2074 addr += notes->src->start;
2075
2076 if (!annotate_opts.use_offset) {
2077 printed = scnprintf(bf, sizeof(bf), "%" PRIx64 ": ", addr);
2078 } else {
2079 if (al->jump_sources &&
2080 annotate_opts.offset_level >= ANNOTATION__OFFSET_JUMP_TARGETS) {
2081 if (annotate_opts.show_nr_jumps) {
2082 int prev;
2083 printed = scnprintf(bf, sizeof(bf), "%*d ",
2084 notes->src->widths.jumps,
2085 al->jump_sources);
2086 prev = obj__set_jumps_percent_color(obj, al->jump_sources,
2087 current_entry);
2088 obj__printf(obj, bf);
2089 obj__set_color(obj, prev);
2090 }
2091 print_addr:
2092 printed = scnprintf(bf, sizeof(bf), "%*" PRIx64 ": ",
2093 notes->src->widths.target, addr);
2094 } else if (ins__is_call(&disasm_line(al)->ins) &&
2095 annotate_opts.offset_level >= ANNOTATION__OFFSET_CALL) {
2096 goto print_addr;
2097 } else if (annotate_opts.offset_level == ANNOTATION__MAX_OFFSET_LEVEL) {
2098 goto print_addr;
2099 } else {
2100 printed = scnprintf(bf, sizeof(bf), "%-*s ",
2101 notes->src->widths.addr, " ");
2102 }
2103 }
2104
2105 if (change_color)
2106 color = obj__set_color(obj, HE_COLORSET_ADDR);
2107 obj__printf(obj, bf);
2108 if (change_color)
2109 obj__set_color(obj, color);
2110
2111 disasm_line__write(disasm_line(al), notes, obj, bf, sizeof(bf), obj__printf, obj__write_graph);
2112
2113 obj__printf(obj, "%-*s", width - pcnt_width - cycles_width - 3 - printed, bf);
2114 }
2115
2116 }
2117
annotation_line__write(struct annotation_line * al,struct annotation * notes,struct annotation_write_ops * wops)2118 void annotation_line__write(struct annotation_line *al, struct annotation *notes,
2119 struct annotation_write_ops *wops)
2120 {
2121 __annotation_line__write(al, notes, wops->first_line, wops->current_entry,
2122 wops->change_color, wops->width, wops->obj,
2123 annotate_opts.percent_type,
2124 wops->set_color, wops->set_percent_color,
2125 wops->set_jumps_percent_color, wops->printf,
2126 wops->write_graph);
2127 }
2128
symbol__annotate2(struct map_symbol * ms,struct evsel * evsel,struct arch ** parch)2129 int symbol__annotate2(struct map_symbol *ms, struct evsel *evsel,
2130 struct arch **parch)
2131 {
2132 struct symbol *sym = ms->sym;
2133 struct annotation *notes = symbol__annotation(sym);
2134 size_t size = symbol__size(sym);
2135 int err;
2136
2137 err = symbol__annotate(ms, evsel, parch);
2138 if (err)
2139 return err;
2140
2141 symbol__calc_percent(sym, evsel);
2142
2143 annotation__set_index(notes);
2144 annotation__mark_jump_targets(notes, sym);
2145
2146 err = annotation__compute_ipc(notes, size, evsel);
2147 if (err)
2148 return err;
2149
2150 annotation__init_column_widths(notes, sym);
2151 annotation__update_column_widths(notes);
2152 sym->annotate2 = 1;
2153
2154 return 0;
2155 }
2156
2157 const char * const perf_disassembler__strs[] = {
2158 [PERF_DISASM_UNKNOWN] = "unknown",
2159 [PERF_DISASM_LLVM] = "llvm",
2160 [PERF_DISASM_CAPSTONE] = "capstone",
2161 [PERF_DISASM_OBJDUMP] = "objdump",
2162 };
2163
2164
annotation_options__add_disassembler(struct annotation_options * options,enum perf_disassembler dis)2165 static void annotation_options__add_disassembler(struct annotation_options *options,
2166 enum perf_disassembler dis)
2167 {
2168 for (u8 i = 0; i < ARRAY_SIZE(options->disassemblers); i++) {
2169 if (options->disassemblers[i] == dis) {
2170 /* Disassembler is already present then don't add again. */
2171 return;
2172 }
2173 if (options->disassemblers[i] == PERF_DISASM_UNKNOWN) {
2174 /* Found a free slot. */
2175 options->disassemblers[i] = dis;
2176 return;
2177 }
2178 }
2179 pr_err("Failed to add disassembler %d\n", dis);
2180 }
2181
annotation_options__add_disassemblers_str(struct annotation_options * options,const char * str)2182 static int annotation_options__add_disassemblers_str(struct annotation_options *options,
2183 const char *str)
2184 {
2185 while (str && *str != '\0') {
2186 const char *comma = strchr(str, ',');
2187 int len = comma ? comma - str : (int)strlen(str);
2188 bool match = false;
2189
2190 for (u8 i = 0; i < ARRAY_SIZE(perf_disassembler__strs); i++) {
2191 const char *dis_str = perf_disassembler__strs[i];
2192
2193 if (len == (int)strlen(dis_str) && !strncmp(str, dis_str, len)) {
2194 annotation_options__add_disassembler(options, i);
2195 match = true;
2196 break;
2197 }
2198 }
2199 if (!match) {
2200 pr_err("Invalid disassembler '%.*s'\n", len, str);
2201 return -1;
2202 }
2203 str = comma ? comma + 1 : NULL;
2204 }
2205 return 0;
2206 }
2207
annotation__config(const char * var,const char * value,void * data)2208 static int annotation__config(const char *var, const char *value, void *data)
2209 {
2210 struct annotation_options *opt = data;
2211
2212 if (!strstarts(var, "annotate."))
2213 return 0;
2214
2215 if (!strcmp(var, "annotate.offset_level")) {
2216 perf_config_u8(&opt->offset_level, "offset_level", value);
2217
2218 if (opt->offset_level > ANNOTATION__MAX_OFFSET_LEVEL)
2219 opt->offset_level = ANNOTATION__MAX_OFFSET_LEVEL;
2220 else if (opt->offset_level < ANNOTATION__MIN_OFFSET_LEVEL)
2221 opt->offset_level = ANNOTATION__MIN_OFFSET_LEVEL;
2222 } else if (!strcmp(var, "annotate.disassemblers")) {
2223 int err = annotation_options__add_disassemblers_str(opt, value);
2224
2225 if (err)
2226 return err;
2227 } else if (!strcmp(var, "annotate.hide_src_code")) {
2228 opt->hide_src_code = perf_config_bool("hide_src_code", value);
2229 } else if (!strcmp(var, "annotate.jump_arrows")) {
2230 opt->jump_arrows = perf_config_bool("jump_arrows", value);
2231 } else if (!strcmp(var, "annotate.show_linenr")) {
2232 opt->show_linenr = perf_config_bool("show_linenr", value);
2233 } else if (!strcmp(var, "annotate.show_nr_jumps")) {
2234 opt->show_nr_jumps = perf_config_bool("show_nr_jumps", value);
2235 } else if (!strcmp(var, "annotate.show_nr_samples")) {
2236 symbol_conf.show_nr_samples = perf_config_bool("show_nr_samples",
2237 value);
2238 } else if (!strcmp(var, "annotate.show_total_period")) {
2239 symbol_conf.show_total_period = perf_config_bool("show_total_period",
2240 value);
2241 } else if (!strcmp(var, "annotate.use_offset")) {
2242 opt->use_offset = perf_config_bool("use_offset", value);
2243 } else if (!strcmp(var, "annotate.disassembler_style")) {
2244 opt->disassembler_style = strdup(value);
2245 if (!opt->disassembler_style) {
2246 pr_err("Not enough memory for annotate.disassembler_style\n");
2247 return -1;
2248 }
2249 } else if (!strcmp(var, "annotate.objdump")) {
2250 opt->objdump_path = strdup(value);
2251 if (!opt->objdump_path) {
2252 pr_err("Not enough memory for annotate.objdump\n");
2253 return -1;
2254 }
2255 } else if (!strcmp(var, "annotate.addr2line")) {
2256 symbol_conf.addr2line_path = strdup(value);
2257 if (!symbol_conf.addr2line_path) {
2258 pr_err("Not enough memory for annotate.addr2line\n");
2259 return -1;
2260 }
2261 } else if (!strcmp(var, "annotate.demangle")) {
2262 symbol_conf.demangle = perf_config_bool("demangle", value);
2263 } else if (!strcmp(var, "annotate.demangle_kernel")) {
2264 symbol_conf.demangle_kernel = perf_config_bool("demangle_kernel", value);
2265 } else {
2266 pr_debug("%s variable unknown, ignoring...", var);
2267 }
2268
2269 return 0;
2270 }
2271
annotation_options__init(void)2272 void annotation_options__init(void)
2273 {
2274 struct annotation_options *opt = &annotate_opts;
2275
2276 memset(opt, 0, sizeof(*opt));
2277
2278 /* Default values. */
2279 opt->use_offset = true;
2280 opt->jump_arrows = true;
2281 opt->annotate_src = true;
2282 opt->offset_level = ANNOTATION__OFFSET_JUMP_TARGETS;
2283 opt->percent_type = PERCENT_PERIOD_LOCAL;
2284 opt->hide_src_code = true;
2285 opt->hide_src_code_on_title = true;
2286 }
2287
annotation_options__exit(void)2288 void annotation_options__exit(void)
2289 {
2290 zfree(&annotate_opts.disassembler_style);
2291 zfree(&annotate_opts.objdump_path);
2292 }
2293
annotation_options__default_init_disassemblers(struct annotation_options * options)2294 static void annotation_options__default_init_disassemblers(struct annotation_options *options)
2295 {
2296 if (options->disassemblers[0] != PERF_DISASM_UNKNOWN) {
2297 /* Already initialized. */
2298 return;
2299 }
2300 #ifdef HAVE_LIBLLVM_SUPPORT
2301 annotation_options__add_disassembler(options, PERF_DISASM_LLVM);
2302 #endif
2303 #ifdef HAVE_LIBCAPSTONE_SUPPORT
2304 annotation_options__add_disassembler(options, PERF_DISASM_CAPSTONE);
2305 #endif
2306 annotation_options__add_disassembler(options, PERF_DISASM_OBJDUMP);
2307 }
2308
annotation_config__init(void)2309 void annotation_config__init(void)
2310 {
2311 perf_config(annotation__config, &annotate_opts);
2312 annotation_options__default_init_disassemblers(&annotate_opts);
2313 }
2314
parse_percent_type(char * str1,char * str2)2315 static unsigned int parse_percent_type(char *str1, char *str2)
2316 {
2317 unsigned int type = (unsigned int) -1;
2318
2319 if (!strcmp("period", str1)) {
2320 if (!strcmp("local", str2))
2321 type = PERCENT_PERIOD_LOCAL;
2322 else if (!strcmp("global", str2))
2323 type = PERCENT_PERIOD_GLOBAL;
2324 }
2325
2326 if (!strcmp("hits", str1)) {
2327 if (!strcmp("local", str2))
2328 type = PERCENT_HITS_LOCAL;
2329 else if (!strcmp("global", str2))
2330 type = PERCENT_HITS_GLOBAL;
2331 }
2332
2333 return type;
2334 }
2335
/*
 * Option callback: parse "<a>-<b>" where one half is "period"/"hits" and the
 * other is "local"/"global" (either order) and store the resulting type in
 * annotate_opts.percent_type.
 *
 * Returns 0 on success, -ENOMEM when the string cannot be duplicated and -1
 * when it cannot be parsed.
 */
int annotate_parse_percent_type(const struct option *opt __maybe_unused, const char *_str,
				int unset __maybe_unused)
{
	const unsigned int invalid = (unsigned int) -1;
	char *first, *second;
	int ret = -1;

	/* Work on a private copy, it is split in place below. */
	first = strdup(_str);
	if (first == NULL)
		return -ENOMEM;

	second = strchr(first, '-');
	if (second != NULL) {
		unsigned int type;

		*second++ = 0;

		/* Accept both "period-local" and "local-period" orders. */
		type = parse_percent_type(first, second);
		if (type == invalid)
			type = parse_percent_type(second, first);

		if (type != invalid) {
			annotate_opts.percent_type = type;
			ret = 0;
		}
	}

	free(first);
	return ret;
}
2365
annotate_check_args(void)2366 int annotate_check_args(void)
2367 {
2368 struct annotation_options *args = &annotate_opts;
2369
2370 if (args->prefix_strip && !args->prefix) {
2371 pr_err("--prefix-strip requires --prefix\n");
2372 return -1;
2373 }
2374 return 0;
2375 }
2376
2377 /*
2378 * Get register number and access offset from the given instruction.
2379 * It assumes AT&T x86 asm format like OFFSET(REG). Maybe it needs
2380 * to revisit the format when it handles different architecture.
2381 * Fills @reg and @offset when return 0.
2382 */
extract_reg_offset(struct arch * arch,const char * str,struct annotated_op_loc * op_loc)2383 static int extract_reg_offset(struct arch *arch, const char *str,
2384 struct annotated_op_loc *op_loc)
2385 {
2386 char *p;
2387 char *regname;
2388
2389 if (arch->objdump.register_char == 0)
2390 return -1;
2391
2392 /*
2393 * It should start from offset, but it's possible to skip 0
2394 * in the asm. So 0(%rax) should be same as (%rax).
2395 *
2396 * However, it also start with a segment select register like
2397 * %gs:0x18(%rbx). In that case it should skip the part.
2398 */
2399 if (*str == arch->objdump.register_char) {
2400 if (arch__is(arch, "x86")) {
2401 /* FIXME: Handle other segment registers */
2402 if (!strncmp(str, "%gs:", 4))
2403 op_loc->segment = INSN_SEG_X86_GS;
2404 }
2405
2406 while (*str && !isdigit(*str) &&
2407 *str != arch->objdump.memory_ref_char)
2408 str++;
2409 }
2410
2411 op_loc->offset = strtol(str, &p, 0);
2412
2413 p = strchr(p, arch->objdump.register_char);
2414 if (p == NULL)
2415 return -1;
2416
2417 regname = strdup(p);
2418 if (regname == NULL)
2419 return -1;
2420
2421 op_loc->reg1 = get_dwarf_regnum(regname, arch->e_machine, arch->e_flags);
2422 free(regname);
2423
2424 /* Get the second register */
2425 if (op_loc->multi_regs) {
2426 p = strchr(p + 1, arch->objdump.register_char);
2427 if (p == NULL)
2428 return -1;
2429
2430 regname = strdup(p);
2431 if (regname == NULL)
2432 return -1;
2433
2434 op_loc->reg2 = get_dwarf_regnum(regname, arch->e_machine, arch->e_flags);
2435 free(regname);
2436 }
2437 return 0;
2438 }
2439
2440 /**
2441 * annotate_get_insn_location - Get location of instruction
2442 * @arch: the architecture info
2443 * @dl: the target instruction
2444 * @loc: a buffer to save the data
2445 *
2446 * Get detailed location info (register and offset) in the instruction.
2447 * It needs both source and target operand and whether it accesses a
2448 * memory location. The offset field is meaningful only when the
2449 * corresponding mem flag is set. The reg2 field is meaningful only
2450 * when multi_regs flag is set.
2451 *
2452 * Some examples on x86:
2453 *
2454 * mov (%rax), %rcx # src_reg1 = rax, src_mem = 1, src_offset = 0
2455 * # dst_reg1 = rcx, dst_mem = 0
2456 *
2457 * mov 0x18, %r8 # src_reg1 = -1, src_mem = 0
2458 * # dst_reg1 = r8, dst_mem = 0
2459 *
2460 * mov %rsi, 8(%rbx,%rcx,4) # src_reg1 = rsi, src_mem = 0, src_multi_regs = 0
2461 * # dst_reg1 = rbx, dst_reg2 = rcx, dst_mem = 1
2462 * # dst_multi_regs = 1, dst_offset = 8
2463 */
annotate_get_insn_location(struct arch * arch,struct disasm_line * dl,struct annotated_insn_loc * loc)2464 int annotate_get_insn_location(struct arch *arch, struct disasm_line *dl,
2465 struct annotated_insn_loc *loc)
2466 {
2467 struct ins_operands *ops;
2468 struct annotated_op_loc *op_loc;
2469 int i;
2470
2471 if (ins__is_lock(&dl->ins))
2472 ops = dl->ops.locked.ops;
2473 else
2474 ops = &dl->ops;
2475
2476 if (ops == NULL)
2477 return -1;
2478
2479 memset(loc, 0, sizeof(*loc));
2480
2481 for_each_insn_op_loc(loc, i, op_loc) {
2482 const char *insn_str = ops->source.raw;
2483 bool multi_regs = ops->source.multi_regs;
2484 bool mem_ref = ops->source.mem_ref;
2485
2486 if (i == INSN_OP_TARGET) {
2487 insn_str = ops->target.raw;
2488 multi_regs = ops->target.multi_regs;
2489 mem_ref = ops->target.mem_ref;
2490 }
2491
2492 /* Invalidate the register by default */
2493 op_loc->reg1 = -1;
2494 op_loc->reg2 = -1;
2495
2496 if (insn_str == NULL) {
2497 if (!arch__is(arch, "powerpc"))
2498 continue;
2499 }
2500
2501 /*
2502 * For powerpc, call get_powerpc_regs function which extracts the
2503 * required fields for op_loc, ie reg1, reg2, offset from the
2504 * raw instruction.
2505 */
2506 if (arch__is(arch, "powerpc")) {
2507 op_loc->mem_ref = mem_ref;
2508 op_loc->multi_regs = multi_regs;
2509 get_powerpc_regs(dl->raw.raw_insn, !i, op_loc);
2510 } else if (strchr(insn_str, arch->objdump.memory_ref_char)) {
2511 op_loc->mem_ref = true;
2512 op_loc->multi_regs = multi_regs;
2513 extract_reg_offset(arch, insn_str, op_loc);
2514 } else {
2515 char *s, *p = NULL;
2516
2517 if (arch__is(arch, "x86")) {
2518 /* FIXME: Handle other segment registers */
2519 if (!strncmp(insn_str, "%gs:", 4)) {
2520 op_loc->segment = INSN_SEG_X86_GS;
2521 op_loc->offset = strtol(insn_str + 4,
2522 &p, 0);
2523 if (p && p != insn_str + 4)
2524 op_loc->imm = true;
2525 continue;
2526 }
2527 }
2528
2529 s = strdup(insn_str);
2530 if (s == NULL)
2531 return -1;
2532
2533 if (*s == arch->objdump.register_char)
2534 op_loc->reg1 = get_dwarf_regnum(s, arch->e_machine, arch->e_flags);
2535 else if (*s == arch->objdump.imm_char) {
2536 op_loc->offset = strtol(s + 1, &p, 0);
2537 if (p && p != s + 1)
2538 op_loc->imm = true;
2539 }
2540 free(s);
2541 }
2542 }
2543
2544 return 0;
2545 }
2546
/*
 * Find the disasm line of @sym whose address (sym->start + line offset)
 * equals @ip.  Lines with offset -1 are not instructions and are skipped.
 *
 * When @allow_update is true and the matching line is a bare "lock" prefix
 * with no operands, @ip is advanced by one and the search continues so that
 * the line following the prefix is returned instead.
 *
 * Returns the matching line or NULL when there is none.
 */
static struct disasm_line *find_disasm_line(struct symbol *sym, u64 ip,
					    bool allow_update)
{
	struct disasm_line *dl;
	struct annotation *notes;

	notes = symbol__annotation(sym);

	list_for_each_entry(dl, &notes->src->source, al.node) {
		if (dl->al.offset == -1)
			continue;

		if (sym->start + dl->al.offset == ip) {
			/*
			 * llvm-objdump places "lock" in a separate line and
			 * in that case, we want to get the next line.
			 */
			if (ins__is_lock(&dl->ins) &&
			    *dl->ops.raw == '\0' && allow_update) {
				ip++;
				continue;
			}
			return dl;
		}
	}
	return NULL;
}
2574
annotate_data_stat(struct list_head * head,const char * name)2575 static struct annotated_item_stat *annotate_data_stat(struct list_head *head,
2576 const char *name)
2577 {
2578 struct annotated_item_stat *istat;
2579
2580 list_for_each_entry(istat, head, list) {
2581 if (!strcmp(istat->name, name))
2582 return istat;
2583 }
2584
2585 istat = zalloc(sizeof(*istat));
2586 if (istat == NULL)
2587 return NULL;
2588
2589 istat->name = strdup(name);
2590 if ((istat->name == NULL) || (!strlen(istat->name))) {
2591 free(istat);
2592 return NULL;
2593 }
2594
2595 list_add_tail(&istat->list, head);
2596 return istat;
2597 }
2598
is_stack_operation(struct arch * arch,struct disasm_line * dl)2599 static bool is_stack_operation(struct arch *arch, struct disasm_line *dl)
2600 {
2601 if (arch__is(arch, "x86")) {
2602 if (!strncmp(dl->ins.name, "push", 4) ||
2603 !strncmp(dl->ins.name, "pop", 3) ||
2604 !strncmp(dl->ins.name, "call", 4) ||
2605 !strncmp(dl->ins.name, "ret", 3))
2606 return true;
2607 }
2608
2609 return false;
2610 }
2611
is_stack_canary(struct arch * arch,struct annotated_op_loc * loc)2612 static bool is_stack_canary(struct arch *arch, struct annotated_op_loc *loc)
2613 {
2614 /* On x86_64, %gs:40 is used for stack canary */
2615 if (arch__is(arch, "x86")) {
2616 if (loc->segment == INSN_SEG_X86_GS && loc->imm &&
2617 loc->offset == 40)
2618 return true;
2619 }
2620
2621 return false;
2622 }
2623
2624 static struct disasm_line *
annotation__prev_asm_line(struct annotation * notes,struct disasm_line * curr)2625 annotation__prev_asm_line(struct annotation *notes, struct disasm_line *curr)
2626 {
2627 struct list_head *sources = ¬es->src->source;
2628 struct disasm_line *prev;
2629
2630 if (curr == list_first_entry(sources, struct disasm_line, al.node))
2631 return NULL;
2632
2633 prev = list_prev_entry(curr, al.node);
2634 while (prev->al.offset == -1 &&
2635 prev != list_first_entry(sources, struct disasm_line, al.node))
2636 prev = list_prev_entry(prev, al.node);
2637
2638 if (prev->al.offset == -1)
2639 return NULL;
2640
2641 return prev;
2642 }
2643
2644 static struct disasm_line *
annotation__next_asm_line(struct annotation * notes,struct disasm_line * curr)2645 annotation__next_asm_line(struct annotation *notes, struct disasm_line *curr)
2646 {
2647 struct list_head *sources = ¬es->src->source;
2648 struct disasm_line *next;
2649
2650 if (curr == list_last_entry(sources, struct disasm_line, al.node))
2651 return NULL;
2652
2653 next = list_next_entry(curr, al.node);
2654 while (next->al.offset == -1 &&
2655 next != list_last_entry(sources, struct disasm_line, al.node))
2656 next = list_next_entry(next, al.node);
2657
2658 if (next->al.offset == -1)
2659 return NULL;
2660
2661 return next;
2662 }
2663
/*
 * Compute the address referenced by a PC-relative operand of @dl.
 *
 * @ip is the address of @dl itself and @offset the displacement taken from
 * the operand.  The result is converted with map__rip_2objdump().
 */
u64 annotate_calc_pcrel(struct map_symbol *ms, u64 ip, int offset,
			struct disasm_line *dl)
{
	struct annotation *notes = symbol__annotation(ms->sym);
	struct disasm_line *next = annotation__next_asm_line(notes, dl);
	u64 next_insn;

	/*
	 * PC-relative addressing starts from the next instruction address
	 * But the IP is for the current instruction.  Since disasm_line
	 * doesn't have the instruction size, calculate it using the next
	 * disasm_line.  If it's the last one, we can use symbol's end
	 * address directly.
	 */
	if (next != NULL)
		next_insn = ip + (next->al.offset - dl->al.offset);
	else
		next_insn = ms->sym->end;

	return map__rip_2objdump(ms->map, next_insn + offset);
}
2687
/*
 * One-entry cache of the debuginfo used by hist_entry__get_data_type().
 * Released by debuginfo_cache__delete().
 */
static struct debuginfo_cache {
	/* DSO the cached debuginfo was opened for (a reference is held) */
	struct dso *dso;
	/* debuginfo of @dso, NULL when it could not be opened */
	struct debuginfo *dbg;
} di_cache;
2692
debuginfo_cache__delete(void)2693 void debuginfo_cache__delete(void)
2694 {
2695 dso__put(di_cache.dso);
2696 di_cache.dso = NULL;
2697
2698 debuginfo__delete(di_cache.dbg);
2699 di_cache.dbg = NULL;
2700 }
2701
2702 static struct annotated_data_type *
__hist_entry__get_data_type(struct hist_entry * he,struct arch * arch,struct debuginfo * dbg,struct disasm_line * dl,int * type_offset)2703 __hist_entry__get_data_type(struct hist_entry *he, struct arch *arch,
2704 struct debuginfo *dbg, struct disasm_line *dl,
2705 int *type_offset)
2706 {
2707 struct map_symbol *ms = &he->ms;
2708 struct annotated_insn_loc loc;
2709 struct annotated_op_loc *op_loc;
2710 struct annotated_data_type *mem_type;
2711 struct annotated_item_stat *istat;
2712 int i;
2713
2714 istat = annotate_data_stat(&ann_insn_stat, dl->ins.name);
2715 if (istat == NULL) {
2716 ann_data_stat.no_insn++;
2717 return NO_TYPE;
2718 }
2719
2720 if (annotate_get_insn_location(arch, dl, &loc) < 0) {
2721 ann_data_stat.no_insn_ops++;
2722 istat->bad++;
2723 return NO_TYPE;
2724 }
2725
2726 if (is_stack_operation(arch, dl)) {
2727 istat->good++;
2728 *type_offset = 0;
2729 return &stackop_type;
2730 }
2731
2732 for_each_insn_op_loc(&loc, i, op_loc) {
2733 struct data_loc_info dloc = {
2734 .arch = arch,
2735 .thread = he->thread,
2736 .ms = ms,
2737 .ip = ms->sym->start + dl->al.offset,
2738 .cpumode = he->cpumode,
2739 .op = op_loc,
2740 .di = dbg,
2741 };
2742
2743 if (!op_loc->mem_ref && op_loc->segment == INSN_SEG_NONE)
2744 continue;
2745
2746 /* PC-relative addressing */
2747 if (op_loc->reg1 == DWARF_REG_PC) {
2748 dloc.var_addr = annotate_calc_pcrel(ms, dloc.ip,
2749 op_loc->offset, dl);
2750 }
2751
2752 /* This CPU access in kernel - pretend PC-relative addressing */
2753 if (dso__kernel(map__dso(ms->map)) && arch__is(arch, "x86") &&
2754 op_loc->segment == INSN_SEG_X86_GS && op_loc->imm) {
2755 dloc.var_addr = op_loc->offset;
2756 op_loc->reg1 = DWARF_REG_PC;
2757 }
2758
2759 mem_type = find_data_type(&dloc);
2760
2761 if (mem_type == NULL && is_stack_canary(arch, op_loc)) {
2762 istat->good++;
2763 *type_offset = 0;
2764 return &canary_type;
2765 }
2766
2767 if (mem_type)
2768 istat->good++;
2769 else
2770 istat->bad++;
2771
2772 if (symbol_conf.annotate_data_sample) {
2773 struct evsel *evsel = hists_to_evsel(he->hists);
2774
2775 annotated_data_type__update_samples(mem_type, evsel,
2776 dloc.type_offset,
2777 he->stat.nr_events,
2778 he->stat.period);
2779 }
2780 *type_offset = dloc.type_offset;
2781 return mem_type ?: NO_TYPE;
2782 }
2783
2784 /* retry with a fused instruction */
2785 return NULL;
2786 }
2787
2788 /**
2789 * hist_entry__get_data_type - find data type for given hist entry
2790 * @he: hist entry
2791 *
2792 * This function first annotates the instruction at @he->ip and extracts
2793 * register and offset info from it. Then it searches the DWARF debug
2794 * info to get a variable and type information using the address, register,
2795 * and offset.
2796 */
hist_entry__get_data_type(struct hist_entry * he)2797 struct annotated_data_type *hist_entry__get_data_type(struct hist_entry *he)
2798 {
2799 struct map_symbol *ms = &he->ms;
2800 struct evsel *evsel = hists_to_evsel(he->hists);
2801 struct arch *arch;
2802 struct disasm_line *dl;
2803 struct annotated_data_type *mem_type;
2804 struct annotated_item_stat *istat;
2805 u64 ip = he->ip;
2806
2807 ann_data_stat.total++;
2808
2809 if (ms->map == NULL || ms->sym == NULL) {
2810 ann_data_stat.no_sym++;
2811 return NULL;
2812 }
2813
2814 if (!symbol_conf.init_annotation) {
2815 ann_data_stat.no_sym++;
2816 return NULL;
2817 }
2818
2819 /*
2820 * di_cache holds a pair of values, but code below assumes
2821 * di_cache.dso can be compared/updated and di_cache.dbg can be
2822 * read/updated independently from each other. That assumption only
2823 * holds in single threaded code.
2824 */
2825 assert(perf_singlethreaded);
2826
2827 if (map__dso(ms->map) != di_cache.dso) {
2828 dso__put(di_cache.dso);
2829 di_cache.dso = dso__get(map__dso(ms->map));
2830
2831 debuginfo__delete(di_cache.dbg);
2832 di_cache.dbg = debuginfo__new(dso__long_name(di_cache.dso));
2833 }
2834
2835 if (di_cache.dbg == NULL) {
2836 ann_data_stat.no_dbginfo++;
2837 return NULL;
2838 }
2839
2840 /* Make sure it has the disasm of the function */
2841 if (symbol__annotate(ms, evsel, &arch) < 0) {
2842 ann_data_stat.no_insn++;
2843 return NULL;
2844 }
2845
2846 /*
2847 * Get a disasm to extract the location from the insn.
2848 * This is too slow...
2849 */
2850 dl = find_disasm_line(ms->sym, ip, /*allow_update=*/true);
2851 if (dl == NULL) {
2852 ann_data_stat.no_insn++;
2853 return NULL;
2854 }
2855
2856 retry:
2857 mem_type = __hist_entry__get_data_type(he, arch, di_cache.dbg, dl,
2858 &he->mem_type_off);
2859 if (mem_type)
2860 return mem_type == NO_TYPE ? NULL : mem_type;
2861
2862 /*
2863 * Some instructions can be fused and the actual memory access came
2864 * from the previous instruction.
2865 */
2866 if (dl->al.offset > 0) {
2867 struct annotation *notes;
2868 struct disasm_line *prev_dl;
2869
2870 notes = symbol__annotation(ms->sym);
2871 prev_dl = annotation__prev_asm_line(notes, dl);
2872
2873 if (prev_dl && ins__is_fused(arch, prev_dl->ins.name, dl->ins.name)) {
2874 dl = prev_dl;
2875 goto retry;
2876 }
2877 }
2878
2879 ann_data_stat.no_mem_ops++;
2880 istat = annotate_data_stat(&ann_insn_stat, dl->ins.name);
2881 if (istat)
2882 istat->bad++;
2883 return NULL;
2884 }
2885
2886 /* Basic block traversal (BFS) data structure */
2887 struct basic_block_data {
2888 struct list_head queue;
2889 struct list_head visited;
2890 };
2891
2892 /*
2893 * During the traversal, it needs to know the parent block where the current
2894 * block block started from. Note that single basic block can be parent of
2895 * two child basic blocks (in case of condition jump).
2896 */
2897 struct basic_block_link {
2898 struct list_head node;
2899 struct basic_block_link *parent;
2900 struct annotated_basic_block *bb;
2901 };
2902
2903 /* Check any of basic block in the list already has the offset */
basic_block_has_offset(struct list_head * head,s64 offset)2904 static bool basic_block_has_offset(struct list_head *head, s64 offset)
2905 {
2906 struct basic_block_link *link;
2907
2908 list_for_each_entry(link, head, node) {
2909 s64 begin_offset = link->bb->begin->al.offset;
2910 s64 end_offset = link->bb->end->al.offset;
2911
2912 if (begin_offset <= offset && offset <= end_offset)
2913 return true;
2914 }
2915 return false;
2916 }
2917
is_new_basic_block(struct basic_block_data * bb_data,struct disasm_line * dl)2918 static bool is_new_basic_block(struct basic_block_data *bb_data,
2919 struct disasm_line *dl)
2920 {
2921 s64 offset = dl->al.offset;
2922
2923 if (basic_block_has_offset(&bb_data->visited, offset))
2924 return false;
2925 if (basic_block_has_offset(&bb_data->queue, offset))
2926 return false;
2927 return true;
2928 }
2929
2930 /* Add a basic block starting from dl and link it to the parent */
add_basic_block(struct basic_block_data * bb_data,struct basic_block_link * parent,struct disasm_line * dl)2931 static int add_basic_block(struct basic_block_data *bb_data,
2932 struct basic_block_link *parent,
2933 struct disasm_line *dl)
2934 {
2935 struct annotated_basic_block *bb;
2936 struct basic_block_link *link;
2937
2938 if (dl == NULL)
2939 return -1;
2940
2941 if (!is_new_basic_block(bb_data, dl))
2942 return 0;
2943
2944 bb = zalloc(sizeof(*bb));
2945 if (bb == NULL)
2946 return -1;
2947
2948 bb->begin = dl;
2949 bb->end = dl;
2950 INIT_LIST_HEAD(&bb->list);
2951
2952 link = malloc(sizeof(*link));
2953 if (link == NULL) {
2954 free(bb);
2955 return -1;
2956 }
2957
2958 link->bb = bb;
2959 link->parent = parent;
2960 list_add_tail(&link->node, &bb_data->queue);
2961 return 0;
2962 }
2963
2964 /* Returns true when it finds the target in the current basic block */
process_basic_block(struct basic_block_data * bb_data,struct basic_block_link * link,struct symbol * sym,u64 target)2965 static bool process_basic_block(struct basic_block_data *bb_data,
2966 struct basic_block_link *link,
2967 struct symbol *sym, u64 target)
2968 {
2969 struct disasm_line *dl, *next_dl, *last_dl;
2970 struct annotation *notes = symbol__annotation(sym);
2971 bool found = false;
2972
2973 dl = link->bb->begin;
2974 /* Check if it's already visited */
2975 if (basic_block_has_offset(&bb_data->visited, dl->al.offset))
2976 return false;
2977
2978 last_dl = list_last_entry(¬es->src->source,
2979 struct disasm_line, al.node);
2980 if (last_dl->al.offset == -1)
2981 last_dl = annotation__prev_asm_line(notes, last_dl);
2982
2983 if (last_dl == NULL)
2984 return false;
2985
2986 list_for_each_entry_from(dl, ¬es->src->source, al.node) {
2987 /* Skip comment or debug info line */
2988 if (dl->al.offset == -1)
2989 continue;
2990 /* Found the target instruction */
2991 if (sym->start + dl->al.offset == target) {
2992 found = true;
2993 break;
2994 }
2995 /* End of the function, finish the block */
2996 if (dl == last_dl)
2997 break;
2998 /* 'return' instruction finishes the block */
2999 if (ins__is_ret(&dl->ins))
3000 break;
3001 /* normal instructions are part of the basic block */
3002 if (!ins__is_jump(&dl->ins))
3003 continue;
3004 /* jump to a different function, tail call or return */
3005 if (dl->ops.target.outside)
3006 break;
3007 /* jump instruction creates new basic block(s) */
3008 next_dl = find_disasm_line(sym, sym->start + dl->ops.target.offset,
3009 /*allow_update=*/false);
3010 if (next_dl)
3011 add_basic_block(bb_data, link, next_dl);
3012
3013 /*
3014 * FIXME: determine conditional jumps properly.
3015 * Conditional jumps create another basic block with the
3016 * next disasm line.
3017 */
3018 if (!strstr(dl->ins.name, "jmp")) {
3019 next_dl = annotation__next_asm_line(notes, dl);
3020 if (next_dl)
3021 add_basic_block(bb_data, link, next_dl);
3022 }
3023 break;
3024
3025 }
3026 link->bb->end = dl;
3027 return found;
3028 }
3029
3030 /*
3031 * It founds a target basic block, build a proper linked list of basic blocks
3032 * by following the link recursively.
3033 */
link_found_basic_blocks(struct basic_block_link * link,struct list_head * head)3034 static void link_found_basic_blocks(struct basic_block_link *link,
3035 struct list_head *head)
3036 {
3037 while (link) {
3038 struct basic_block_link *parent = link->parent;
3039
3040 list_move(&link->bb->list, head);
3041 list_del(&link->node);
3042 free(link);
3043
3044 link = parent;
3045 }
3046 }
3047
delete_basic_blocks(struct basic_block_data * bb_data)3048 static void delete_basic_blocks(struct basic_block_data *bb_data)
3049 {
3050 struct basic_block_link *link, *tmp;
3051
3052 list_for_each_entry_safe(link, tmp, &bb_data->queue, node) {
3053 list_del(&link->node);
3054 zfree(&link->bb);
3055 free(link);
3056 }
3057
3058 list_for_each_entry_safe(link, tmp, &bb_data->visited, node) {
3059 list_del(&link->node);
3060 zfree(&link->bb);
3061 free(link);
3062 }
3063 }
3064
3065 /**
3066 * annotate_get_basic_blocks - Get basic blocks for given address range
3067 * @sym: symbol to annotate
3068 * @src: source address
3069 * @dst: destination address
3070 * @head: list head to save basic blocks
3071 *
3072 * This function traverses disasm_lines from @src to @dst and save them in a
3073 * list of annotated_basic_block to @head. It uses BFS to find the shortest
3074 * path between two. The basic_block_link is to maintain parent links so
3075 * that it can build a list of blocks from the start.
3076 */
annotate_get_basic_blocks(struct symbol * sym,s64 src,s64 dst,struct list_head * head)3077 int annotate_get_basic_blocks(struct symbol *sym, s64 src, s64 dst,
3078 struct list_head *head)
3079 {
3080 struct basic_block_data bb_data = {
3081 .queue = LIST_HEAD_INIT(bb_data.queue),
3082 .visited = LIST_HEAD_INIT(bb_data.visited),
3083 };
3084 struct basic_block_link *link;
3085 struct disasm_line *dl;
3086 int ret = -1;
3087
3088 dl = find_disasm_line(sym, src, /*allow_update=*/false);
3089 if (dl == NULL)
3090 return -1;
3091
3092 if (add_basic_block(&bb_data, /*parent=*/NULL, dl) < 0)
3093 return -1;
3094
3095 /* Find shortest path from src to dst using BFS */
3096 while (!list_empty(&bb_data.queue)) {
3097 link = list_first_entry(&bb_data.queue, struct basic_block_link, node);
3098
3099 if (process_basic_block(&bb_data, link, sym, dst)) {
3100 link_found_basic_blocks(link, head);
3101 ret = 0;
3102 break;
3103 }
3104 list_move(&link->node, &bb_data.visited);
3105 }
3106 delete_basic_blocks(&bb_data);
3107 return ret;
3108 }
3109