1 /* 2 * Copyright (C) 2011, Red Hat Inc, Arnaldo Carvalho de Melo <acme@redhat.com> 3 * 4 * Parts came from builtin-annotate.c, see those files for further 5 * copyright notes. 6 * 7 * Released under the GPL v2. (and only v2, not any later version) 8 */ 9 10 #include <errno.h> 11 #include <inttypes.h> 12 #include <libgen.h> 13 #include "util.h" 14 #include "ui/ui.h" 15 #include "sort.h" 16 #include "build-id.h" 17 #include "color.h" 18 #include "config.h" 19 #include "cache.h" 20 #include "symbol.h" 21 #include "units.h" 22 #include "debug.h" 23 #include "annotate.h" 24 #include "evsel.h" 25 #include "evlist.h" 26 #include "block-range.h" 27 #include "string2.h" 28 #include "arch/common.h" 29 #include <regex.h> 30 #include <pthread.h> 31 #include <linux/bitops.h> 32 #include <linux/kernel.h> 33 34 /* FIXME: For the HE_COLORSET */ 35 #include "ui/browser.h" 36 37 /* 38 * FIXME: Using the same values as slang.h, 39 * but that header may not be available everywhere 40 */ 41 #define LARROW_CHAR ((unsigned char)',') 42 #define RARROW_CHAR ((unsigned char)'+') 43 #define DARROW_CHAR ((unsigned char)'.') 44 #define UARROW_CHAR ((unsigned char)'-') 45 46 #include "sane_ctype.h" 47 48 struct annotation_options annotation__default_options = { 49 .use_offset = true, 50 .jump_arrows = true, 51 .annotate_src = true, 52 .offset_level = ANNOTATION__OFFSET_JUMP_TARGETS, 53 .percent_type = PERCENT_PERIOD_LOCAL, 54 }; 55 56 static regex_t file_lineno; 57 58 static struct ins_ops *ins__find(struct arch *arch, const char *name); 59 static void ins__sort(struct arch *arch); 60 static int disasm_line__parse(char *line, const char **namep, char **rawp); 61 62 struct arch { 63 const char *name; 64 struct ins *instructions; 65 size_t nr_instructions; 66 size_t nr_instructions_allocated; 67 struct ins_ops *(*associate_instruction_ops)(struct arch *arch, const char *name); 68 bool sorted_instructions; 69 bool initialized; 70 void *priv; 71 unsigned int model; 72 unsigned int family; 73 int (*init)(struct arch *arch, char *cpuid); 74 bool (*ins_is_fused)(struct arch *arch, const char *ins1, 75 const char *ins2); 76 struct { 77 char comment_char; 78 char skip_functions_char; 79 } objdump; 80 }; 81 82 static struct ins_ops call_ops; 83 static struct ins_ops dec_ops; 84 static struct ins_ops jump_ops; 85 static struct ins_ops mov_ops; 86 static struct ins_ops nop_ops; 87 static struct ins_ops lock_ops; 88 static struct ins_ops ret_ops; 89 90 static int arch__grow_instructions(struct arch *arch) 91 { 92 struct ins *new_instructions; 93 size_t new_nr_allocated; 94 95 if (arch->nr_instructions_allocated == 0 && arch->instructions) 96 goto grow_from_non_allocated_table; 97 98 new_nr_allocated = arch->nr_instructions_allocated + 128; 99 new_instructions = realloc(arch->instructions, new_nr_allocated * sizeof(struct ins)); 100 if (new_instructions == NULL) 101 return -1; 102 103 out_update_instructions: 104 arch->instructions = new_instructions; 105 arch->nr_instructions_allocated = new_nr_allocated; 106 return 0; 107 108 grow_from_non_allocated_table: 109 new_nr_allocated = arch->nr_instructions + 128; 110 new_instructions = calloc(new_nr_allocated, sizeof(struct ins)); 111 if (new_instructions == NULL) 112 return -1; 113 114 memcpy(new_instructions, arch->instructions, arch->nr_instructions); 115 goto out_update_instructions; 116 } 117 118 static int arch__associate_ins_ops(struct arch* arch, const char *name, struct ins_ops *ops) 119 { 120 struct ins *ins; 121 122 if (arch->nr_instructions == arch->nr_instructions_allocated && 123 arch__grow_instructions(arch)) 124 return -1; 125 126 ins = &arch->instructions[arch->nr_instructions]; 127 ins->name = strdup(name); 128 if (!ins->name) 129 return -1; 130 131 ins->ops = ops; 132 arch->nr_instructions++; 133 134 ins__sort(arch); 135 return 0; 136 } 137 138 #include "arch/arc/annotate/instructions.c" 139 #include "arch/arm/annotate/instructions.c" 140 #include "arch/arm64/annotate/instructions.c" 141 #include "arch/x86/annotate/instructions.c" 142 #include "arch/powerpc/annotate/instructions.c" 143 #include "arch/s390/annotate/instructions.c" 144 #include "arch/sparc/annotate/instructions.c" 145 146 static struct arch architectures[] = { 147 { 148 .name = "arc", 149 .init = arc__annotate_init, 150 }, 151 { 152 .name = "arm", 153 .init = arm__annotate_init, 154 }, 155 { 156 .name = "arm64", 157 .init = arm64__annotate_init, 158 }, 159 { 160 .name = "x86", 161 .init = x86__annotate_init, 162 .instructions = x86__instructions, 163 .nr_instructions = ARRAY_SIZE(x86__instructions), 164 .ins_is_fused = x86__ins_is_fused, 165 .objdump = { 166 .comment_char = '#', 167 }, 168 }, 169 { 170 .name = "powerpc", 171 .init = powerpc__annotate_init, 172 }, 173 { 174 .name = "s390", 175 .init = s390__annotate_init, 176 .objdump = { 177 .comment_char = '#', 178 }, 179 }, 180 { 181 .name = "sparc", 182 .init = sparc__annotate_init, 183 .objdump = { 184 .comment_char = '#', 185 }, 186 }, 187 }; 188 189 static void ins__delete(struct ins_operands *ops) 190 { 191 if (ops == NULL) 192 return; 193 zfree(&ops->source.raw); 194 zfree(&ops->source.name); 195 zfree(&ops->target.raw); 196 zfree(&ops->target.name); 197 } 198 199 static int ins__raw_scnprintf(struct ins *ins, char *bf, size_t size, 200 struct ins_operands *ops) 201 { 202 return scnprintf(bf, size, "%-6s %s", ins->name, ops->raw); 203 } 204 205 int ins__scnprintf(struct ins *ins, char *bf, size_t size, 206 struct ins_operands *ops) 207 { 208 if (ins->ops->scnprintf) 209 return ins->ops->scnprintf(ins, bf, size, ops); 210 211 return ins__raw_scnprintf(ins, bf, size, ops); 212 } 213 214 bool ins__is_fused(struct arch *arch, const char *ins1, const char *ins2) 215 { 216 if (!arch || !arch->ins_is_fused) 217 return false; 218 219 return arch->ins_is_fused(arch, ins1, ins2); 220 } 221 222 static int call__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms) 223 { 224 char *endptr, *tok, *name; 225 struct map *map = ms->map; 226 struct addr_map_symbol target = { 227 .map = map, 228 }; 229 230 ops->target.addr = strtoull(ops->raw, &endptr, 16); 231 232 name = strchr(endptr, '<'); 233 if (name == NULL) 234 goto indirect_call; 235 236 name++; 237 238 if (arch->objdump.skip_functions_char && 239 strchr(name, arch->objdump.skip_functions_char)) 240 return -1; 241 242 tok = strchr(name, '>'); 243 if (tok == NULL) 244 return -1; 245 246 *tok = '\0'; 247 ops->target.name = strdup(name); 248 *tok = '>'; 249 250 if (ops->target.name == NULL) 251 return -1; 252 find_target: 253 target.addr = map__objdump_2mem(map, ops->target.addr); 254 255 if (map_groups__find_ams(&target) == 0 && 256 map__rip_2objdump(target.map, map->map_ip(target.map, target.addr)) == ops->target.addr) 257 ops->target.sym = target.sym; 258 259 return 0; 260 261 indirect_call: 262 tok = strchr(endptr, '*'); 263 if (tok != NULL) { 264 endptr++; 265 266 /* Indirect call can use a non-rip register and offset: callq *0x8(%rbx). 267 * Do not parse such instruction. */ 268 if (strstr(endptr, "(%r") == NULL) 269 ops->target.addr = strtoull(endptr, NULL, 16); 270 } 271 goto find_target; 272 } 273 274 static int call__scnprintf(struct ins *ins, char *bf, size_t size, 275 struct ins_operands *ops) 276 { 277 if (ops->target.sym) 278 return scnprintf(bf, size, "%-6s %s", ins->name, ops->target.sym->name); 279 280 if (ops->target.addr == 0) 281 return ins__raw_scnprintf(ins, bf, size, ops); 282 283 if (ops->target.name) 284 return scnprintf(bf, size, "%-6s %s", ins->name, ops->target.name); 285 286 return scnprintf(bf, size, "%-6s *%" PRIx64, ins->name, ops->target.addr); 287 } 288 289 static struct ins_ops call_ops = { 290 .parse = call__parse, 291 .scnprintf = call__scnprintf, 292 }; 293 294 bool ins__is_call(const struct ins *ins) 295 { 296 return ins->ops == &call_ops || ins->ops == &s390_call_ops; 297 } 298 299 /* 300 * Prevents from matching commas in the comment section, e.g.: 301 * ffff200008446e70: b.cs ffff2000084470f4 <generic_exec_single+0x314> // b.hs, b.nlast 302 */ 303 static inline const char *validate_comma(const char *c, struct ins_operands *ops) 304 { 305 if (ops->raw_comment && c > ops->raw_comment) 306 return NULL; 307 308 return c; 309 } 310 311 static int jump__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms) 312 { 313 struct map *map = ms->map; 314 struct symbol *sym = ms->sym; 315 struct addr_map_symbol target = { 316 .map = map, 317 }; 318 const char *c = strchr(ops->raw, ','); 319 u64 start, end; 320 321 ops->raw_comment = strchr(ops->raw, arch->objdump.comment_char); 322 c = validate_comma(c, ops); 323 324 /* 325 * Examples of lines to parse for the _cpp_lex_token@@Base 326 * function: 327 * 328 * 1159e6c: jne 115aa32 <_cpp_lex_token@@Base+0xf92> 329 * 1159e8b: jne c469be <cpp_named_operator2name@@Base+0xa72> 330 * 331 * The first is a jump to an offset inside the same function, 332 * the second is to another function, i.e. that 0xa72 is an 333 * offset in the cpp_named_operator2name@@base function. 334 */ 335 /* 336 * skip over possible up to 2 operands to get to address, e.g.: 337 * tbnz w0, #26, ffff0000083cd190 <security_file_permission+0xd0> 338 */ 339 if (c++ != NULL) { 340 ops->target.addr = strtoull(c, NULL, 16); 341 if (!ops->target.addr) { 342 c = strchr(c, ','); 343 c = validate_comma(c, ops); 344 if (c++ != NULL) 345 ops->target.addr = strtoull(c, NULL, 16); 346 } 347 } else { 348 ops->target.addr = strtoull(ops->raw, NULL, 16); 349 } 350 351 target.addr = map__objdump_2mem(map, ops->target.addr); 352 start = map->unmap_ip(map, sym->start), 353 end = map->unmap_ip(map, sym->end); 354 355 ops->target.outside = target.addr < start || target.addr > end; 356 357 /* 358 * FIXME: things like this in _cpp_lex_token (gcc's cc1 program): 359 360 cpp_named_operator2name@@Base+0xa72 361 362 * Point to a place that is after the cpp_named_operator2name 363 * boundaries, i.e. in the ELF symbol table for cc1 364 * cpp_named_operator2name is marked as being 32-bytes long, but it in 365 * fact is much larger than that, so we seem to need a symbols__find() 366 * routine that looks for >= current->start and < next_symbol->start, 367 * possibly just for C++ objects? 368 * 369 * For now lets just make some progress by marking jumps to outside the 370 * current function as call like. 371 * 372 * Actual navigation will come next, with further understanding of how 373 * the symbol searching and disassembly should be done. 374 */ 375 if (map_groups__find_ams(&target) == 0 && 376 map__rip_2objdump(target.map, map->map_ip(target.map, target.addr)) == ops->target.addr) 377 ops->target.sym = target.sym; 378 379 if (!ops->target.outside) { 380 ops->target.offset = target.addr - start; 381 ops->target.offset_avail = true; 382 } else { 383 ops->target.offset_avail = false; 384 } 385 386 return 0; 387 } 388 389 static int jump__scnprintf(struct ins *ins, char *bf, size_t size, 390 struct ins_operands *ops) 391 { 392 const char *c; 393 394 if (!ops->target.addr || ops->target.offset < 0) 395 return ins__raw_scnprintf(ins, bf, size, ops); 396 397 if (ops->target.outside && ops->target.sym != NULL) 398 return scnprintf(bf, size, "%-6s %s", ins->name, ops->target.sym->name); 399 400 c = strchr(ops->raw, ','); 401 c = validate_comma(c, ops); 402 403 if (c != NULL) { 404 const char *c2 = strchr(c + 1, ','); 405 406 c2 = validate_comma(c2, ops); 407 /* check for 3-op insn */ 408 if (c2 != NULL) 409 c = c2; 410 c++; 411 412 /* mirror arch objdump's space-after-comma style */ 413 if (*c == ' ') 414 c++; 415 } 416 417 return scnprintf(bf, size, "%-6s %.*s%" PRIx64, 418 ins->name, c ? c - ops->raw : 0, ops->raw, 419 ops->target.offset); 420 } 421 422 static struct ins_ops jump_ops = { 423 .parse = jump__parse, 424 .scnprintf = jump__scnprintf, 425 }; 426 427 bool ins__is_jump(const struct ins *ins) 428 { 429 return ins->ops == &jump_ops; 430 } 431 432 static int comment__symbol(char *raw, char *comment, u64 *addrp, char **namep) 433 { 434 char *endptr, *name, *t; 435 436 if (strstr(raw, "(%rip)") == NULL) 437 return 0; 438 439 *addrp = strtoull(comment, &endptr, 16); 440 if (endptr == comment) 441 return 0; 442 name = strchr(endptr, '<'); 443 if (name == NULL) 444 return -1; 445 446 name++; 447 448 t = strchr(name, '>'); 449 if (t == NULL) 450 return 0; 451 452 *t = '\0'; 453 *namep = strdup(name); 454 *t = '>'; 455 456 return 0; 457 } 458 459 static int lock__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms) 460 { 461 ops->locked.ops = zalloc(sizeof(*ops->locked.ops)); 462 if (ops->locked.ops == NULL) 463 return 0; 464 465 if (disasm_line__parse(ops->raw, &ops->locked.ins.name, &ops->locked.ops->raw) < 0) 466 goto out_free_ops; 467 468 ops->locked.ins.ops = ins__find(arch, ops->locked.ins.name); 469 470 if (ops->locked.ins.ops == NULL) 471 goto out_free_ops; 472 473 if (ops->locked.ins.ops->parse && 474 ops->locked.ins.ops->parse(arch, ops->locked.ops, ms) < 0) 475 goto out_free_ops; 476 477 return 0; 478 479 out_free_ops: 480 zfree(&ops->locked.ops); 481 return 0; 482 } 483 484 static int lock__scnprintf(struct ins *ins, char *bf, size_t size, 485 struct ins_operands *ops) 486 { 487 int printed; 488 489 if (ops->locked.ins.ops == NULL) 490 return ins__raw_scnprintf(ins, bf, size, ops); 491 492 printed = scnprintf(bf, size, "%-6s ", ins->name); 493 return printed + ins__scnprintf(&ops->locked.ins, bf + printed, 494 size - printed, ops->locked.ops); 495 } 496 497 static void lock__delete(struct ins_operands *ops) 498 { 499 struct ins *ins = &ops->locked.ins; 500 501 if (ins->ops && ins->ops->free) 502 ins->ops->free(ops->locked.ops); 503 else 504 ins__delete(ops->locked.ops); 505 506 zfree(&ops->locked.ops); 507 zfree(&ops->target.raw); 508 zfree(&ops->target.name); 509 } 510 511 static struct ins_ops lock_ops = { 512 .free = lock__delete, 513 .parse = lock__parse, 514 .scnprintf = lock__scnprintf, 515 }; 516 517 static int mov__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms __maybe_unused) 518 { 519 char *s = strchr(ops->raw, ','), *target, *comment, prev; 520 521 if (s == NULL) 522 return -1; 523 524 *s = '\0'; 525 ops->source.raw = strdup(ops->raw); 526 *s = ','; 527 528 if (ops->source.raw == NULL) 529 return -1; 530 531 target = ++s; 532 comment = strchr(s, arch->objdump.comment_char); 533 534 if (comment != NULL) 535 s = comment - 1; 536 else 537 s = strchr(s, '\0') - 1; 538 539 while (s > target && isspace(s[0])) 540 --s; 541 s++; 542 prev = *s; 543 *s = '\0'; 544 545 ops->target.raw = strdup(target); 546 *s = prev; 547 548 if (ops->target.raw == NULL) 549 goto out_free_source; 550 551 if (comment == NULL) 552 return 0; 553 554 comment = ltrim(comment); 555 comment__symbol(ops->source.raw, comment + 1, &ops->source.addr, &ops->source.name); 556 comment__symbol(ops->target.raw, comment + 1, &ops->target.addr, &ops->target.name); 557 558 return 0; 559 560 out_free_source: 561 zfree(&ops->source.raw); 562 return -1; 563 } 564 565 static int mov__scnprintf(struct ins *ins, char *bf, size_t size, 566 struct ins_operands *ops) 567 { 568 return scnprintf(bf, size, "%-6s %s,%s", ins->name, 569 ops->source.name ?: ops->source.raw, 570 ops->target.name ?: ops->target.raw); 571 } 572 573 static struct ins_ops mov_ops = { 574 .parse = mov__parse, 575 .scnprintf = mov__scnprintf, 576 }; 577 578 static int dec__parse(struct arch *arch __maybe_unused, struct ins_operands *ops, struct map_symbol *ms __maybe_unused) 579 { 580 char *target, *comment, *s, prev; 581 582 target = s = ops->raw; 583 584 while (s[0] != '\0' && !isspace(s[0])) 585 ++s; 586 prev = *s; 587 *s = '\0'; 588 589 ops->target.raw = strdup(target); 590 *s = prev; 591 592 if (ops->target.raw == NULL) 593 return -1; 594 595 comment = strchr(s, arch->objdump.comment_char); 596 if (comment == NULL) 597 return 0; 598 599 comment = ltrim(comment); 600 comment__symbol(ops->target.raw, comment + 1, &ops->target.addr, &ops->target.name); 601 602 return 0; 603 } 604 605 static int dec__scnprintf(struct ins *ins, char *bf, size_t size, 606 struct ins_operands *ops) 607 { 608 return scnprintf(bf, size, "%-6s %s", ins->name, 609 ops->target.name ?: ops->target.raw); 610 } 611 612 static struct ins_ops dec_ops = { 613 .parse = dec__parse, 614 .scnprintf = dec__scnprintf, 615 }; 616 617 static int nop__scnprintf(struct ins *ins __maybe_unused, char *bf, size_t size, 618 struct ins_operands *ops __maybe_unused) 619 { 620 return scnprintf(bf, size, "%-6s", "nop"); 621 } 622 623 static struct ins_ops nop_ops = { 624 .scnprintf = nop__scnprintf, 625 }; 626 627 static struct ins_ops ret_ops = { 628 .scnprintf = ins__raw_scnprintf, 629 }; 630 631 bool ins__is_ret(const struct ins *ins) 632 { 633 return ins->ops == &ret_ops; 634 } 635 636 bool ins__is_lock(const struct ins *ins) 637 { 638 return ins->ops == &lock_ops; 639 } 640 641 static int ins__key_cmp(const void *name, const void *insp) 642 { 643 const struct ins *ins = insp; 644 645 return strcmp(name, ins->name); 646 } 647 648 static int ins__cmp(const void *a, const void *b) 649 { 650 const struct ins *ia = a; 651 const struct ins *ib = b; 652 653 return strcmp(ia->name, ib->name); 654 } 655 656 static void ins__sort(struct arch *arch) 657 { 658 const int nmemb = arch->nr_instructions; 659 660 qsort(arch->instructions, nmemb, sizeof(struct ins), ins__cmp); 661 } 662 663 static struct ins_ops *__ins__find(struct arch *arch, const char *name) 664 { 665 struct ins *ins; 666 const int nmemb = arch->nr_instructions; 667 668 if (!arch->sorted_instructions) { 669 ins__sort(arch); 670 arch->sorted_instructions = true; 671 } 672 673 ins = bsearch(name, arch->instructions, nmemb, sizeof(struct ins), ins__key_cmp); 674 return ins ? ins->ops : NULL; 675 } 676 677 static struct ins_ops *ins__find(struct arch *arch, const char *name) 678 { 679 struct ins_ops *ops = __ins__find(arch, name); 680 681 if (!ops && arch->associate_instruction_ops) 682 ops = arch->associate_instruction_ops(arch, name); 683 684 return ops; 685 } 686 687 static int arch__key_cmp(const void *name, const void *archp) 688 { 689 const struct arch *arch = archp; 690 691 return strcmp(name, arch->name); 692 } 693 694 static int arch__cmp(const void *a, const void *b) 695 { 696 const struct arch *aa = a; 697 const struct arch *ab = b; 698 699 return strcmp(aa->name, ab->name); 700 } 701 702 static void arch__sort(void) 703 { 704 const int nmemb = ARRAY_SIZE(architectures); 705 706 qsort(architectures, nmemb, sizeof(struct arch), arch__cmp); 707 } 708 709 static struct arch *arch__find(const char *name) 710 { 711 const int nmemb = ARRAY_SIZE(architectures); 712 static bool sorted; 713 714 if (!sorted) { 715 arch__sort(); 716 sorted = true; 717 } 718 719 return bsearch(name, architectures, nmemb, sizeof(struct arch), arch__key_cmp); 720 } 721 722 static struct annotated_source *annotated_source__new(void) 723 { 724 struct annotated_source *src = zalloc(sizeof(*src)); 725 726 if (src != NULL) 727 INIT_LIST_HEAD(&src->source); 728 729 return src; 730 } 731 732 static __maybe_unused void annotated_source__delete(struct annotated_source *src) 733 { 734 if (src == NULL) 735 return; 736 zfree(&src->histograms); 737 zfree(&src->cycles_hist); 738 free(src); 739 } 740 741 static int annotated_source__alloc_histograms(struct annotated_source *src, 742 size_t size, int nr_hists) 743 { 744 size_t sizeof_sym_hist; 745 746 /* 747 * Add buffer of one element for zero length symbol. 748 * When sample is taken from first instruction of 749 * zero length symbol, perf still resolves it and 750 * shows symbol name in perf report and allows to 751 * annotate it. 752 */ 753 if (size == 0) 754 size = 1; 755 756 /* Check for overflow when calculating sizeof_sym_hist */ 757 if (size > (SIZE_MAX - sizeof(struct sym_hist)) / sizeof(struct sym_hist_entry)) 758 return -1; 759 760 sizeof_sym_hist = (sizeof(struct sym_hist) + size * sizeof(struct sym_hist_entry)); 761 762 /* Check for overflow in zalloc argument */ 763 if (sizeof_sym_hist > SIZE_MAX / nr_hists) 764 return -1; 765 766 src->sizeof_sym_hist = sizeof_sym_hist; 767 src->nr_histograms = nr_hists; 768 src->histograms = calloc(nr_hists, sizeof_sym_hist) ; 769 return src->histograms ? 0 : -1; 770 } 771 772 /* The cycles histogram is lazily allocated. */ 773 static int symbol__alloc_hist_cycles(struct symbol *sym) 774 { 775 struct annotation *notes = symbol__annotation(sym); 776 const size_t size = symbol__size(sym); 777 778 notes->src->cycles_hist = calloc(size, sizeof(struct cyc_hist)); 779 if (notes->src->cycles_hist == NULL) 780 return -1; 781 return 0; 782 } 783 784 void symbol__annotate_zero_histograms(struct symbol *sym) 785 { 786 struct annotation *notes = symbol__annotation(sym); 787 788 pthread_mutex_lock(¬es->lock); 789 if (notes->src != NULL) { 790 memset(notes->src->histograms, 0, 791 notes->src->nr_histograms * notes->src->sizeof_sym_hist); 792 if (notes->src->cycles_hist) 793 memset(notes->src->cycles_hist, 0, 794 symbol__size(sym) * sizeof(struct cyc_hist)); 795 } 796 pthread_mutex_unlock(¬es->lock); 797 } 798 799 static int __symbol__account_cycles(struct cyc_hist *ch, 800 u64 start, 801 unsigned offset, unsigned cycles, 802 unsigned have_start) 803 { 804 /* 805 * For now we can only account one basic block per 806 * final jump. But multiple could be overlapping. 807 * Always account the longest one. So when 808 * a shorter one has been already seen throw it away. 809 * 810 * We separately always account the full cycles. 811 */ 812 ch[offset].num_aggr++; 813 ch[offset].cycles_aggr += cycles; 814 815 if (cycles > ch[offset].cycles_max) 816 ch[offset].cycles_max = cycles; 817 818 if (ch[offset].cycles_min) { 819 if (cycles && cycles < ch[offset].cycles_min) 820 ch[offset].cycles_min = cycles; 821 } else 822 ch[offset].cycles_min = cycles; 823 824 if (!have_start && ch[offset].have_start) 825 return 0; 826 if (ch[offset].num) { 827 if (have_start && (!ch[offset].have_start || 828 ch[offset].start > start)) { 829 ch[offset].have_start = 0; 830 ch[offset].cycles = 0; 831 ch[offset].num = 0; 832 if (ch[offset].reset < 0xffff) 833 ch[offset].reset++; 834 } else if (have_start && 835 ch[offset].start < start) 836 return 0; 837 } 838 ch[offset].have_start = have_start; 839 ch[offset].start = start; 840 ch[offset].cycles += cycles; 841 ch[offset].num++; 842 return 0; 843 } 844 845 static int __symbol__inc_addr_samples(struct symbol *sym, struct map *map, 846 struct annotated_source *src, int evidx, u64 addr, 847 struct perf_sample *sample) 848 { 849 unsigned offset; 850 struct sym_hist *h; 851 852 pr_debug3("%s: addr=%#" PRIx64 "\n", __func__, map->unmap_ip(map, addr)); 853 854 if ((addr < sym->start || addr >= sym->end) && 855 (addr != sym->end || sym->start != sym->end)) { 856 pr_debug("%s(%d): ERANGE! sym->name=%s, start=%#" PRIx64 ", addr=%#" PRIx64 ", end=%#" PRIx64 "\n", 857 __func__, __LINE__, sym->name, sym->start, addr, sym->end); 858 return -ERANGE; 859 } 860 861 offset = addr - sym->start; 862 h = annotated_source__histogram(src, evidx); 863 if (h == NULL) { 864 pr_debug("%s(%d): ENOMEM! sym->name=%s, start=%#" PRIx64 ", addr=%#" PRIx64 ", end=%#" PRIx64 ", func: %d\n", 865 __func__, __LINE__, sym->name, sym->start, addr, sym->end, sym->type == STT_FUNC); 866 return -ENOMEM; 867 } 868 h->nr_samples++; 869 h->addr[offset].nr_samples++; 870 h->period += sample->period; 871 h->addr[offset].period += sample->period; 872 873 pr_debug3("%#" PRIx64 " %s: period++ [addr: %#" PRIx64 ", %#" PRIx64 874 ", evidx=%d] => nr_samples: %" PRIu64 ", period: %" PRIu64 "\n", 875 sym->start, sym->name, addr, addr - sym->start, evidx, 876 h->addr[offset].nr_samples, h->addr[offset].period); 877 return 0; 878 } 879 880 static struct cyc_hist *symbol__cycles_hist(struct symbol *sym) 881 { 882 struct annotation *notes = symbol__annotation(sym); 883 884 if (notes->src == NULL) { 885 notes->src = annotated_source__new(); 886 if (notes->src == NULL) 887 return NULL; 888 goto alloc_cycles_hist; 889 } 890 891 if (!notes->src->cycles_hist) { 892 alloc_cycles_hist: 893 symbol__alloc_hist_cycles(sym); 894 } 895 896 return notes->src->cycles_hist; 897 } 898 899 struct annotated_source *symbol__hists(struct symbol *sym, int nr_hists) 900 { 901 struct annotation *notes = symbol__annotation(sym); 902 903 if (notes->src == NULL) { 904 notes->src = annotated_source__new(); 905 if (notes->src == NULL) 906 return NULL; 907 goto alloc_histograms; 908 } 909 910 if (notes->src->histograms == NULL) { 911 alloc_histograms: 912 annotated_source__alloc_histograms(notes->src, symbol__size(sym), 913 nr_hists); 914 } 915 916 return notes->src; 917 } 918 919 static int symbol__inc_addr_samples(struct symbol *sym, struct map *map, 920 struct perf_evsel *evsel, u64 addr, 921 struct perf_sample *sample) 922 { 923 struct annotated_source *src; 924 925 if (sym == NULL) 926 return 0; 927 src = symbol__hists(sym, evsel->evlist->nr_entries); 928 if (src == NULL) 929 return -ENOMEM; 930 return __symbol__inc_addr_samples(sym, map, src, evsel->idx, addr, sample); 931 } 932 933 static int symbol__account_cycles(u64 addr, u64 start, 934 struct symbol *sym, unsigned cycles) 935 { 936 struct cyc_hist *cycles_hist; 937 unsigned offset; 938 939 if (sym == NULL) 940 return 0; 941 cycles_hist = symbol__cycles_hist(sym); 942 if (cycles_hist == NULL) 943 return -ENOMEM; 944 if (addr < sym->start || addr >= sym->end) 945 return -ERANGE; 946 947 if (start) { 948 if (start < sym->start || start >= sym->end) 949 return -ERANGE; 950 if (start >= addr) 951 start = 0; 952 } 953 offset = addr - sym->start; 954 return __symbol__account_cycles(cycles_hist, 955 start ? start - sym->start : 0, 956 offset, cycles, 957 !!start); 958 } 959 960 int addr_map_symbol__account_cycles(struct addr_map_symbol *ams, 961 struct addr_map_symbol *start, 962 unsigned cycles) 963 { 964 u64 saddr = 0; 965 int err; 966 967 if (!cycles) 968 return 0; 969 970 /* 971 * Only set start when IPC can be computed. We can only 972 * compute it when the basic block is completely in a single 973 * function. 974 * Special case the case when the jump is elsewhere, but 975 * it starts on the function start. 976 */ 977 if (start && 978 (start->sym == ams->sym || 979 (ams->sym && 980 start->addr == ams->sym->start + ams->map->start))) 981 saddr = start->al_addr; 982 if (saddr == 0) 983 pr_debug2("BB with bad start: addr %"PRIx64" start %"PRIx64" sym %"PRIx64" saddr %"PRIx64"\n", 984 ams->addr, 985 start ? start->addr : 0, 986 ams->sym ? ams->sym->start + ams->map->start : 0, 987 saddr); 988 err = symbol__account_cycles(ams->al_addr, saddr, ams->sym, cycles); 989 if (err) 990 pr_debug2("account_cycles failed %d\n", err); 991 return err; 992 } 993 994 static unsigned annotation__count_insn(struct annotation *notes, u64 start, u64 end) 995 { 996 unsigned n_insn = 0; 997 u64 offset; 998 999 for (offset = start; offset <= end; offset++) { 1000 if (notes->offsets[offset]) 1001 n_insn++; 1002 } 1003 return n_insn; 1004 } 1005 1006 static void annotation__count_and_fill(struct annotation *notes, u64 start, u64 end, struct cyc_hist *ch) 1007 { 1008 unsigned n_insn; 1009 unsigned int cover_insn = 0; 1010 u64 offset; 1011 1012 n_insn = annotation__count_insn(notes, start, end); 1013 if (n_insn && ch->num && ch->cycles) { 1014 float ipc = n_insn / ((double)ch->cycles / (double)ch->num); 1015 1016 /* Hide data when there are too many overlaps. */ 1017 if (ch->reset >= 0x7fff || ch->reset >= ch->num / 2) 1018 return; 1019 1020 for (offset = start; offset <= end; offset++) { 1021 struct annotation_line *al = notes->offsets[offset]; 1022 1023 if (al && al->ipc == 0.0) { 1024 al->ipc = ipc; 1025 cover_insn++; 1026 } 1027 } 1028 1029 if (cover_insn) { 1030 notes->hit_cycles += ch->cycles; 1031 notes->hit_insn += n_insn * ch->num; 1032 notes->cover_insn += cover_insn; 1033 } 1034 } 1035 } 1036 1037 void annotation__compute_ipc(struct annotation *notes, size_t size) 1038 { 1039 s64 offset; 1040 1041 if (!notes->src || !notes->src->cycles_hist) 1042 return; 1043 1044 notes->total_insn = annotation__count_insn(notes, 0, size - 1); 1045 notes->hit_cycles = 0; 1046 notes->hit_insn = 0; 1047 notes->cover_insn = 0; 1048 1049 pthread_mutex_lock(¬es->lock); 1050 for (offset = size - 1; offset >= 0; --offset) { 1051 struct cyc_hist *ch; 1052 1053 ch = ¬es->src->cycles_hist[offset]; 1054 if (ch && ch->cycles) { 1055 struct annotation_line *al; 1056 1057 if (ch->have_start) 1058 annotation__count_and_fill(notes, ch->start, offset, ch); 1059 al = notes->offsets[offset]; 1060 if (al && ch->num_aggr) { 1061 al->cycles = ch->cycles_aggr / ch->num_aggr; 1062 al->cycles_max = ch->cycles_max; 1063 al->cycles_min = ch->cycles_min; 1064 } 1065 notes->have_cycles = true; 1066 } 1067 } 1068 pthread_mutex_unlock(¬es->lock); 1069 } 1070 1071 int addr_map_symbol__inc_samples(struct addr_map_symbol *ams, struct perf_sample *sample, 1072 struct perf_evsel *evsel) 1073 { 1074 return symbol__inc_addr_samples(ams->sym, ams->map, evsel, ams->al_addr, sample); 1075 } 1076 1077 int hist_entry__inc_addr_samples(struct hist_entry *he, struct perf_sample *sample, 1078 struct perf_evsel *evsel, u64 ip) 1079 { 1080 return symbol__inc_addr_samples(he->ms.sym, he->ms.map, evsel, ip, sample); 1081 } 1082 1083 static void disasm_line__init_ins(struct disasm_line *dl, struct arch *arch, struct map_symbol *ms) 1084 { 1085 dl->ins.ops = ins__find(arch, dl->ins.name); 1086 1087 if (!dl->ins.ops) 1088 return; 1089 1090 if (dl->ins.ops->parse && dl->ins.ops->parse(arch, &dl->ops, ms) < 0) 1091 dl->ins.ops = NULL; 1092 } 1093 1094 static int disasm_line__parse(char *line, const char **namep, char **rawp) 1095 { 1096 char tmp, *name = ltrim(line); 1097 1098 if (name[0] == '\0') 1099 return -1; 1100 1101 *rawp = name + 1; 1102 1103 while ((*rawp)[0] != '\0' && !isspace((*rawp)[0])) 1104 ++*rawp; 1105 1106 tmp = (*rawp)[0]; 1107 (*rawp)[0] = '\0'; 1108 *namep = strdup(name); 1109 1110 if (*namep == NULL) 1111 goto out_free_name; 1112 1113 (*rawp)[0] = tmp; 1114 *rawp = ltrim(*rawp); 1115 1116 return 0; 1117 1118 out_free_name: 1119 free((void *)namep); 1120 *namep = NULL; 1121 return -1; 1122 } 1123 1124 struct annotate_args { 1125 size_t privsize; 1126 struct arch *arch; 1127 struct map_symbol ms; 1128 struct perf_evsel *evsel; 1129 struct annotation_options *options; 1130 s64 offset; 1131 char *line; 1132 int line_nr; 1133 }; 1134 1135 static void annotation_line__delete(struct annotation_line *al) 1136 { 1137 void *ptr = (void *) al - al->privsize; 1138 1139 free_srcline(al->path); 1140 zfree(&al->line); 1141 free(ptr); 1142 } 1143 1144 /* 1145 * Allocating the annotation line data with following 1146 * structure: 1147 * 1148 * -------------------------------------- 1149 * private space | struct annotation_line 1150 * -------------------------------------- 1151 * 1152 * Size of the private space is stored in 'struct annotation_line'. 1153 * 1154 */ 1155 static struct annotation_line * 1156 annotation_line__new(struct annotate_args *args, size_t privsize) 1157 { 1158 struct annotation_line *al; 1159 struct perf_evsel *evsel = args->evsel; 1160 size_t size = privsize + sizeof(*al); 1161 int nr = 1; 1162 1163 if (perf_evsel__is_group_event(evsel)) 1164 nr = evsel->nr_members; 1165 1166 size += sizeof(al->data[0]) * nr; 1167 1168 al = zalloc(size); 1169 if (al) { 1170 al = (void *) al + privsize; 1171 al->privsize = privsize; 1172 al->offset = args->offset; 1173 al->line = strdup(args->line); 1174 al->line_nr = args->line_nr; 1175 al->data_nr = nr; 1176 } 1177 1178 return al; 1179 } 1180 1181 /* 1182 * Allocating the disasm annotation line data with 1183 * following structure: 1184 * 1185 * ------------------------------------------------------------ 1186 * privsize space | struct disasm_line | struct annotation_line 1187 * ------------------------------------------------------------ 1188 * 1189 * We have 'struct annotation_line' member as last member 1190 * of 'struct disasm_line' to have an easy access. 1191 * 1192 */ 1193 static struct disasm_line *disasm_line__new(struct annotate_args *args) 1194 { 1195 struct disasm_line *dl = NULL; 1196 struct annotation_line *al; 1197 size_t privsize = args->privsize + offsetof(struct disasm_line, al); 1198 1199 al = annotation_line__new(args, privsize); 1200 if (al != NULL) { 1201 dl = disasm_line(al); 1202 1203 if (dl->al.line == NULL) 1204 goto out_delete; 1205 1206 if (args->offset != -1) { 1207 if (disasm_line__parse(dl->al.line, &dl->ins.name, &dl->ops.raw) < 0) 1208 goto out_free_line; 1209 1210 disasm_line__init_ins(dl, args->arch, &args->ms); 1211 } 1212 } 1213 1214 return dl; 1215 1216 out_free_line: 1217 zfree(&dl->al.line); 1218 out_delete: 1219 free(dl); 1220 return NULL; 1221 } 1222 1223 void disasm_line__free(struct disasm_line *dl) 1224 { 1225 if (dl->ins.ops && dl->ins.ops->free) 1226 dl->ins.ops->free(&dl->ops); 1227 else 1228 ins__delete(&dl->ops); 1229 free((void *)dl->ins.name); 1230 dl->ins.name = NULL; 1231 annotation_line__delete(&dl->al); 1232 } 1233 1234 int disasm_line__scnprintf(struct disasm_line *dl, char *bf, size_t size, bool raw) 1235 { 1236 if (raw || !dl->ins.ops) 1237 return scnprintf(bf, size, "%-6s %s", dl->ins.name, dl->ops.raw); 1238 1239 return ins__scnprintf(&dl->ins, bf, size, &dl->ops); 1240 } 1241 1242 static void annotation_line__add(struct annotation_line *al, struct list_head *head) 1243 { 1244 list_add_tail(&al->node, head); 1245 } 1246 1247 struct annotation_line * 1248 annotation_line__next(struct annotation_line *pos, struct list_head *head) 1249 { 1250 list_for_each_entry_continue(pos, head, node) 1251 if (pos->offset >= 0) 1252 return pos; 1253 1254 return NULL; 1255 } 1256 1257 static const char *annotate__address_color(struct block_range *br) 1258 { 1259 double cov = block_range__coverage(br); 1260 1261 if (cov >= 0) { 1262 /* mark red for >75% coverage */ 1263 if (cov > 0.75) 1264 return PERF_COLOR_RED; 1265 1266 /* mark dull for <1% coverage */ 1267 if (cov < 0.01) 1268 return PERF_COLOR_NORMAL; 1269 } 1270 1271 return PERF_COLOR_MAGENTA; 1272 } 1273 1274 static const char *annotate__asm_color(struct block_range *br) 1275 { 1276 double cov = block_range__coverage(br); 1277 1278 if (cov >= 0) { 1279 /* mark dull for <1% coverage */ 1280 if (cov < 0.01) 1281 return PERF_COLOR_NORMAL; 1282 } 1283 1284 return PERF_COLOR_BLUE; 1285 } 1286 1287 static void annotate__branch_printf(struct block_range *br, u64 addr) 1288 { 1289 bool emit_comment = true; 1290 1291 if (!br) 1292 return; 1293 1294 #if 1 1295 if (br->is_target && br->start == addr) { 1296 struct block_range *branch = br; 1297 double p; 1298 1299 /* 1300 * Find matching branch to our target. 1301 */ 1302 while (!branch->is_branch) 1303 branch = block_range__next(branch); 1304 1305 p = 100 *(double)br->entry / branch->coverage; 1306 1307 if (p > 0.1) { 1308 if (emit_comment) { 1309 emit_comment = false; 1310 printf("\t#"); 1311 } 1312 1313 /* 1314 * The percentage of coverage joined at this target in relation 1315 * to the next branch. 1316 */ 1317 printf(" +%.2f%%", p); 1318 } 1319 } 1320 #endif 1321 if (br->is_branch && br->end == addr) { 1322 double p = 100*(double)br->taken / br->coverage; 1323 1324 if (p > 0.1) { 1325 if (emit_comment) { 1326 emit_comment = false; 1327 printf("\t#"); 1328 } 1329 1330 /* 1331 * The percentage of coverage leaving at this branch, and 1332 * its prediction ratio. 1333 */ 1334 printf(" -%.2f%% (p:%.2f%%)", p, 100*(double)br->pred / br->taken); 1335 } 1336 } 1337 } 1338 1339 static int disasm_line__print(struct disasm_line *dl, u64 start, int addr_fmt_width) 1340 { 1341 s64 offset = dl->al.offset; 1342 const u64 addr = start + offset; 1343 struct block_range *br; 1344 1345 br = block_range__find(addr); 1346 color_fprintf(stdout, annotate__address_color(br), " %*" PRIx64 ":", addr_fmt_width, addr); 1347 color_fprintf(stdout, annotate__asm_color(br), "%s", dl->al.line); 1348 annotate__branch_printf(br, addr); 1349 return 0; 1350 } 1351 1352 static int 1353 annotation_line__print(struct annotation_line *al, struct symbol *sym, u64 start, 1354 struct perf_evsel *evsel, u64 len, int min_pcnt, int printed, 1355 int max_lines, struct annotation_line *queue, int addr_fmt_width, 1356 int percent_type) 1357 { 1358 struct disasm_line *dl = container_of(al, struct disasm_line, al); 1359 static const char *prev_line; 1360 static const char *prev_color; 1361 1362 if (al->offset != -1) { 1363 double max_percent = 0.0; 1364 int i, nr_percent = 1; 1365 const char *color; 1366 struct annotation *notes = symbol__annotation(sym); 1367 1368 for (i = 0; i < al->data_nr; i++) { 1369 double percent; 1370 1371 percent = annotation_data__percent(&al->data[i], 1372 percent_type); 1373 1374 if (percent > max_percent) 1375 max_percent = percent; 1376 } 1377 1378 if (al->data_nr > nr_percent) 1379 nr_percent = al->data_nr; 1380 1381 if (max_percent < min_pcnt) 1382 return -1; 1383 1384 if (max_lines && printed >= max_lines) 1385 return 1; 1386 1387 if (queue != NULL) { 1388 list_for_each_entry_from(queue, ¬es->src->source, node) { 1389 if (queue == al) 1390 break; 1391 annotation_line__print(queue, sym, start, evsel, len, 1392 0, 0, 1, NULL, addr_fmt_width, 1393 percent_type); 1394 } 1395 } 1396 1397 color = get_percent_color(max_percent); 1398 1399 /* 1400 * Also color the filename and line if needed, with 1401 * the same color than the percentage. Don't print it 1402 * twice for close colored addr with the same filename:line 1403 */ 1404 if (al->path) { 1405 if (!prev_line || strcmp(prev_line, al->path) 1406 || color != prev_color) { 1407 color_fprintf(stdout, color, " %s", al->path); 1408 prev_line = al->path; 1409 prev_color = color; 1410 } 1411 } 1412 1413 for (i = 0; i < nr_percent; i++) { 1414 struct annotation_data *data = &al->data[i]; 1415 double percent; 1416 1417 percent = annotation_data__percent(data, percent_type); 1418 color = get_percent_color(percent); 1419 1420 if (symbol_conf.show_total_period) 1421 color_fprintf(stdout, color, " %11" PRIu64, 1422 data->he.period); 1423 else if (symbol_conf.show_nr_samples) 1424 color_fprintf(stdout, color, " %7" PRIu64, 1425 data->he.nr_samples); 1426 else 1427 color_fprintf(stdout, color, " %7.2f", percent); 1428 } 1429 1430 printf(" : "); 1431 1432 disasm_line__print(dl, start, addr_fmt_width); 1433 printf("\n"); 1434 } else if (max_lines && printed >= max_lines) 1435 return 1; 1436 else { 1437 int width = symbol_conf.show_total_period ? 12 : 8; 1438 1439 if (queue) 1440 return -1; 1441 1442 if (perf_evsel__is_group_event(evsel)) 1443 width *= evsel->nr_members; 1444 1445 if (!*al->line) 1446 printf(" %*s:\n", width, " "); 1447 else 1448 printf(" %*s: %*s %s\n", width, " ", addr_fmt_width, " ", al->line); 1449 } 1450 1451 return 0; 1452 } 1453 1454 /* 1455 * symbol__parse_objdump_line() parses objdump output (with -d --no-show-raw) 1456 * which looks like following 1457 * 1458 * 0000000000415500 <_init>: 1459 * 415500: sub $0x8,%rsp 1460 * 415504: mov 0x2f5ad5(%rip),%rax # 70afe0 <_DYNAMIC+0x2f8> 1461 * 41550b: test %rax,%rax 1462 * 41550e: je 415515 <_init+0x15> 1463 * 415510: callq 416e70 <__gmon_start__@plt> 1464 * 415515: add $0x8,%rsp 1465 * 415519: retq 1466 * 1467 * it will be parsed and saved into struct disasm_line as 1468 * <offset> <name> <ops.raw> 1469 * 1470 * The offset will be a relative offset from the start of the symbol and -1 1471 * means that it's not a disassembly line so should be treated differently. 1472 * The ops.raw part will be parsed further according to type of the instruction. 1473 */ 1474 static int symbol__parse_objdump_line(struct symbol *sym, FILE *file, 1475 struct annotate_args *args, 1476 int *line_nr) 1477 { 1478 struct map *map = args->ms.map; 1479 struct annotation *notes = symbol__annotation(sym); 1480 struct disasm_line *dl; 1481 char *line = NULL, *parsed_line, *tmp, *tmp2; 1482 size_t line_len; 1483 s64 line_ip, offset = -1; 1484 regmatch_t match[2]; 1485 1486 if (getline(&line, &line_len, file) < 0) 1487 return -1; 1488 1489 if (!line) 1490 return -1; 1491 1492 line_ip = -1; 1493 parsed_line = rtrim(line); 1494 1495 /* /filename:linenr ? Save line number and ignore. */ 1496 if (regexec(&file_lineno, parsed_line, 2, match, 0) == 0) { 1497 *line_nr = atoi(parsed_line + match[1].rm_so); 1498 return 0; 1499 } 1500 1501 tmp = ltrim(parsed_line); 1502 if (*tmp) { 1503 /* 1504 * Parse hexa addresses followed by ':' 1505 */ 1506 line_ip = strtoull(tmp, &tmp2, 16); 1507 if (*tmp2 != ':' || tmp == tmp2 || tmp2[1] == '\0') 1508 line_ip = -1; 1509 } 1510 1511 if (line_ip != -1) { 1512 u64 start = map__rip_2objdump(map, sym->start), 1513 end = map__rip_2objdump(map, sym->end); 1514 1515 offset = line_ip - start; 1516 if ((u64)line_ip < start || (u64)line_ip >= end) 1517 offset = -1; 1518 else 1519 parsed_line = tmp2 + 1; 1520 } 1521 1522 args->offset = offset; 1523 args->line = parsed_line; 1524 args->line_nr = *line_nr; 1525 args->ms.sym = sym; 1526 1527 dl = disasm_line__new(args); 1528 free(line); 1529 (*line_nr)++; 1530 1531 if (dl == NULL) 1532 return -1; 1533 1534 if (!disasm_line__has_local_offset(dl)) { 1535 dl->ops.target.offset = dl->ops.target.addr - 1536 map__rip_2objdump(map, sym->start); 1537 dl->ops.target.offset_avail = true; 1538 } 1539 1540 /* kcore has no symbols, so add the call target symbol */ 1541 if (dl->ins.ops && ins__is_call(&dl->ins) && !dl->ops.target.sym) { 1542 struct addr_map_symbol target = { 1543 .map = map, 1544 .addr = dl->ops.target.addr, 1545 }; 1546 1547 if (!map_groups__find_ams(&target) && 1548 target.sym->start == target.al_addr) 1549 dl->ops.target.sym = target.sym; 1550 } 1551 1552 annotation_line__add(&dl->al, ¬es->src->source); 1553 1554 return 0; 1555 } 1556 1557 static __attribute__((constructor)) void symbol__init_regexpr(void) 1558 { 1559 regcomp(&file_lineno, "^/[^:]+:([0-9]+)", REG_EXTENDED); 1560 } 1561 1562 static void delete_last_nop(struct symbol *sym) 1563 { 1564 struct annotation *notes = symbol__annotation(sym); 1565 struct list_head *list = ¬es->src->source; 1566 struct disasm_line *dl; 1567 1568 while (!list_empty(list)) { 1569 dl = list_entry(list->prev, struct disasm_line, al.node); 1570 1571 if (dl->ins.ops) { 1572 if (dl->ins.ops != &nop_ops) 1573 return; 1574 } else { 1575 if (!strstr(dl->al.line, " nop ") && 1576 !strstr(dl->al.line, " nopl ") && 1577 !strstr(dl->al.line, " nopw ")) 1578 return; 1579 } 1580 1581 list_del(&dl->al.node); 1582 disasm_line__free(dl); 1583 } 1584 } 1585 1586 int symbol__strerror_disassemble(struct symbol *sym __maybe_unused, struct map *map, 1587 int errnum, char *buf, size_t buflen) 1588 { 1589 struct dso *dso = map->dso; 1590 1591 BUG_ON(buflen == 0); 1592 1593 if (errnum >= 0) { 1594 str_error_r(errnum, buf, buflen); 1595 return 0; 1596 } 1597 1598 switch (errnum) { 1599 case SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX: { 1600 char bf[SBUILD_ID_SIZE + 15] = " with build id "; 1601 char *build_id_msg = NULL; 1602 1603 if (dso->has_build_id) { 1604 build_id__sprintf(dso->build_id, 1605 sizeof(dso->build_id), bf + 15); 1606 build_id_msg = bf; 1607 } 1608 scnprintf(buf, buflen, 1609 "No vmlinux file%s\nwas found in the path.\n\n" 1610 "Note that annotation using /proc/kcore requires CAP_SYS_RAWIO capability.\n\n" 1611 "Please use:\n\n" 1612 " perf buildid-cache -vu vmlinux\n\n" 1613 "or:\n\n" 1614 " --vmlinux vmlinux\n", build_id_msg ?: ""); 1615 } 1616 break; 1617 default: 1618 scnprintf(buf, buflen, "Internal error: Invalid %d error code\n", errnum); 1619 break; 1620 } 1621 1622 return 0; 1623 } 1624 1625 static int dso__disassemble_filename(struct dso *dso, char *filename, size_t filename_size) 1626 { 1627 char linkname[PATH_MAX]; 1628 char *build_id_filename; 1629 char *build_id_path = NULL; 1630 char *pos; 1631 1632 if (dso->symtab_type == DSO_BINARY_TYPE__KALLSYMS && 1633 !dso__is_kcore(dso)) 1634 return SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX; 1635 1636 build_id_filename = dso__build_id_filename(dso, NULL, 0, false); 1637 if (build_id_filename) { 1638 __symbol__join_symfs(filename, filename_size, build_id_filename); 1639 free(build_id_filename); 1640 } else { 1641 if (dso->has_build_id) 1642 return ENOMEM; 1643 goto fallback; 1644 } 1645 1646 build_id_path = strdup(filename); 1647 if (!build_id_path) 1648 return -1; 1649 1650 /* 1651 * old style build-id cache has name of XX/XXXXXXX.. while 1652 * new style has XX/XXXXXXX../{elf,kallsyms,vdso}. 1653 * extract the build-id part of dirname in the new style only. 1654 */ 1655 pos = strrchr(build_id_path, '/'); 1656 if (pos && strlen(pos) < SBUILD_ID_SIZE - 2) 1657 dirname(build_id_path); 1658 1659 if (dso__is_kcore(dso) || 1660 readlink(build_id_path, linkname, sizeof(linkname)) < 0 || 1661 strstr(linkname, DSO__NAME_KALLSYMS) || 1662 access(filename, R_OK)) { 1663 fallback: 1664 /* 1665 * If we don't have build-ids or the build-id file isn't in the 1666 * cache, or is just a kallsyms file, well, lets hope that this 1667 * DSO is the same as when 'perf record' ran. 1668 */ 1669 __symbol__join_symfs(filename, filename_size, dso->long_name); 1670 } 1671 1672 free(build_id_path); 1673 return 0; 1674 } 1675 1676 static int symbol__disassemble(struct symbol *sym, struct annotate_args *args) 1677 { 1678 struct annotation_options *opts = args->options; 1679 struct map *map = args->ms.map; 1680 struct dso *dso = map->dso; 1681 char *command; 1682 FILE *file; 1683 char symfs_filename[PATH_MAX]; 1684 struct kcore_extract kce; 1685 bool delete_extract = false; 1686 bool decomp = false; 1687 int stdout_fd[2]; 1688 int lineno = 0; 1689 int nline; 1690 pid_t pid; 1691 int err = dso__disassemble_filename(dso, symfs_filename, sizeof(symfs_filename)); 1692 1693 if (err) 1694 return err; 1695 1696 pr_debug("%s: filename=%s, sym=%s, start=%#" PRIx64 ", end=%#" PRIx64 "\n", __func__, 1697 symfs_filename, sym->name, map->unmap_ip(map, sym->start), 1698 map->unmap_ip(map, sym->end)); 1699 1700 pr_debug("annotating [%p] %30s : [%p] %30s\n", 1701 dso, dso->long_name, sym, sym->name); 1702 1703 if (dso__is_kcore(dso)) { 1704 kce.kcore_filename = symfs_filename; 1705 kce.addr = map__rip_2objdump(map, sym->start); 1706 kce.offs = sym->start; 1707 kce.len = sym->end - sym->start; 1708 if (!kcore_extract__create(&kce)) { 1709 delete_extract = true; 1710 strlcpy(symfs_filename, kce.extract_filename, 1711 sizeof(symfs_filename)); 1712 } 1713 } else if (dso__needs_decompress(dso)) { 1714 char tmp[KMOD_DECOMP_LEN]; 1715 1716 if (dso__decompress_kmodule_path(dso, symfs_filename, 1717 tmp, sizeof(tmp)) < 0) 1718 goto out; 1719 1720 decomp = true; 1721 strcpy(symfs_filename, tmp); 1722 } 1723 1724 err = asprintf(&command, 1725 "%s %s%s --start-address=0x%016" PRIx64 1726 " --stop-address=0x%016" PRIx64 1727 " -l -d %s %s -C \"$1\" 2>/dev/null|grep -v \"$1:\"|expand", 1728 opts->objdump_path ?: "objdump", 1729 opts->disassembler_style ? "-M " : "", 1730 opts->disassembler_style ?: "", 1731 map__rip_2objdump(map, sym->start), 1732 map__rip_2objdump(map, sym->end), 1733 opts->show_asm_raw ? "" : "--no-show-raw", 1734 opts->annotate_src ? "-S" : ""); 1735 1736 if (err < 0) { 1737 pr_err("Failure allocating memory for the command to run\n"); 1738 goto out_remove_tmp; 1739 } 1740 1741 pr_debug("Executing: %s\n", command); 1742 1743 err = -1; 1744 if (pipe(stdout_fd) < 0) { 1745 pr_err("Failure creating the pipe to run %s\n", command); 1746 goto out_free_command; 1747 } 1748 1749 pid = fork(); 1750 if (pid < 0) { 1751 pr_err("Failure forking to run %s\n", command); 1752 goto out_close_stdout; 1753 } 1754 1755 if (pid == 0) { 1756 close(stdout_fd[0]); 1757 dup2(stdout_fd[1], 1); 1758 close(stdout_fd[1]); 1759 execl("/bin/sh", "sh", "-c", command, "--", symfs_filename, 1760 NULL); 1761 perror(command); 1762 exit(-1); 1763 } 1764 1765 close(stdout_fd[1]); 1766 1767 file = fdopen(stdout_fd[0], "r"); 1768 if (!file) { 1769 pr_err("Failure creating FILE stream for %s\n", command); 1770 /* 1771 * If we were using debug info should retry with 1772 * original binary. 1773 */ 1774 goto out_free_command; 1775 } 1776 1777 nline = 0; 1778 while (!feof(file)) { 1779 /* 1780 * The source code line number (lineno) needs to be kept in 1781 * across calls to symbol__parse_objdump_line(), so that it 1782 * can associate it with the instructions till the next one. 1783 * See disasm_line__new() and struct disasm_line::line_nr. 1784 */ 1785 if (symbol__parse_objdump_line(sym, file, args, &lineno) < 0) 1786 break; 1787 nline++; 1788 } 1789 1790 if (nline == 0) 1791 pr_err("No output from %s\n", command); 1792 1793 /* 1794 * kallsyms does not have symbol sizes so there may a nop at the end. 1795 * Remove it. 1796 */ 1797 if (dso__is_kcore(dso)) 1798 delete_last_nop(sym); 1799 1800 fclose(file); 1801 err = 0; 1802 out_free_command: 1803 free(command); 1804 out_remove_tmp: 1805 close(stdout_fd[0]); 1806 1807 if (decomp) 1808 unlink(symfs_filename); 1809 1810 if (delete_extract) 1811 kcore_extract__delete(&kce); 1812 out: 1813 return err; 1814 1815 out_close_stdout: 1816 close(stdout_fd[1]); 1817 goto out_free_command; 1818 } 1819 1820 static void calc_percent(struct sym_hist *sym_hist, 1821 struct hists *hists, 1822 struct annotation_data *data, 1823 s64 offset, s64 end) 1824 { 1825 unsigned int hits = 0; 1826 u64 period = 0; 1827 1828 while (offset < end) { 1829 hits += sym_hist->addr[offset].nr_samples; 1830 period += sym_hist->addr[offset].period; 1831 ++offset; 1832 } 1833 1834 if (sym_hist->nr_samples) { 1835 data->he.period = period; 1836 data->he.nr_samples = hits; 1837 data->percent[PERCENT_HITS_LOCAL] = 100.0 * hits / sym_hist->nr_samples; 1838 } 1839 1840 if (hists->stats.nr_non_filtered_samples) 1841 data->percent[PERCENT_HITS_GLOBAL] = 100.0 * hits / hists->stats.nr_non_filtered_samples; 1842 1843 if (sym_hist->period) 1844 data->percent[PERCENT_PERIOD_LOCAL] = 100.0 * period / sym_hist->period; 1845 1846 if (hists->stats.total_period) 1847 data->percent[PERCENT_PERIOD_GLOBAL] = 100.0 * period / hists->stats.total_period; 1848 } 1849 1850 static void annotation__calc_percent(struct annotation *notes, 1851 struct perf_evsel *leader, s64 len) 1852 { 1853 struct annotation_line *al, *next; 1854 struct perf_evsel *evsel; 1855 1856 list_for_each_entry(al, ¬es->src->source, node) { 1857 s64 end; 1858 int i = 0; 1859 1860 if (al->offset == -1) 1861 continue; 1862 1863 next = annotation_line__next(al, ¬es->src->source); 1864 end = next ? next->offset : len; 1865 1866 for_each_group_evsel(evsel, leader) { 1867 struct hists *hists = evsel__hists(evsel); 1868 struct annotation_data *data; 1869 struct sym_hist *sym_hist; 1870 1871 BUG_ON(i >= al->data_nr); 1872 1873 sym_hist = annotation__histogram(notes, evsel->idx); 1874 data = &al->data[i++]; 1875 1876 calc_percent(sym_hist, hists, data, al->offset, end); 1877 } 1878 } 1879 } 1880 1881 void symbol__calc_percent(struct symbol *sym, struct perf_evsel *evsel) 1882 { 1883 struct annotation *notes = symbol__annotation(sym); 1884 1885 annotation__calc_percent(notes, evsel, symbol__size(sym)); 1886 } 1887 1888 int symbol__annotate(struct symbol *sym, struct map *map, 1889 struct perf_evsel *evsel, size_t privsize, 1890 struct annotation_options *options, 1891 struct arch **parch) 1892 { 1893 struct annotate_args args = { 1894 .privsize = privsize, 1895 .evsel = evsel, 1896 .options = options, 1897 }; 1898 struct perf_env *env = perf_evsel__env(evsel); 1899 const char *arch_name = perf_env__arch(env); 1900 struct arch *arch; 1901 int err; 1902 1903 if (!arch_name) 1904 return -1; 1905 1906 args.arch = arch = arch__find(arch_name); 1907 if (arch == NULL) 1908 return -ENOTSUP; 1909 1910 if (parch) 1911 *parch = arch; 1912 1913 if (arch->init) { 1914 err = arch->init(arch, env ? env->cpuid : NULL); 1915 if (err) { 1916 pr_err("%s: failed to initialize %s arch priv area\n", __func__, arch->name); 1917 return err; 1918 } 1919 } 1920 1921 args.ms.map = map; 1922 args.ms.sym = sym; 1923 1924 return symbol__disassemble(sym, &args); 1925 } 1926 1927 static void insert_source_line(struct rb_root *root, struct annotation_line *al, 1928 struct annotation_options *opts) 1929 { 1930 struct annotation_line *iter; 1931 struct rb_node **p = &root->rb_node; 1932 struct rb_node *parent = NULL; 1933 int i, ret; 1934 1935 while (*p != NULL) { 1936 parent = *p; 1937 iter = rb_entry(parent, struct annotation_line, rb_node); 1938 1939 ret = strcmp(iter->path, al->path); 1940 if (ret == 0) { 1941 for (i = 0; i < al->data_nr; i++) { 1942 iter->data[i].percent_sum += annotation_data__percent(&al->data[i], 1943 opts->percent_type); 1944 } 1945 return; 1946 } 1947 1948 if (ret < 0) 1949 p = &(*p)->rb_left; 1950 else 1951 p = &(*p)->rb_right; 1952 } 1953 1954 for (i = 0; i < al->data_nr; i++) { 1955 al->data[i].percent_sum = annotation_data__percent(&al->data[i], 1956 opts->percent_type); 1957 } 1958 1959 rb_link_node(&al->rb_node, parent, p); 1960 rb_insert_color(&al->rb_node, root); 1961 } 1962 1963 static int cmp_source_line(struct annotation_line *a, struct annotation_line *b) 1964 { 1965 int i; 1966 1967 for (i = 0; i < a->data_nr; i++) { 1968 if (a->data[i].percent_sum == b->data[i].percent_sum) 1969 continue; 1970 return a->data[i].percent_sum > b->data[i].percent_sum; 1971 } 1972 1973 return 0; 1974 } 1975 1976 static void __resort_source_line(struct rb_root *root, struct annotation_line *al) 1977 { 1978 struct annotation_line *iter; 1979 struct rb_node **p = &root->rb_node; 1980 struct rb_node *parent = NULL; 1981 1982 while (*p != NULL) { 1983 parent = *p; 1984 iter = rb_entry(parent, struct annotation_line, rb_node); 1985 1986 if (cmp_source_line(al, iter)) 1987 p = &(*p)->rb_left; 1988 else 1989 p = &(*p)->rb_right; 1990 } 1991 1992 rb_link_node(&al->rb_node, parent, p); 1993 rb_insert_color(&al->rb_node, root); 1994 } 1995 1996 static void resort_source_line(struct rb_root *dest_root, struct rb_root *src_root) 1997 { 1998 struct annotation_line *al; 1999 struct rb_node *node; 2000 2001 node = rb_first(src_root); 2002 while (node) { 2003 struct rb_node *next; 2004 2005 al = rb_entry(node, struct annotation_line, rb_node); 2006 next = rb_next(node); 2007 rb_erase(node, src_root); 2008 2009 __resort_source_line(dest_root, al); 2010 node = next; 2011 } 2012 } 2013 2014 static void print_summary(struct rb_root *root, const char *filename) 2015 { 2016 struct annotation_line *al; 2017 struct rb_node *node; 2018 2019 printf("\nSorted summary for file %s\n", filename); 2020 printf("----------------------------------------------\n\n"); 2021 2022 if (RB_EMPTY_ROOT(root)) { 2023 printf(" Nothing higher than %1.1f%%\n", MIN_GREEN); 2024 return; 2025 } 2026 2027 node = rb_first(root); 2028 while (node) { 2029 double percent, percent_max = 0.0; 2030 const char *color; 2031 char *path; 2032 int i; 2033 2034 al = rb_entry(node, struct annotation_line, rb_node); 2035 for (i = 0; i < al->data_nr; i++) { 2036 percent = al->data[i].percent_sum; 2037 color = get_percent_color(percent); 2038 color_fprintf(stdout, color, " %7.2f", percent); 2039 2040 if (percent > percent_max) 2041 percent_max = percent; 2042 } 2043 2044 path = al->path; 2045 color = get_percent_color(percent_max); 2046 color_fprintf(stdout, color, " %s\n", path); 2047 2048 node = rb_next(node); 2049 } 2050 } 2051 2052 static void symbol__annotate_hits(struct symbol *sym, struct perf_evsel *evsel) 2053 { 2054 struct annotation *notes = symbol__annotation(sym); 2055 struct sym_hist *h = annotation__histogram(notes, evsel->idx); 2056 u64 len = symbol__size(sym), offset; 2057 2058 for (offset = 0; offset < len; ++offset) 2059 if (h->addr[offset].nr_samples != 0) 2060 printf("%*" PRIx64 ": %" PRIu64 "\n", BITS_PER_LONG / 2, 2061 sym->start + offset, h->addr[offset].nr_samples); 2062 printf("%*s: %" PRIu64 "\n", BITS_PER_LONG / 2, "h->nr_samples", h->nr_samples); 2063 } 2064 2065 static int annotated_source__addr_fmt_width(struct list_head *lines, u64 start) 2066 { 2067 char bf[32]; 2068 struct annotation_line *line; 2069 2070 list_for_each_entry_reverse(line, lines, node) { 2071 if (line->offset != -1) 2072 return scnprintf(bf, sizeof(bf), "%" PRIx64, start + line->offset); 2073 } 2074 2075 return 0; 2076 } 2077 2078 int symbol__annotate_printf(struct symbol *sym, struct map *map, 2079 struct perf_evsel *evsel, 2080 struct annotation_options *opts) 2081 { 2082 struct dso *dso = map->dso; 2083 char *filename; 2084 const char *d_filename; 2085 const char *evsel_name = perf_evsel__name(evsel); 2086 struct annotation *notes = symbol__annotation(sym); 2087 struct sym_hist *h = annotation__histogram(notes, evsel->idx); 2088 struct annotation_line *pos, *queue = NULL; 2089 u64 start = map__rip_2objdump(map, sym->start); 2090 int printed = 2, queue_len = 0, addr_fmt_width; 2091 int more = 0; 2092 bool context = opts->context; 2093 u64 len; 2094 int width = symbol_conf.show_total_period ? 12 : 8; 2095 int graph_dotted_len; 2096 char buf[512]; 2097 2098 filename = strdup(dso->long_name); 2099 if (!filename) 2100 return -ENOMEM; 2101 2102 if (opts->full_path) 2103 d_filename = filename; 2104 else 2105 d_filename = basename(filename); 2106 2107 len = symbol__size(sym); 2108 2109 if (perf_evsel__is_group_event(evsel)) { 2110 width *= evsel->nr_members; 2111 perf_evsel__group_desc(evsel, buf, sizeof(buf)); 2112 evsel_name = buf; 2113 } 2114 2115 graph_dotted_len = printf(" %-*.*s| Source code & Disassembly of %s for %s (%" PRIu64 " samples, " 2116 "percent: %s)\n", 2117 width, width, symbol_conf.show_total_period ? "Period" : 2118 symbol_conf.show_nr_samples ? "Samples" : "Percent", 2119 d_filename, evsel_name, h->nr_samples, 2120 percent_type_str(opts->percent_type)); 2121 2122 printf("%-*.*s----\n", 2123 graph_dotted_len, graph_dotted_len, graph_dotted_line); 2124 2125 if (verbose > 0) 2126 symbol__annotate_hits(sym, evsel); 2127 2128 addr_fmt_width = annotated_source__addr_fmt_width(¬es->src->source, start); 2129 2130 list_for_each_entry(pos, ¬es->src->source, node) { 2131 int err; 2132 2133 if (context && queue == NULL) { 2134 queue = pos; 2135 queue_len = 0; 2136 } 2137 2138 err = annotation_line__print(pos, sym, start, evsel, len, 2139 opts->min_pcnt, printed, opts->max_lines, 2140 queue, addr_fmt_width, opts->percent_type); 2141 2142 switch (err) { 2143 case 0: 2144 ++printed; 2145 if (context) { 2146 printed += queue_len; 2147 queue = NULL; 2148 queue_len = 0; 2149 } 2150 break; 2151 case 1: 2152 /* filtered by max_lines */ 2153 ++more; 2154 break; 2155 case -1: 2156 default: 2157 /* 2158 * Filtered by min_pcnt or non IP lines when 2159 * context != 0 2160 */ 2161 if (!context) 2162 break; 2163 if (queue_len == context) 2164 queue = list_entry(queue->node.next, typeof(*queue), node); 2165 else 2166 ++queue_len; 2167 break; 2168 } 2169 } 2170 2171 free(filename); 2172 2173 return more; 2174 } 2175 2176 static void FILE__set_percent_color(void *fp __maybe_unused, 2177 double percent __maybe_unused, 2178 bool current __maybe_unused) 2179 { 2180 } 2181 2182 static int FILE__set_jumps_percent_color(void *fp __maybe_unused, 2183 int nr __maybe_unused, bool current __maybe_unused) 2184 { 2185 return 0; 2186 } 2187 2188 static int FILE__set_color(void *fp __maybe_unused, int color __maybe_unused) 2189 { 2190 return 0; 2191 } 2192 2193 static void FILE__printf(void *fp, const char *fmt, ...) 2194 { 2195 va_list args; 2196 2197 va_start(args, fmt); 2198 vfprintf(fp, fmt, args); 2199 va_end(args); 2200 } 2201 2202 static void FILE__write_graph(void *fp, int graph) 2203 { 2204 const char *s; 2205 switch (graph) { 2206 2207 case DARROW_CHAR: s = "↓"; break; 2208 case UARROW_CHAR: s = "↑"; break; 2209 case LARROW_CHAR: s = "←"; break; 2210 case RARROW_CHAR: s = "→"; break; 2211 default: s = "?"; break; 2212 } 2213 2214 fputs(s, fp); 2215 } 2216 2217 static int symbol__annotate_fprintf2(struct symbol *sym, FILE *fp, 2218 struct annotation_options *opts) 2219 { 2220 struct annotation *notes = symbol__annotation(sym); 2221 struct annotation_write_ops wops = { 2222 .first_line = true, 2223 .obj = fp, 2224 .set_color = FILE__set_color, 2225 .set_percent_color = FILE__set_percent_color, 2226 .set_jumps_percent_color = FILE__set_jumps_percent_color, 2227 .printf = FILE__printf, 2228 .write_graph = FILE__write_graph, 2229 }; 2230 struct annotation_line *al; 2231 2232 list_for_each_entry(al, ¬es->src->source, node) { 2233 if (annotation_line__filter(al, notes)) 2234 continue; 2235 annotation_line__write(al, notes, &wops, opts); 2236 fputc('\n', fp); 2237 wops.first_line = false; 2238 } 2239 2240 return 0; 2241 } 2242 2243 int map_symbol__annotation_dump(struct map_symbol *ms, struct perf_evsel *evsel, 2244 struct annotation_options *opts) 2245 { 2246 const char *ev_name = perf_evsel__name(evsel); 2247 char buf[1024]; 2248 char *filename; 2249 int err = -1; 2250 FILE *fp; 2251 2252 if (asprintf(&filename, "%s.annotation", ms->sym->name) < 0) 2253 return -1; 2254 2255 fp = fopen(filename, "w"); 2256 if (fp == NULL) 2257 goto out_free_filename; 2258 2259 if (perf_evsel__is_group_event(evsel)) { 2260 perf_evsel__group_desc(evsel, buf, sizeof(buf)); 2261 ev_name = buf; 2262 } 2263 2264 fprintf(fp, "%s() %s\nEvent: %s\n\n", 2265 ms->sym->name, ms->map->dso->long_name, ev_name); 2266 symbol__annotate_fprintf2(ms->sym, fp, opts); 2267 2268 fclose(fp); 2269 err = 0; 2270 out_free_filename: 2271 free(filename); 2272 return err; 2273 } 2274 2275 void symbol__annotate_zero_histogram(struct symbol *sym, int evidx) 2276 { 2277 struct annotation *notes = symbol__annotation(sym); 2278 struct sym_hist *h = annotation__histogram(notes, evidx); 2279 2280 memset(h, 0, notes->src->sizeof_sym_hist); 2281 } 2282 2283 void symbol__annotate_decay_histogram(struct symbol *sym, int evidx) 2284 { 2285 struct annotation *notes = symbol__annotation(sym); 2286 struct sym_hist *h = annotation__histogram(notes, evidx); 2287 int len = symbol__size(sym), offset; 2288 2289 h->nr_samples = 0; 2290 for (offset = 0; offset < len; ++offset) { 2291 h->addr[offset].nr_samples = h->addr[offset].nr_samples * 7 / 8; 2292 h->nr_samples += h->addr[offset].nr_samples; 2293 } 2294 } 2295 2296 void annotated_source__purge(struct annotated_source *as) 2297 { 2298 struct annotation_line *al, *n; 2299 2300 list_for_each_entry_safe(al, n, &as->source, node) { 2301 list_del(&al->node); 2302 disasm_line__free(disasm_line(al)); 2303 } 2304 } 2305 2306 static size_t disasm_line__fprintf(struct disasm_line *dl, FILE *fp) 2307 { 2308 size_t printed; 2309 2310 if (dl->al.offset == -1) 2311 return fprintf(fp, "%s\n", dl->al.line); 2312 2313 printed = fprintf(fp, "%#" PRIx64 " %s", dl->al.offset, dl->ins.name); 2314 2315 if (dl->ops.raw[0] != '\0') { 2316 printed += fprintf(fp, "%.*s %s\n", 6 - (int)printed, " ", 2317 dl->ops.raw); 2318 } 2319 2320 return printed + fprintf(fp, "\n"); 2321 } 2322 2323 size_t disasm__fprintf(struct list_head *head, FILE *fp) 2324 { 2325 struct disasm_line *pos; 2326 size_t printed = 0; 2327 2328 list_for_each_entry(pos, head, al.node) 2329 printed += disasm_line__fprintf(pos, fp); 2330 2331 return printed; 2332 } 2333 2334 bool disasm_line__is_valid_local_jump(struct disasm_line *dl, struct symbol *sym) 2335 { 2336 if (!dl || !dl->ins.ops || !ins__is_jump(&dl->ins) || 2337 !disasm_line__has_local_offset(dl) || dl->ops.target.offset < 0 || 2338 dl->ops.target.offset >= (s64)symbol__size(sym)) 2339 return false; 2340 2341 return true; 2342 } 2343 2344 void annotation__mark_jump_targets(struct annotation *notes, struct symbol *sym) 2345 { 2346 u64 offset, size = symbol__size(sym); 2347 2348 /* PLT symbols contain external offsets */ 2349 if (strstr(sym->name, "@plt")) 2350 return; 2351 2352 for (offset = 0; offset < size; ++offset) { 2353 struct annotation_line *al = notes->offsets[offset]; 2354 struct disasm_line *dl; 2355 2356 dl = disasm_line(al); 2357 2358 if (!disasm_line__is_valid_local_jump(dl, sym)) 2359 continue; 2360 2361 al = notes->offsets[dl->ops.target.offset]; 2362 2363 /* 2364 * FIXME: Oops, no jump target? Buggy disassembler? Or do we 2365 * have to adjust to the previous offset? 2366 */ 2367 if (al == NULL) 2368 continue; 2369 2370 if (++al->jump_sources > notes->max_jump_sources) 2371 notes->max_jump_sources = al->jump_sources; 2372 2373 ++notes->nr_jumps; 2374 } 2375 } 2376 2377 void annotation__set_offsets(struct annotation *notes, s64 size) 2378 { 2379 struct annotation_line *al; 2380 2381 notes->max_line_len = 0; 2382 2383 list_for_each_entry(al, ¬es->src->source, node) { 2384 size_t line_len = strlen(al->line); 2385 2386 if (notes->max_line_len < line_len) 2387 notes->max_line_len = line_len; 2388 al->idx = notes->nr_entries++; 2389 if (al->offset != -1) { 2390 al->idx_asm = notes->nr_asm_entries++; 2391 /* 2392 * FIXME: short term bandaid to cope with assembly 2393 * routines that comes with labels in the same column 2394 * as the address in objdump, sigh. 2395 * 2396 * E.g. copy_user_generic_unrolled 2397 */ 2398 if (al->offset < size) 2399 notes->offsets[al->offset] = al; 2400 } else 2401 al->idx_asm = -1; 2402 } 2403 } 2404 2405 static inline int width_jumps(int n) 2406 { 2407 if (n >= 100) 2408 return 5; 2409 if (n / 10) 2410 return 2; 2411 return 1; 2412 } 2413 2414 void annotation__init_column_widths(struct annotation *notes, struct symbol *sym) 2415 { 2416 notes->widths.addr = notes->widths.target = 2417 notes->widths.min_addr = hex_width(symbol__size(sym)); 2418 notes->widths.max_addr = hex_width(sym->end); 2419 notes->widths.jumps = width_jumps(notes->max_jump_sources); 2420 } 2421 2422 void annotation__update_column_widths(struct annotation *notes) 2423 { 2424 if (notes->options->use_offset) 2425 notes->widths.target = notes->widths.min_addr; 2426 else 2427 notes->widths.target = notes->widths.max_addr; 2428 2429 notes->widths.addr = notes->widths.target; 2430 2431 if (notes->options->show_nr_jumps) 2432 notes->widths.addr += notes->widths.jumps + 1; 2433 } 2434 2435 static void annotation__calc_lines(struct annotation *notes, struct map *map, 2436 struct rb_root *root, 2437 struct annotation_options *opts) 2438 { 2439 struct annotation_line *al; 2440 struct rb_root tmp_root = RB_ROOT; 2441 2442 list_for_each_entry(al, ¬es->src->source, node) { 2443 double percent_max = 0.0; 2444 int i; 2445 2446 for (i = 0; i < al->data_nr; i++) { 2447 double percent; 2448 2449 percent = annotation_data__percent(&al->data[i], 2450 opts->percent_type); 2451 2452 if (percent > percent_max) 2453 percent_max = percent; 2454 } 2455 2456 if (percent_max <= 0.5) 2457 continue; 2458 2459 al->path = get_srcline(map->dso, notes->start + al->offset, NULL, 2460 false, true, notes->start + al->offset); 2461 insert_source_line(&tmp_root, al, opts); 2462 } 2463 2464 resort_source_line(root, &tmp_root); 2465 } 2466 2467 static void symbol__calc_lines(struct symbol *sym, struct map *map, 2468 struct rb_root *root, 2469 struct annotation_options *opts) 2470 { 2471 struct annotation *notes = symbol__annotation(sym); 2472 2473 annotation__calc_lines(notes, map, root, opts); 2474 } 2475 2476 int symbol__tty_annotate2(struct symbol *sym, struct map *map, 2477 struct perf_evsel *evsel, 2478 struct annotation_options *opts) 2479 { 2480 struct dso *dso = map->dso; 2481 struct rb_root source_line = RB_ROOT; 2482 struct hists *hists = evsel__hists(evsel); 2483 char buf[1024]; 2484 2485 if (symbol__annotate2(sym, map, evsel, opts, NULL) < 0) 2486 return -1; 2487 2488 if (opts->print_lines) { 2489 srcline_full_filename = opts->full_path; 2490 symbol__calc_lines(sym, map, &source_line, opts); 2491 print_summary(&source_line, dso->long_name); 2492 } 2493 2494 hists__scnprintf_title(hists, buf, sizeof(buf)); 2495 fprintf(stdout, "%s, [percent: %s]\n%s() %s\n", 2496 buf, percent_type_str(opts->percent_type), sym->name, dso->long_name); 2497 symbol__annotate_fprintf2(sym, stdout, opts); 2498 2499 annotated_source__purge(symbol__annotation(sym)->src); 2500 2501 return 0; 2502 } 2503 2504 int symbol__tty_annotate(struct symbol *sym, struct map *map, 2505 struct perf_evsel *evsel, 2506 struct annotation_options *opts) 2507 { 2508 struct dso *dso = map->dso; 2509 struct rb_root source_line = RB_ROOT; 2510 2511 if (symbol__annotate(sym, map, evsel, 0, opts, NULL) < 0) 2512 return -1; 2513 2514 symbol__calc_percent(sym, evsel); 2515 2516 if (opts->print_lines) { 2517 srcline_full_filename = opts->full_path; 2518 symbol__calc_lines(sym, map, &source_line, opts); 2519 print_summary(&source_line, dso->long_name); 2520 } 2521 2522 symbol__annotate_printf(sym, map, evsel, opts); 2523 2524 annotated_source__purge(symbol__annotation(sym)->src); 2525 2526 return 0; 2527 } 2528 2529 bool ui__has_annotation(void) 2530 { 2531 return use_browser == 1 && perf_hpp_list.sym; 2532 } 2533 2534 2535 static double annotation_line__max_percent(struct annotation_line *al, 2536 struct annotation *notes, 2537 unsigned int percent_type) 2538 { 2539 double percent_max = 0.0; 2540 int i; 2541 2542 for (i = 0; i < notes->nr_events; i++) { 2543 double percent; 2544 2545 percent = annotation_data__percent(&al->data[i], 2546 percent_type); 2547 2548 if (percent > percent_max) 2549 percent_max = percent; 2550 } 2551 2552 return percent_max; 2553 } 2554 2555 static void disasm_line__write(struct disasm_line *dl, struct annotation *notes, 2556 void *obj, char *bf, size_t size, 2557 void (*obj__printf)(void *obj, const char *fmt, ...), 2558 void (*obj__write_graph)(void *obj, int graph)) 2559 { 2560 if (dl->ins.ops && dl->ins.ops->scnprintf) { 2561 if (ins__is_jump(&dl->ins)) { 2562 bool fwd; 2563 2564 if (dl->ops.target.outside) 2565 goto call_like; 2566 fwd = dl->ops.target.offset > dl->al.offset; 2567 obj__write_graph(obj, fwd ? DARROW_CHAR : UARROW_CHAR); 2568 obj__printf(obj, " "); 2569 } else if (ins__is_call(&dl->ins)) { 2570 call_like: 2571 obj__write_graph(obj, RARROW_CHAR); 2572 obj__printf(obj, " "); 2573 } else if (ins__is_ret(&dl->ins)) { 2574 obj__write_graph(obj, LARROW_CHAR); 2575 obj__printf(obj, " "); 2576 } else { 2577 obj__printf(obj, " "); 2578 } 2579 } else { 2580 obj__printf(obj, " "); 2581 } 2582 2583 disasm_line__scnprintf(dl, bf, size, !notes->options->use_offset); 2584 } 2585 2586 static void ipc_coverage_string(char *bf, int size, struct annotation *notes) 2587 { 2588 double ipc = 0.0, coverage = 0.0; 2589 2590 if (notes->hit_cycles) 2591 ipc = notes->hit_insn / ((double)notes->hit_cycles); 2592 2593 if (notes->total_insn) { 2594 coverage = notes->cover_insn * 100.0 / 2595 ((double)notes->total_insn); 2596 } 2597 2598 scnprintf(bf, size, "(Average IPC: %.2f, IPC Coverage: %.1f%%)", 2599 ipc, coverage); 2600 } 2601 2602 static void __annotation_line__write(struct annotation_line *al, struct annotation *notes, 2603 bool first_line, bool current_entry, bool change_color, int width, 2604 void *obj, unsigned int percent_type, 2605 int (*obj__set_color)(void *obj, int color), 2606 void (*obj__set_percent_color)(void *obj, double percent, bool current), 2607 int (*obj__set_jumps_percent_color)(void *obj, int nr, bool current), 2608 void (*obj__printf)(void *obj, const char *fmt, ...), 2609 void (*obj__write_graph)(void *obj, int graph)) 2610 2611 { 2612 double percent_max = annotation_line__max_percent(al, notes, percent_type); 2613 int pcnt_width = annotation__pcnt_width(notes), 2614 cycles_width = annotation__cycles_width(notes); 2615 bool show_title = false; 2616 char bf[256]; 2617 int printed; 2618 2619 if (first_line && (al->offset == -1 || percent_max == 0.0)) { 2620 if (notes->have_cycles) { 2621 if (al->ipc == 0.0 && al->cycles == 0) 2622 show_title = true; 2623 } else 2624 show_title = true; 2625 } 2626 2627 if (al->offset != -1 && percent_max != 0.0) { 2628 int i; 2629 2630 for (i = 0; i < notes->nr_events; i++) { 2631 double percent; 2632 2633 percent = annotation_data__percent(&al->data[i], percent_type); 2634 2635 obj__set_percent_color(obj, percent, current_entry); 2636 if (notes->options->show_total_period) { 2637 obj__printf(obj, "%11" PRIu64 " ", al->data[i].he.period); 2638 } else if (notes->options->show_nr_samples) { 2639 obj__printf(obj, "%6" PRIu64 " ", 2640 al->data[i].he.nr_samples); 2641 } else { 2642 obj__printf(obj, "%6.2f ", percent); 2643 } 2644 } 2645 } else { 2646 obj__set_percent_color(obj, 0, current_entry); 2647 2648 if (!show_title) 2649 obj__printf(obj, "%-*s", pcnt_width, " "); 2650 else { 2651 obj__printf(obj, "%-*s", pcnt_width, 2652 notes->options->show_total_period ? "Period" : 2653 notes->options->show_nr_samples ? "Samples" : "Percent"); 2654 } 2655 } 2656 2657 if (notes->have_cycles) { 2658 if (al->ipc) 2659 obj__printf(obj, "%*.2f ", ANNOTATION__IPC_WIDTH - 1, al->ipc); 2660 else if (!show_title) 2661 obj__printf(obj, "%*s", ANNOTATION__IPC_WIDTH, " "); 2662 else 2663 obj__printf(obj, "%*s ", ANNOTATION__IPC_WIDTH - 1, "IPC"); 2664 2665 if (!notes->options->show_minmax_cycle) { 2666 if (al->cycles) 2667 obj__printf(obj, "%*" PRIu64 " ", 2668 ANNOTATION__CYCLES_WIDTH - 1, al->cycles); 2669 else if (!show_title) 2670 obj__printf(obj, "%*s", 2671 ANNOTATION__CYCLES_WIDTH, " "); 2672 else 2673 obj__printf(obj, "%*s ", 2674 ANNOTATION__CYCLES_WIDTH - 1, 2675 "Cycle"); 2676 } else { 2677 if (al->cycles) { 2678 char str[32]; 2679 2680 scnprintf(str, sizeof(str), 2681 "%" PRIu64 "(%" PRIu64 "/%" PRIu64 ")", 2682 al->cycles, al->cycles_min, 2683 al->cycles_max); 2684 2685 obj__printf(obj, "%*s ", 2686 ANNOTATION__MINMAX_CYCLES_WIDTH - 1, 2687 str); 2688 } else if (!show_title) 2689 obj__printf(obj, "%*s", 2690 ANNOTATION__MINMAX_CYCLES_WIDTH, 2691 " "); 2692 else 2693 obj__printf(obj, "%*s ", 2694 ANNOTATION__MINMAX_CYCLES_WIDTH - 1, 2695 "Cycle(min/max)"); 2696 } 2697 2698 if (show_title && !*al->line) { 2699 ipc_coverage_string(bf, sizeof(bf), notes); 2700 obj__printf(obj, "%*s", ANNOTATION__AVG_IPC_WIDTH, bf); 2701 } 2702 } 2703 2704 obj__printf(obj, " "); 2705 2706 if (!*al->line) 2707 obj__printf(obj, "%-*s", width - pcnt_width - cycles_width, " "); 2708 else if (al->offset == -1) { 2709 if (al->line_nr && notes->options->show_linenr) 2710 printed = scnprintf(bf, sizeof(bf), "%-*d ", notes->widths.addr + 1, al->line_nr); 2711 else 2712 printed = scnprintf(bf, sizeof(bf), "%-*s ", notes->widths.addr, " "); 2713 obj__printf(obj, bf); 2714 obj__printf(obj, "%-*s", width - printed - pcnt_width - cycles_width + 1, al->line); 2715 } else { 2716 u64 addr = al->offset; 2717 int color = -1; 2718 2719 if (!notes->options->use_offset) 2720 addr += notes->start; 2721 2722 if (!notes->options->use_offset) { 2723 printed = scnprintf(bf, sizeof(bf), "%" PRIx64 ": ", addr); 2724 } else { 2725 if (al->jump_sources && 2726 notes->options->offset_level >= ANNOTATION__OFFSET_JUMP_TARGETS) { 2727 if (notes->options->show_nr_jumps) { 2728 int prev; 2729 printed = scnprintf(bf, sizeof(bf), "%*d ", 2730 notes->widths.jumps, 2731 al->jump_sources); 2732 prev = obj__set_jumps_percent_color(obj, al->jump_sources, 2733 current_entry); 2734 obj__printf(obj, bf); 2735 obj__set_color(obj, prev); 2736 } 2737 print_addr: 2738 printed = scnprintf(bf, sizeof(bf), "%*" PRIx64 ": ", 2739 notes->widths.target, addr); 2740 } else if (ins__is_call(&disasm_line(al)->ins) && 2741 notes->options->offset_level >= ANNOTATION__OFFSET_CALL) { 2742 goto print_addr; 2743 } else if (notes->options->offset_level == ANNOTATION__MAX_OFFSET_LEVEL) { 2744 goto print_addr; 2745 } else { 2746 printed = scnprintf(bf, sizeof(bf), "%-*s ", 2747 notes->widths.addr, " "); 2748 } 2749 } 2750 2751 if (change_color) 2752 color = obj__set_color(obj, HE_COLORSET_ADDR); 2753 obj__printf(obj, bf); 2754 if (change_color) 2755 obj__set_color(obj, color); 2756 2757 disasm_line__write(disasm_line(al), notes, obj, bf, sizeof(bf), obj__printf, obj__write_graph); 2758 2759 obj__printf(obj, "%-*s", width - pcnt_width - cycles_width - 3 - printed, bf); 2760 } 2761 2762 } 2763 2764 void annotation_line__write(struct annotation_line *al, struct annotation *notes, 2765 struct annotation_write_ops *wops, 2766 struct annotation_options *opts) 2767 { 2768 __annotation_line__write(al, notes, wops->first_line, wops->current_entry, 2769 wops->change_color, wops->width, wops->obj, 2770 opts->percent_type, 2771 wops->set_color, wops->set_percent_color, 2772 wops->set_jumps_percent_color, wops->printf, 2773 wops->write_graph); 2774 } 2775 2776 int symbol__annotate2(struct symbol *sym, struct map *map, struct perf_evsel *evsel, 2777 struct annotation_options *options, struct arch **parch) 2778 { 2779 struct annotation *notes = symbol__annotation(sym); 2780 size_t size = symbol__size(sym); 2781 int nr_pcnt = 1, err; 2782 2783 notes->offsets = zalloc(size * sizeof(struct annotation_line *)); 2784 if (notes->offsets == NULL) 2785 return -1; 2786 2787 if (perf_evsel__is_group_event(evsel)) 2788 nr_pcnt = evsel->nr_members; 2789 2790 err = symbol__annotate(sym, map, evsel, 0, options, parch); 2791 if (err) 2792 goto out_free_offsets; 2793 2794 notes->options = options; 2795 2796 symbol__calc_percent(sym, evsel); 2797 2798 notes->start = map__rip_2objdump(map, sym->start); 2799 2800 annotation__set_offsets(notes, size); 2801 annotation__mark_jump_targets(notes, sym); 2802 annotation__compute_ipc(notes, size); 2803 annotation__init_column_widths(notes, sym); 2804 notes->nr_events = nr_pcnt; 2805 2806 annotation__update_column_widths(notes); 2807 sym->annotate2 = true; 2808 2809 return 0; 2810 2811 out_free_offsets: 2812 zfree(¬es->offsets); 2813 return -1; 2814 } 2815 2816 #define ANNOTATION__CFG(n) \ 2817 { .name = #n, .value = &annotation__default_options.n, } 2818 2819 /* 2820 * Keep the entries sorted, they are bsearch'ed 2821 */ 2822 static struct annotation_config { 2823 const char *name; 2824 void *value; 2825 } annotation__configs[] = { 2826 ANNOTATION__CFG(hide_src_code), 2827 ANNOTATION__CFG(jump_arrows), 2828 ANNOTATION__CFG(offset_level), 2829 ANNOTATION__CFG(show_linenr), 2830 ANNOTATION__CFG(show_nr_jumps), 2831 ANNOTATION__CFG(show_nr_samples), 2832 ANNOTATION__CFG(show_total_period), 2833 ANNOTATION__CFG(use_offset), 2834 }; 2835 2836 #undef ANNOTATION__CFG 2837 2838 static int annotation_config__cmp(const void *name, const void *cfgp) 2839 { 2840 const struct annotation_config *cfg = cfgp; 2841 2842 return strcmp(name, cfg->name); 2843 } 2844 2845 static int annotation__config(const char *var, const char *value, 2846 void *data __maybe_unused) 2847 { 2848 struct annotation_config *cfg; 2849 const char *name; 2850 2851 if (!strstarts(var, "annotate.")) 2852 return 0; 2853 2854 name = var + 9; 2855 cfg = bsearch(name, annotation__configs, ARRAY_SIZE(annotation__configs), 2856 sizeof(struct annotation_config), annotation_config__cmp); 2857 2858 if (cfg == NULL) 2859 pr_debug("%s variable unknown, ignoring...", var); 2860 else if (strcmp(var, "annotate.offset_level") == 0) { 2861 perf_config_int(cfg->value, name, value); 2862 2863 if (*(int *)cfg->value > ANNOTATION__MAX_OFFSET_LEVEL) 2864 *(int *)cfg->value = ANNOTATION__MAX_OFFSET_LEVEL; 2865 else if (*(int *)cfg->value < ANNOTATION__MIN_OFFSET_LEVEL) 2866 *(int *)cfg->value = ANNOTATION__MIN_OFFSET_LEVEL; 2867 } else { 2868 *(bool *)cfg->value = perf_config_bool(name, value); 2869 } 2870 return 0; 2871 } 2872 2873 void annotation_config__init(void) 2874 { 2875 perf_config(annotation__config, NULL); 2876 2877 annotation__default_options.show_total_period = symbol_conf.show_total_period; 2878 annotation__default_options.show_nr_samples = symbol_conf.show_nr_samples; 2879 } 2880 2881 static unsigned int parse_percent_type(char *str1, char *str2) 2882 { 2883 unsigned int type = (unsigned int) -1; 2884 2885 if (!strcmp("period", str1)) { 2886 if (!strcmp("local", str2)) 2887 type = PERCENT_PERIOD_LOCAL; 2888 else if (!strcmp("global", str2)) 2889 type = PERCENT_PERIOD_GLOBAL; 2890 } 2891 2892 if (!strcmp("hits", str1)) { 2893 if (!strcmp("local", str2)) 2894 type = PERCENT_HITS_LOCAL; 2895 else if (!strcmp("global", str2)) 2896 type = PERCENT_HITS_GLOBAL; 2897 } 2898 2899 return type; 2900 } 2901 2902 int annotate_parse_percent_type(const struct option *opt, const char *_str, 2903 int unset __maybe_unused) 2904 { 2905 struct annotation_options *opts = opt->value; 2906 unsigned int type; 2907 char *str1, *str2; 2908 int err = -1; 2909 2910 str1 = strdup(_str); 2911 if (!str1) 2912 return -ENOMEM; 2913 2914 str2 = strchr(str1, '-'); 2915 if (!str2) 2916 goto out; 2917 2918 *str2++ = 0; 2919 2920 type = parse_percent_type(str1, str2); 2921 if (type == (unsigned int) -1) 2922 type = parse_percent_type(str2, str1); 2923 if (type != (unsigned int) -1) { 2924 opts->percent_type = type; 2925 err = 0; 2926 } 2927 2928 out: 2929 free(str1); 2930 return err; 2931 } 2932