2 * Copyright (C) 2011, Red Hat Inc, Arnaldo Carvalho de Melo <acme@redhat.com>
4 * Parts came from builtin-annotate.c, see those files for further
7 * Released under the GPL v2. (and only v2, not any later version)
25 #include "block-range.h"
27 #include "arch/common.h"
30 #include <linux/bitops.h>
31 #include <linux/kernel.h>
33 /* FIXME: For the HE_COLORSET */
34 #include "ui/browser.h"
37 * FIXME: Using the same values as slang.h,
38 * but that header may not be available everywhere
/*
 * Character codes for the arrow glyphs (presumably left/right/down/up, going
 * by the macro names); per the FIXME these mirror the values in slang.h.
 */
40 #define LARROW_CHAR ((unsigned char)',')
41 #define RARROW_CHAR ((unsigned char)'+')
42 #define DARROW_CHAR ((unsigned char)'.')
43 #define UARROW_CHAR ((unsigned char)'-')
45 #include "sane_ctype.h"
/*
 * Default annotation options.  The initializers visible here select
 * jump-target offsets and the "local period" percentage type.
 */
47 struct annotation_options annotation__default_options = {
51 .offset_level = ANNOTATION__OFFSET_JUMP_TARGETS,
52 .percent_type = PERCENT_PERIOD_LOCAL,
/*
 * Compiled regex for "/path:lineno" lines in objdump output; compiled by
 * symbol__init_regexpr() and matched in symbol__parse_objdump_line().
 */
55 static regex_t file_lineno;
/* Forward declarations for helpers defined further down in this file. */
57 static struct ins_ops *ins__find(struct arch *arch, const char *name);
58 static void ins__sort(struct arch *arch);
59 static int disasm_line__parse(char *line, const char **namep, char **rawp);
/* Instruction table searched by __ins__find(). */
63 struct ins *instructions;
/* Number of table entries in use. */
64 size_t nr_instructions;
/*
 * Capacity of a heap-allocated table.  arch__grow_instructions() treats
 * 0 together with a non-NULL table as "table was not heap-allocated".
 */
65 size_t nr_instructions_allocated;
/* Optional fallback that ins__find() calls when the table lookup fails. */
66 struct ins_ops *(*associate_instruction_ops)(struct arch *arch, const char *name);
/* Set by __ins__find() once the table no longer needs sorting. */
67 bool sorted_instructions;
/* Per-architecture initialisation hook. */
72 int (*init)(struct arch *arch, char *cpuid);
/* Optional hook consulted by ins__is_fused(). */
73 bool (*ins_is_fused)(struct arch *arch, const char *ins1,
/*
 * Accessed as arch->objdump.skip_functions_char: call__parse() checks call
 * target names for this character when it is non-zero.
 */
77 char skip_functions_char;
/*
 * Tentative declarations of the per-instruction-class operation tables;
 * the initialised definitions appear later in this file.
 */
81 static struct ins_ops call_ops;
82 static struct ins_ops dec_ops;
83 static struct ins_ops jump_ops;
84 static struct ins_ops mov_ops;
85 static struct ins_ops nop_ops;
86 static struct ins_ops lock_ops;
87 static struct ins_ops ret_ops;
89 static int arch__grow_instructions(struct arch *arch)
91 struct ins *new_instructions;
92 size_t new_nr_allocated;
94 if (arch->nr_instructions_allocated == 0 && arch->instructions)
95 goto grow_from_non_allocated_table;
97 new_nr_allocated = arch->nr_instructions_allocated + 128;
98 new_instructions = realloc(arch->instructions, new_nr_allocated * sizeof(struct ins));
99 if (new_instructions == NULL)
102 out_update_instructions:
103 arch->instructions = new_instructions;
104 arch->nr_instructions_allocated = new_nr_allocated;
107 grow_from_non_allocated_table:
108 new_nr_allocated = arch->nr_instructions + 128;
109 new_instructions = calloc(new_nr_allocated, sizeof(struct ins));
110 if (new_instructions == NULL)
113 memcpy(new_instructions, arch->instructions, arch->nr_instructions);
114 goto out_update_instructions;
/*
 * Add an entry for @name to @arch's instruction table, growing the table
 * first when every allocated slot is in use.  The name is copied with
 * strdup().
 */
117 static int arch__associate_ins_ops(struct arch* arch, const char *name, struct ins_ops *ops)
/* Table full: try to grow; a non-zero result selects the branch below. */
121 if (arch->nr_instructions == arch->nr_instructions_allocated &&
122 arch__grow_instructions(arch))
/* Fill in the first unused slot. */
125 ins = &arch->instructions[arch->nr_instructions];
126 ins->name = strdup(name);
131 arch->nr_instructions++;
137 #include "arch/arm/annotate/instructions.c"
138 #include "arch/arm64/annotate/instructions.c"
139 #include "arch/x86/annotate/instructions.c"
140 #include "arch/powerpc/annotate/instructions.c"
141 #include "arch/s390/annotate/instructions.c"
142 #include "arch/sparc/annotate/instructions.c"
/*
 * Table of supported architectures.  arch__sort() orders it by name and
 * arch__find() looks entries up with bsearch().
 */
144 static struct arch architectures[] = {
147 .init = arm__annotate_init,
151 .init = arm64__annotate_init,
/* x86 is the only entry visible here that supplies a static instruction table. */
155 .init = x86__annotate_init,
156 .instructions = x86__instructions,
157 .nr_instructions = ARRAY_SIZE(x86__instructions),
158 .ins_is_fused = x86__ins_is_fused,
165 .init = powerpc__annotate_init,
169 .init = s390__annotate_init,
176 .init = sparc__annotate_init,
/*
 * Release the raw and symbolic-name strings of both the source and the
 * target operand of @ops, using zfree().
 */
183 static void ins__delete(struct ins_operands *ops)
187 zfree(&ops->source.raw);
188 zfree(&ops->source.name);
189 zfree(&ops->target.raw);
190 zfree(&ops->target.name);
193 static int ins__raw_scnprintf(struct ins *ins, char *bf, size_t size,
194 struct ins_operands *ops)
196 return scnprintf(bf, size, "%-6s %s", ins->name, ops->raw);
199 int ins__scnprintf(struct ins *ins, char *bf, size_t size,
200 struct ins_operands *ops)
202 if (ins->ops->scnprintf)
203 return ins->ops->scnprintf(ins, bf, size, ops);
205 return ins__raw_scnprintf(ins, bf, size, ops);
/*
 * Ask the architecture whether instructions @ins1 and @ins2 are fused.
 * The question is only forwarded when @arch is non-NULL and provides an
 * ->ins_is_fused hook.
 */
208 bool ins__is_fused(struct arch *arch, const char *ins1, const char *ins2)
/* No arch, or arch without the hook. */
210 if (!arch || !arch->ins_is_fused)
213 return arch->ins_is_fused(arch, ins1, ins2);
/*
 * Parse the operands of a call instruction held in ops->raw: read the
 * leading hex target address, copy the "<symbol>" name that follows it into
 * ops->target.name, and try to resolve the address to a symbol with
 * map_groups__find_ams().  A second visible path handles operands that
 * contain '*' (indirect calls).
 */
216 static int call__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms)
218 char *endptr, *tok, *name;
219 struct map *map = ms->map;
220 struct addr_map_symbol target = {
/* The operand starts with the target address in hex. */
224 ops->target.addr = strtoull(ops->raw, &endptr, 16);
226 name = strchr(endptr, '<');
/* Architectures may define a character that marks call targets to skip. */
232 if (arch->objdump.skip_functions_char &&
233 strchr(name, arch->objdump.skip_functions_char))
236 tok = strchr(name, '>');
241 ops->target.name = strdup(name);
244 if (ops->target.name == NULL)
/* Convert the parsed address with map__objdump_2mem() for the lookup. */
247 target.addr = map__objdump_2mem(map, ops->target.addr);
/* Keep the symbol only when it converts back to exactly the parsed address. */
249 if (map_groups__find_ams(&target) == 0 &&
250 map__rip_2objdump(target.map, map->map_ip(target.map, target.addr)) == ops->target.addr)
251 ops->target.sym = target.sym;
/* Indirect call path: look for the '*' marker. */
256 tok = strchr(endptr, '*');
260 /* Indirect call can use a non-rip register and offset: callq *0x8(%rbx).
261 * Do not parse such instruction. */
262 if (strstr(endptr, "(%r") == NULL)
263 ops->target.addr = strtoull(endptr, NULL, 16);
/*
 * Format a call instruction.  The visible cases, in order: print the
 * resolved symbol's name; fall back to the raw operands when no target
 * address was parsed; print the name objdump supplied; otherwise print the
 * target address in hex prefixed with '*'.
 */
268 static int call__scnprintf(struct ins *ins, char *bf, size_t size,
269 struct ins_operands *ops)
272 return scnprintf(bf, size, "%-6s %s", ins->name, ops->target.sym->name);
/* Nothing was parsed: show the operands exactly as objdump printed them. */
274 if (ops->target.addr == 0)
275 return ins__raw_scnprintf(ins, bf, size, ops);
277 if (ops->target.name)
278 return scnprintf(bf, size, "%-6s %s", ins->name, ops->target.name);
280 return scnprintf(bf, size, "%-6s *%" PRIx64, ins->name, ops->target.addr);
/* Operations for call instructions: custom operand parser and formatter. */
283 static struct ins_ops call_ops = {
284 .parse = call__parse,
285 .scnprintf = call__scnprintf,
288 bool ins__is_call(const struct ins *ins)
290 return ins->ops == &call_ops || ins->ops == &s390_call_ops;
294 * Prevents from matching commas in the comment section, e.g.:
295 * ffff200008446e70: b.cs ffff2000084470f4 <generic_exec_single+0x314> // b.hs, b.nlast
/*
 * Check a comma position @c found in ops->raw against the start of the
 * objdump comment recorded in ops->raw_comment.  The visible test detects a
 * comma that lies after the comment start.
 */
297 static inline const char *validate_comma(const char *c, struct ins_operands *ops)
/* True when a comment start is known and @c points past it. */
299 if (ops->raw_comment && c > ops->raw_comment)
/*
 * Parse the operands of a jump instruction held in ops->raw.
 *
 * Finds the target address (possibly after one or two leading operands
 * separated by commas), records whether the target lies outside the
 * current symbol, tries to resolve it to a symbol with
 * map_groups__find_ams(), and for targets inside the symbol stores the
 * offset from the symbol start.
 */
305 static int jump__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms)
307 struct map *map = ms->map;
308 struct symbol *sym = ms->sym;
309 struct addr_map_symbol target = {
312 const char *c = strchr(ops->raw, ',');
/* Remember where the comment starts so commas inside it can be rejected. */
315 ops->raw_comment = strchr(ops->raw, arch->objdump.comment_char);
316 c = validate_comma(c, ops);
319 * Examples of lines to parse for the _cpp_lex_token@@Base
322 * 1159e6c: jne 115aa32 <_cpp_lex_token@@Base+0xf92>
323 * 1159e8b: jne c469be <cpp_named_operator2name@@Base+0xa72>
325 * The first is a jump to an offset inside the same function,
326 * the second is to another function, i.e. that 0xa72 is an
327 * offset in the cpp_named_operator2name@@base function.
330 * skip over possible up to 2 operands to get to address, e.g.:
331 * tbnz w0, #26, ffff0000083cd190 <security_file_permission+0xd0>
/* Try the text at @c as a hex address. */
334 ops->target.addr = strtoull(c, NULL, 16);
/* Zero result: retry from a later position in the operand list. */
335 if (!ops->target.addr) {
337 c = validate_comma(c, ops);
339 ops->target.addr = strtoull(c, NULL, 16);
/* Parse the address from the very start of the operands. */
342 ops->target.addr = strtoull(ops->raw, NULL, 16);
/* Compare the converted target against the symbol's [start, end] range. */
345 target.addr = map__objdump_2mem(map, ops->target.addr);
346 start = map->unmap_ip(map, sym->start),
347 end = map->unmap_ip(map, sym->end);
349 ops->target.outside = target.addr < start || target.addr > end;
352 * FIXME: things like this in _cpp_lex_token (gcc's cc1 program):
354 cpp_named_operator2name@@Base+0xa72
356 * Point to a place that is after the cpp_named_operator2name
357 * boundaries, i.e. in the ELF symbol table for cc1
358 * cpp_named_operator2name is marked as being 32-bytes long, but it in
359 * fact is much larger than that, so we seem to need a symbols__find()
360 * routine that looks for >= current->start and < next_symbol->start,
361 * possibly just for C++ objects?
363 * For now lets just make some progress by marking jumps to outside the
364 * current function as call like.
366 * Actual navigation will come next, with further understanding of how
367 * the symbol searching and disassembly should be done.
/* Keep the symbol only when it converts back to exactly the parsed address. */
369 if (map_groups__find_ams(&target) == 0 &&
370 map__rip_2objdump(target.map, map->map_ip(target.map, target.addr)) == ops->target.addr)
371 ops->target.sym = target.sym;
/* An offset is only recorded for targets inside the current symbol. */
373 if (!ops->target.outside) {
374 ops->target.offset = target.addr - start;
375 ops->target.offset_avail = true;
377 ops->target.offset_avail = false;
/*
 * Format a jump instruction.  Falls back to the raw operands when no target
 * address is known or the offset is negative; prints the target symbol's
 * name for jumps that leave the current symbol; otherwise prints any
 * leading operands (up to the relevant comma) followed by a hex value.
 */
383 static int jump__scnprintf(struct ins *ins, char *bf, size_t size,
384 struct ins_operands *ops)
388 if (!ops->target.addr || ops->target.offset < 0)
389 return ins__raw_scnprintf(ins, bf, size, ops);
391 if (ops->target.outside && ops->target.sym != NULL)
392 return scnprintf(bf, size, "%-6s %s", ins->name, ops->target.sym->name);
/* Locate the first comma that is not inside the trailing comment. */
394 c = strchr(ops->raw, ',');
395 c = validate_comma(c, ops);
398 const char *c2 = strchr(c + 1, ',');
400 c2 = validate_comma(c2, ops);
401 /* check for 3-op insn */
406 /* mirror arch objdump's space-after-comma style */
/* "%.*s" prints the operand prefix up to @c, or nothing when @c is NULL. */
411 return scnprintf(bf, size, "%-6s %.*s%" PRIx64,
412 ins->name, c ? c - ops->raw : 0, ops->raw,
/* Operations for jump instructions: custom operand parser and formatter. */
416 static struct ins_ops jump_ops = {
417 .parse = jump__parse,
418 .scnprintf = jump__scnprintf,
421 bool ins__is_jump(const struct ins *ins)
423 return ins->ops == &jump_ops;
/*
 * Pull symbol information for a %rip-relative operand out of an objdump
 * comment: the hex address at the start of @comment goes to *@addrp and a
 * strdup()ed copy of the "<name>" that follows goes to *@namep.
 */
426 static int comment__symbol(char *raw, char *comment, u64 *addrp, char **namep)
428 char *endptr, *name, *t;
/* Only operands that reference (%rip) are considered. */
430 if (strstr(raw, "(%rip)") == NULL)
433 *addrp = strtoull(comment, &endptr, 16);
/* strtoull() consumed nothing: the comment does not start with a number. */
434 if (endptr == comment)
436 name = strchr(endptr, '<');
442 t = strchr(name, '>');
447 *namep = strdup(name);
/*
 * Parse an instruction carrying a "lock" prefix.  The operand text of the
 * prefix is itself an instruction, so it is split again with
 * disasm_line__parse(), its operations are looked up with ins__find(), and
 * that parser (if any) runs on a separately allocated ins_operands stored
 * in ops->locked.ops.
 */
453 static int lock__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms)
455 ops->locked.ops = zalloc(sizeof(*ops->locked.ops));
456 if (ops->locked.ops == NULL)
/* Split "name operands" of the nested instruction. */
459 if (disasm_line__parse(ops->raw, &ops->locked.ins.name, &ops->locked.ops->raw) < 0)
462 ops->locked.ins.ops = ins__find(arch, ops->locked.ins.name);
464 if (ops->locked.ins.ops == NULL)
/* Run the nested instruction's own parser when it has one. */
467 if (ops->locked.ins.ops->parse &&
468 ops->locked.ins.ops->parse(arch, ops->locked.ops, ms) < 0)
474 zfree(&ops->locked.ops);
/*
 * Format a lock-prefixed instruction: the prefix itself in a six-column
 * field, then the nested instruction formatted by ins__scnprintf().  When
 * no operations were found for the nested instruction the raw text is
 * printed instead.  Returns the sum of both scnprintf results.
 */
478 static int lock__scnprintf(struct ins *ins, char *bf, size_t size,
479 struct ins_operands *ops)
483 if (ops->locked.ins.ops == NULL)
484 return ins__raw_scnprintf(ins, bf, size, ops);
486 printed = scnprintf(bf, size, "%-6s ", ins->name);
/* Continue writing right after the prefix, in the remaining space. */
487 return printed + ins__scnprintf(&ops->locked.ins, bf + printed,
488 size - printed, ops->locked.ops);
/*
 * Release everything lock__parse() attached to @ops: the nested
 * instruction's operands (through its own ->free hook when it has one;
 * ins__delete() is the generic release), the nested ins_operands container
 * itself, and this instruction's target strings.
 */
491 static void lock__delete(struct ins_operands *ops)
493 struct ins *ins = &ops->locked.ins;
495 if (ins->ops && ins->ops->free)
496 ins->ops->free(ops->locked.ops);
498 ins__delete(ops->locked.ops);
500 zfree(&ops->locked.ops);
501 zfree(&ops->target.raw);
502 zfree(&ops->target.name);
/* Operations for lock-prefixed instructions: release, parse and format hooks. */
505 static struct ins_ops lock_ops = {
506 .free = lock__delete,
507 .parse = lock__parse,
508 .scnprintf = lock__scnprintf,
/*
 * Parse a two-operand "source,target" instruction.  The operand text is
 * split at the first comma into ops->source.raw and ops->target.raw (both
 * strdup()ed), and when an objdump comment follows, comment__symbol() is
 * asked to fill in address and name for each operand.
 */
511 static int mov__parse(struct arch *arch, struct ins_operands *ops, struct map_symbol *ms __maybe_unused)
513 char *s = strchr(ops->raw, ','), *target, *comment, prev;
519 ops->source.raw = strdup(ops->raw);
522 if (ops->source.raw == NULL)
/* Look for the start of a trailing objdump comment. */
526 comment = strchr(s, arch->objdump.comment_char);
/* No comment case: start from the last character of the string. */
531 s = strchr(s, '\0') - 1;
/* Walk back over trailing whitespace of the target operand. */
533 while (s > target && isspace(s[0]))
539 ops->target.raw = strdup(target);
542 if (ops->target.raw == NULL)
543 goto out_free_source;
/* comment + 1 skips the comment character itself. */
548 comment = ltrim(comment);
549 comment__symbol(ops->source.raw, comment + 1, &ops->source.addr, &ops->source.name);
550 comment__symbol(ops->target.raw, comment + 1, &ops->target.addr, &ops->target.name);
555 zfree(&ops->source.raw);
559 static int mov__scnprintf(struct ins *ins, char *bf, size_t size,
560 struct ins_operands *ops)
562 return scnprintf(bf, size, "%-6s %s,%s", ins->name,
563 ops->source.name ?: ops->source.raw,
564 ops->target.name ?: ops->target.raw);
/* Operations for two-operand (mov-like) instructions. */
567 static struct ins_ops mov_ops = {
569 .scnprintf = mov__scnprintf,
/*
 * Parse a single-operand instruction: the operand is the text of ops->raw
 * up to the first whitespace, copied into ops->target.raw.  When an objdump
 * comment follows, comment__symbol() is asked for the operand's address and
 * name.
 *
 * NOTE(review): @arch is marked __maybe_unused but is dereferenced below to
 * read objdump.comment_char.
 */
572 static int dec__parse(struct arch *arch __maybe_unused, struct ins_operands *ops, struct map_symbol *ms __maybe_unused)
574 char *target, *comment, *s, prev;
576 target = s = ops->raw;
/* Scan to the end of the operand (first whitespace or end of string). */
578 while (s[0] != '\0' && !isspace(s[0]))
583 ops->target.raw = strdup(target);
586 if (ops->target.raw == NULL)
589 comment = strchr(s, arch->objdump.comment_char);
/* comment + 1 skips the comment character itself. */
593 comment = ltrim(comment);
594 comment__symbol(ops->target.raw, comment + 1, &ops->target.addr, &ops->target.name);
599 static int dec__scnprintf(struct ins *ins, char *bf, size_t size,
600 struct ins_operands *ops)
602 return scnprintf(bf, size, "%-6s %s", ins->name,
603 ops->target.name ?: ops->target.raw);
/* Operations for single-operand (dec-like) instructions. */
606 static struct ins_ops dec_ops = {
608 .scnprintf = dec__scnprintf,
611 static int nop__scnprintf(struct ins *ins __maybe_unused, char *bf, size_t size,
612 struct ins_operands *ops __maybe_unused)
614 return scnprintf(bf, size, "%-6s", "nop");
/* Operations for no-op instructions: only a formatter. */
617 static struct ins_ops nop_ops = {
618 .scnprintf = nop__scnprintf,
/* Operations for return instructions: printed with the raw formatter. */
621 static struct ins_ops ret_ops = {
622 .scnprintf = ins__raw_scnprintf,
625 bool ins__is_ret(const struct ins *ins)
627 return ins->ops == &ret_ops;
630 bool ins__is_lock(const struct ins *ins)
632 return ins->ops == &lock_ops;
635 static int ins__key_cmp(const void *name, const void *insp)
637 const struct ins *ins = insp;
639 return strcmp(name, ins->name);
642 static int ins__cmp(const void *a, const void *b)
644 const struct ins *ia = a;
645 const struct ins *ib = b;
647 return strcmp(ia->name, ib->name);
650 static void ins__sort(struct arch *arch)
652 const int nmemb = arch->nr_instructions;
654 qsort(arch->instructions, nmemb, sizeof(struct ins), ins__cmp);
/*
 * Look up the operations for instruction @name in @arch's table with
 * bsearch().  The sorted_instructions flag makes the preparation step run
 * only on the first lookup.  Returns the entry's ops, or NULL when the name
 * is not in the table.
 */
657 static struct ins_ops *__ins__find(struct arch *arch, const char *name)
660 const int nmemb = arch->nr_instructions;
/* First lookup for this arch: mark the table as sorted from now on. */
662 if (!arch->sorted_instructions) {
664 arch->sorted_instructions = true;
667 ins = bsearch(name, arch->instructions, nmemb, sizeof(struct ins), ins__key_cmp);
668 return ins ? ins->ops : NULL;
/*
 * Find the operations for instruction @name: first in the arch table, then
 * through the arch's associate_instruction_ops callback when the table has
 * no entry and the callback exists.
 */
671 static struct ins_ops *ins__find(struct arch *arch, const char *name)
673 struct ins_ops *ops = __ins__find(arch, name);
/* Table miss: let the architecture associate ops with the name. */
675 if (!ops && arch->associate_instruction_ops)
676 ops = arch->associate_instruction_ops(arch, name);
681 static int arch__key_cmp(const void *name, const void *archp)
683 const struct arch *arch = archp;
685 return strcmp(name, arch->name);
688 static int arch__cmp(const void *a, const void *b)
690 const struct arch *aa = a;
691 const struct arch *ab = b;
693 return strcmp(aa->name, ab->name);
696 static void arch__sort(void)
698 const int nmemb = ARRAY_SIZE(architectures);
700 qsort(architectures, nmemb, sizeof(struct arch), arch__cmp);
/*
 * Look up an architecture by @name in architectures[] with bsearch();
 * the result is NULL when no entry has that name.
 */
703 static struct arch *arch__find(const char *name)
705 const int nmemb = ARRAY_SIZE(architectures);
713 return bsearch(name, architectures, nmemb, sizeof(struct arch), arch__key_cmp);
/*
 * Allocate a zeroed annotated_source with zalloc() and initialise its
 * ->source list head.
 */
716 static struct annotated_source *annotated_source__new(void)
718 struct annotated_source *src = zalloc(sizeof(*src));
721 INIT_LIST_HEAD(&src->source);
/* Release the sample histograms and the cycles histogram owned by @src. */
726 static __maybe_unused void annotated_source__delete(struct annotated_source *src)
730 zfree(&src->histograms);
731 zfree(&src->cycles_hist);
735 static int annotated_source__alloc_histograms(struct annotated_source *src,
736 size_t size, int nr_hists)
738 size_t sizeof_sym_hist;
741 * Add buffer of one element for zero length symbol.
742 * When sample is taken from first instruction of
743 * zero length symbol, perf still resolves it and
744 * shows symbol name in perf report and allows to
750 /* Check for overflow when calculating sizeof_sym_hist */
751 if (size > (SIZE_MAX - sizeof(struct sym_hist)) / sizeof(struct sym_hist_entry))
754 sizeof_sym_hist = (sizeof(struct sym_hist) + size * sizeof(struct sym_hist_entry));
756 /* Check for overflow in zalloc argument */
757 if (sizeof_sym_hist > SIZE_MAX / nr_hists)
760 src->sizeof_sym_hist = sizeof_sym_hist;
761 src->nr_histograms = nr_hists;
762 src->histograms = calloc(nr_hists, sizeof_sym_hist) ;
763 return src->histograms ? 0 : -1;
766 /* The cycles histogram is lazily allocated. */
/*
 * Allocates one zeroed struct cyc_hist per byte of @sym (symbol__size())
 * and stores the array in the symbol's annotation source.
 */
767 static int symbol__alloc_hist_cycles(struct symbol *sym)
769 struct annotation *notes = symbol__annotation(sym);
770 const size_t size = symbol__size(sym);
772 notes->src->cycles_hist = calloc(size, sizeof(struct cyc_hist));
773 if (notes->src->cycles_hist == NULL)
778 void symbol__annotate_zero_histograms(struct symbol *sym)
780 struct annotation *notes = symbol__annotation(sym);
782 pthread_mutex_lock(¬es->lock);
783 if (notes->src != NULL) {
784 memset(notes->src->histograms, 0,
785 notes->src->nr_histograms * notes->src->sizeof_sym_hist);
786 if (notes->src->cycles_hist)
787 memset(notes->src->cycles_hist, 0,
788 symbol__size(sym) * sizeof(struct cyc_hist));
790 pthread_mutex_unlock(¬es->lock);
/*
 * Account @cycles for the basic block ending at @offset in the cycles
 * histogram @ch.  Aggregate counters (count, sum, max, min) are always
 * updated; the per-block fields (start, cycles, have_start) follow the
 * overlap policy described in the comment below.
 */
793 static int __symbol__account_cycles(struct cyc_hist *ch,
795 unsigned offset, unsigned cycles,
799 * For now we can only account one basic block per
800 * final jump. But multiple could be overlapping.
801 * Always account the longest one. So when
802 * a shorter one has been already seen throw it away.
804 * We separately always account the full cycles.
806 ch[offset].num_aggr++;
807 ch[offset].cycles_aggr += cycles;
/* Track the largest cycle count seen for this offset. */
809 if (cycles > ch[offset].cycles_max)
810 ch[offset].cycles_max = cycles;
/* Track the smallest non-zero cycle count; the first value seeds it. */
812 if (ch[offset].cycles_min) {
813 if (cycles && cycles < ch[offset].cycles_min)
814 ch[offset].cycles_min = cycles;
816 ch[offset].cycles_min = cycles;
/* A block without a start does not replace one that has a start. */
818 if (!have_start && ch[offset].have_start)
820 if (ch[offset].num) {
/* New block starts earlier (or the old one had no start): restart accounting. */
821 if (have_start && (!ch[offset].have_start ||
822 ch[offset].start > start)) {
823 ch[offset].have_start = 0;
824 ch[offset].cycles = 0;
/* The reset counter saturates at 0xffff. */
826 if (ch[offset].reset < 0xffff)
828 } else if (have_start &&
829 ch[offset].start < start)
832 ch[offset].have_start = have_start;
833 ch[offset].start = start;
834 ch[offset].cycles += cycles;
/*
 * Record one sample at @addr in the histogram of event @evidx belonging to
 * @src: bumps the per-address sample count and adds the sample's period to
 * both the per-address and the whole-histogram totals.  Addresses outside
 * the symbol are reported with an ERANGE debug message.
 */
839 static int __symbol__inc_addr_samples(struct symbol *sym, struct map *map,
840 struct annotated_source *src, int evidx, u64 addr,
841 struct perf_sample *sample)
846 pr_debug3("%s: addr=%#" PRIx64 "\n", __func__, map->unmap_ip(map, addr));
/*
 * Out of range, except for the special case of a zero-length symbol
 * (start == end) sampled exactly at that address.
 */
848 if ((addr < sym->start || addr >= sym->end) &&
849 (addr != sym->end || sym->start != sym->end)) {
850 pr_debug("%s(%d): ERANGE! sym->name=%s, start=%#" PRIx64 ", addr=%#" PRIx64 ", end=%#" PRIx64 "\n",
851 __func__, __LINE__, sym->name, sym->start, addr, sym->end);
/* Histogram entries are indexed by byte offset from the symbol start. */
855 offset = addr - sym->start;
856 h = annotated_source__histogram(src, evidx);
858 pr_debug("%s(%d): ENOMEM! sym->name=%s, start=%#" PRIx64 ", addr=%#" PRIx64 ", end=%#" PRIx64 ", func: %d\n",
859 __func__, __LINE__, sym->name, sym->start, addr, sym->end, sym->type == STT_FUNC);
863 h->addr[offset].nr_samples++;
864 h->period += sample->period;
865 h->addr[offset].period += sample->period;
867 pr_debug3("%#" PRIx64 " %s: period++ [addr: %#" PRIx64 ", %#" PRIx64
868 ", evidx=%d] => nr_samples: %" PRIu64 ", period: %" PRIu64 "\n",
869 sym->start, sym->name, addr, addr - sym->start, evidx,
870 h->addr[offset].nr_samples, h->addr[offset].period);
/*
 * Return the cycles histogram of @sym, creating the annotation source
 * and/or the histogram on first use.  The result is whatever
 * notes->src->cycles_hist holds afterwards, so it is NULL when the
 * histogram allocation failed.
 */
874 static struct cyc_hist *symbol__cycles_hist(struct symbol *sym)
876 struct annotation *notes = symbol__annotation(sym);
/* No annotation source yet: create it, then go allocate the histogram. */
878 if (notes->src == NULL) {
879 notes->src = annotated_source__new();
880 if (notes->src == NULL)
882 goto alloc_cycles_hist;
885 if (!notes->src->cycles_hist) {
887 symbol__alloc_hist_cycles(sym);
890 return notes->src->cycles_hist;
/*
 * Make sure @sym has an annotation source with sample histograms, creating
 * the source and/or allocating the histograms (sized by symbol__size()) on
 * first use.
 */
893 struct annotated_source *symbol__hists(struct symbol *sym, int nr_hists)
895 struct annotation *notes = symbol__annotation(sym);
/* No annotation source yet: create it, then go allocate the histograms. */
897 if (notes->src == NULL) {
898 notes->src = annotated_source__new();
899 if (notes->src == NULL)
901 goto alloc_histograms;
904 if (notes->src->histograms == NULL) {
906 annotated_source__alloc_histograms(notes->src, symbol__size(sym),
/*
 * Record a sample for @sym at @addr under event @evsel.  The histograms
 * are obtained (and created if needed) through symbol__hists(), sized for
 * every event in the evsel's list; the event's index selects the histogram.
 */
913 static int symbol__inc_addr_samples(struct symbol *sym, struct map *map,
914 struct perf_evsel *evsel, u64 addr,
915 struct perf_sample *sample)
917 struct annotated_source *src;
921 src = symbol__hists(sym, evsel->evlist->nr_entries);
924 return __symbol__inc_addr_samples(sym, map, src, evsel->idx, addr, sample);
/*
 * Account @cycles for a basic block of @sym that ends at @addr and starts
 * at @start (0 meaning "no start known").  Both addresses are checked
 * against the symbol's [start, end) range before being turned into offsets
 * for __symbol__account_cycles().
 */
927 static int symbol__account_cycles(u64 addr, u64 start,
928 struct symbol *sym, unsigned cycles)
930 struct cyc_hist *cycles_hist;
935 cycles_hist = symbol__cycles_hist(sym);
936 if (cycles_hist == NULL)
938 if (addr < sym->start || addr >= sym->end)
942 if (start < sym->start || start >= sym->end)
947 offset = addr - sym->start;
948 return __symbol__account_cycles(cycles_hist,
/* A zero start is passed through as offset 0. */
949 start ? start - sym->start : 0,
/*
 * Account cycles for the basic block that ends at @ams and began at @start.
 * The block start is only forwarded when it qualifies under the rule in the
 * comment below; otherwise a "bad start" debug message is printed.  A
 * failure from symbol__account_cycles() is logged at debug level 2.
 */
954 int addr_map_symbol__account_cycles(struct addr_map_symbol *ams,
955 struct addr_map_symbol *start,
965 * Only set start when IPC can be computed. We can only
966 * compute it when the basic block is completely in a single
968 * Special case the case when the jump is elsewhere, but
969 * it starts on the function start.
972 (start->sym == ams->sym ||
974 start->addr == ams->sym->start + ams->map->start)))
975 saddr = start->al_addr;
977 pr_debug2("BB with bad start: addr %"PRIx64" start %"PRIx64" sym %"PRIx64" saddr %"PRIx64"\n",
979 start ? start->addr : 0,
980 ams->sym ? ams->sym->start + ams->map->start : 0,
982 err = symbol__account_cycles(ams->al_addr, saddr, ams->sym, cycles);
984 pr_debug2("account_cycles failed %d\n", err);
/*
 * Walk the byte offsets @start..@end (inclusive) and test each for an
 * entry in notes->offsets[].
 */
988 static unsigned annotation__count_insn(struct annotation *notes, u64 start, u64 end)
993 for (offset = start; offset <= end; offset++) {
/* A non-NULL slot means an annotation line begins at this offset. */
994 if (notes->offsets[offset])
/*
 * Compute the instructions-per-cycle figure for the basic block
 * @start..@end from the block's histogram entry @ch and visit the
 * annotation lines inside the block.
 */
1000 static void annotation__count_and_fill(struct annotation *notes, u64 start, u64 end, struct cyc_hist *ch)
1005 n_insn = annotation__count_insn(notes, start, end);
/* IPC = instructions / average cycles per execution of the block. */
1006 if (n_insn && ch->num && ch->cycles) {
1007 float ipc = n_insn / ((double)ch->cycles / (double)ch->num);
1009 /* Hide data when there are too many overlaps. */
1010 if (ch->reset >= 0x7fff || ch->reset >= ch->num / 2)
1013 for (offset = start; offset <= end; offset++) {
1014 struct annotation_line *al = notes->offsets[offset];
1022 void annotation__compute_ipc(struct annotation *notes, size_t size)
1026 if (!notes->src || !notes->src->cycles_hist)
1029 pthread_mutex_lock(¬es->lock);
1030 for (offset = 0; offset < size; ++offset) {
1031 struct cyc_hist *ch;
1033 ch = ¬es->src->cycles_hist[offset];
1034 if (ch && ch->cycles) {
1035 struct annotation_line *al;
1038 annotation__count_and_fill(notes, ch->start, offset, ch);
1039 al = notes->offsets[offset];
1040 if (al && ch->num_aggr) {
1041 al->cycles = ch->cycles_aggr / ch->num_aggr;
1042 al->cycles_max = ch->cycles_max;
1043 al->cycles_min = ch->cycles_min;
1045 notes->have_cycles = true;
1048 pthread_mutex_unlock(¬es->lock);
1051 int addr_map_symbol__inc_samples(struct addr_map_symbol *ams, struct perf_sample *sample,
1052 struct perf_evsel *evsel)
1054 return symbol__inc_addr_samples(ams->sym, ams->map, evsel, ams->al_addr, sample);
1057 int hist_entry__inc_addr_samples(struct hist_entry *he, struct perf_sample *sample,
1058 struct perf_evsel *evsel, u64 ip)
1060 return symbol__inc_addr_samples(he->ms.sym, he->ms.map, evsel, ip, sample);
/*
 * Attach instruction operations to @dl: look them up by mnemonic with
 * ins__find() and run the class-specific operand parser when there is one.
 */
1063 static void disasm_line__init_ins(struct disasm_line *dl, struct arch *arch, struct map_symbol *ms)
1065 dl->ins.ops = ins__find(arch, dl->ins.name);
/* A negative result from ->parse() means the operands could not be parsed. */
1070 if (dl->ins.ops->parse && dl->ins.ops->parse(arch, &dl->ops, ms) < 0)
/*
 * Split a disassembly line into mnemonic and operand text.
 *
 * @line:  text to split; leading whitespace is skipped with ltrim()
 * @namep: out: strdup()ed copy of the mnemonic, owned by the caller;
 *         set to NULL when the copy could not be allocated
 * @rawp:  out: pointer into @line at the first operand character
 *
 * Returns 0 on success, -1 when the line is empty or strdup() fails.
 */
static int disasm_line__parse(char *line, const char **namep, char **rawp)
{
	char tmp, *name = ltrim(line);

	if (name[0] == '\0')
		return -1;

	*rawp = name + 1;

	/* The mnemonic ends at the first whitespace character. */
	while ((*rawp)[0] != '\0' && !isspace((*rawp)[0]))
		++*rawp;

	/* Terminate the mnemonic temporarily so strdup() copies only it. */
	tmp = (*rawp)[0];
	(*rawp)[0] = '\0';
	*namep = strdup(name);

	/* Undo the temporary terminator on success and failure alike. */
	(*rawp)[0] = tmp;

	if (*namep == NULL)
		goto out_free_name;

	*rawp = ltrim(*rawp);

	return 0;

out_free_name:
	/*
	 * Release the string, not @namep itself: @namep is the address of
	 * the caller's pointer (typically a struct member), and passing
	 * that to free() would corrupt the heap.
	 */
	free((void *)*namep);
	*namep = NULL;
	return -1;
}
/*
 * Parameters threaded through the line-construction helpers.  Besides the
 * members visible here, the helpers in this file read ->privsize, ->arch,
 * ->offset, ->line and ->line_nr.
 */
1104 struct annotate_args {
/* Map and symbol being annotated. */
1107 struct map_symbol ms;
/* Event the annotation is computed for. */
1108 struct perf_evsel *evsel;
1109 struct annotation_options *options;
/*
 * Release an annotation line.  The line was allocated with al->privsize
 * bytes of private space in front of it, so the start of the allocation is
 * recovered by stepping back that many bytes.
 */
1115 static void annotation_line__delete(struct annotation_line *al)
1117 void *ptr = (void *) al - al->privsize;
1119 free_srcline(al->path);
1125 * Allocating the annotation line data with following
1128 * --------------------------------------
1129 * private space | struct annotation_line
1130 * --------------------------------------
1132 * Size of the private space is stored in 'struct annotation_line'.
/*
 * Allocate an annotation line preceded by @privsize bytes of private space
 * and followed by one data slot per event (per group member for group
 * events).  Offset, line text (strdup()ed) and line number are taken from
 * @args.
 */
1135 static struct annotation_line *
1136 annotation_line__new(struct annotate_args *args, size_t privsize)
1138 struct annotation_line *al;
1139 struct perf_evsel *evsel = args->evsel;
1140 size_t size = privsize + sizeof(*al);
/* Group events need one data slot per group member. */
1143 if (perf_evsel__is_group_event(evsel))
1144 nr = evsel->nr_members;
1146 size += sizeof(al->data[0]) * nr;
/* Skip over the private space: the returned pointer is the line itself. */
1150 al = (void *) al + privsize;
1151 al->privsize = privsize;
1152 al->offset = args->offset;
1153 al->line = strdup(args->line);
1154 al->line_nr = args->line_nr;
1162 * Allocating the disasm annotation line data with
1163 * following structure:
1165 * ------------------------------------------------------------
1166 * privsize space | struct disasm_line | struct annotation_line
1167 * ------------------------------------------------------------
1169 * We have 'struct annotation_line' member as last member
1170 * of 'struct disasm_line' to have an easy access.
/*
 * Create a disasm_line for the text in @args.  The embedded annotation
 * line is allocated with enough private space in front of it to hold the
 * caller's private area plus the leading part of struct disasm_line.  Lines
 * with a real offset (not -1) are split into mnemonic and operands and get
 * their instruction operations attached.
 */
1173 static struct disasm_line *disasm_line__new(struct annotate_args *args)
1175 struct disasm_line *dl = NULL;
1176 struct annotation_line *al;
1177 size_t privsize = args->privsize + offsetof(struct disasm_line, al);
1179 al = annotation_line__new(args, privsize);
1181 dl = disasm_line(al);
/* annotation_line__new() could not duplicate the line text. */
1183 if (dl->al.line == NULL)
/* Offset -1 marks a non-disassembly line; nothing to parse then. */
1186 if (args->offset != -1) {
1187 if (disasm_line__parse(dl->al.line, &dl->ins.name, &dl->ops.raw) < 0)
1190 disasm_line__init_ins(dl, args->arch, &args->ms);
1197 zfree(&dl->al.line);
/*
 * Release a disasm_line: its operands (through the instruction class's own
 * ->free hook when it has one; ins__delete() is the generic release), the
 * mnemonic string, and finally the embedded annotation line.
 */
1203 void disasm_line__free(struct disasm_line *dl)
1205 if (dl->ins.ops && dl->ins.ops->free)
1206 dl->ins.ops->free(&dl->ops);
1208 ins__delete(&dl->ops);
/* The cast drops the const qualifier of ins.name for free(). */
1209 free((void *)dl->ins.name);
1210 dl->ins.name = NULL;
1211 annotation_line__delete(&dl->al);
1214 int disasm_line__scnprintf(struct disasm_line *dl, char *bf, size_t size, bool raw)
1216 if (raw || !dl->ins.ops)
1217 return scnprintf(bf, size, "%-6s %s", dl->ins.name, dl->ops.raw);
1219 return ins__scnprintf(&dl->ins, bf, size, &dl->ops);
1222 static void annotation_line__add(struct annotation_line *al, struct list_head *head)
1224 list_add_tail(&al->node, head);
/*
 * Continue walking the list @head after @pos, looking for the next line
 * with a non-negative offset.
 */
1227 struct annotation_line *
1228 annotation_line__next(struct annotation_line *pos, struct list_head *head)
1230 list_for_each_entry_continue(pos, head, node)
1231 if (pos->offset >= 0)
/*
 * Choose the colour for an address column from the coverage of its block
 * range: red, normal or magenta, per the thresholds noted below.
 */
1237 static const char *annotate__address_color(struct block_range *br)
1239 double cov = block_range__coverage(br);
1242 /* mark red for >75% coverage */
1244 return PERF_COLOR_RED;
1246 /* mark dull for <1% coverage */
1248 return PERF_COLOR_NORMAL;
1251 return PERF_COLOR_MAGENTA;
/*
 * Choose the colour for the disassembly text from the coverage of its
 * block range: normal or blue.
 */
1254 static const char *annotate__asm_color(struct block_range *br)
1256 double cov = block_range__coverage(br);
1259 /* mark dull for <1% coverage */
1261 return PERF_COLOR_NORMAL;
1264 return PERF_COLOR_BLUE;
/*
 * Print branch statistics for @addr after its disassembly text: for a
 * branch target, the share of coverage joining here; for a branch, the
 * share leaving and the prediction ratio.
 */
1267 static void annotate__branch_printf(struct block_range *br, u64 addr)
1269 bool emit_comment = true;
/* @addr is the first address of a range that is a branch target. */
1275 if (br->is_target && br->start == addr) {
1276 struct block_range *branch = br;
1280 * Find matching branch to our target.
1282 while (!branch->is_branch)
1283 branch = block_range__next(branch);
1285 p = 100 *(double)br->entry / branch->coverage;
1289 emit_comment = false;
1294 * The percentage of coverage joined at this target in relation
1295 * to the next branch.
1297 printf(" +%.2f%%", p);
/* @addr is the last address of a range that ends in a branch. */
1301 if (br->is_branch && br->end == addr) {
1302 double p = 100*(double)br->taken / br->coverage;
1306 emit_comment = false;
1311 * The percentage of coverage leaving at this branch, and
1312 * its prediction ratio.
1314 printf(" -%.2f%% (p:%.2f%%)", p, 100*(double)br->pred / br->taken);
/*
 * Print one disassembly line to stdout: the address (symbol @start plus the
 * line's offset) padded to @addr_fmt_width, the line text, and any branch
 * statistics, each coloured by block-range coverage.
 */
1319 static int disasm_line__print(struct disasm_line *dl, u64 start, int addr_fmt_width)
1321 s64 offset = dl->al.offset;
1322 const u64 addr = start + offset;
1323 struct block_range *br;
1325 br = block_range__find(addr);
1326 color_fprintf(stdout, annotate__address_color(br), " %*" PRIx64 ":", addr_fmt_width, addr);
1327 color_fprintf(stdout, annotate__asm_color(br), "%s", dl->al.line);
1328 annotate__branch_printf(br, addr);
/*
 * Print one annotation line to stdout.
 *
 * Disassembly lines (offset != -1) get one column per event showing the
 * period, sample count or percentage (depending on symbol_conf), followed
 * by the disassembly itself; lines below @min_pcnt are skipped and
 * @max_lines caps the output.  Other lines are printed as plain text
 * aligned under the percentage columns.
 */
1333 annotation_line__print(struct annotation_line *al, struct symbol *sym, u64 start,
1334 struct perf_evsel *evsel, u64 len, int min_pcnt, int printed,
1335 int max_lines, struct annotation_line *queue, int addr_fmt_width,
1338 struct disasm_line *dl = container_of(al, struct disasm_line, al);
/* Remembered across calls so a repeated file:line is not printed twice. */
1339 static const char *prev_line;
1340 static const char *prev_color;
1342 if (al->offset != -1) {
1343 double max_percent = 0.0;
1344 int i, nr_percent = 1;
1346 struct annotation *notes = symbol__annotation(sym);
/* Find the largest percentage among this line's per-event data. */
1348 for (i = 0; i < al->data_nr; i++) {
1351 percent = annotation_data__percent(&al->data[i],
1354 if (percent > max_percent)
1355 max_percent = percent;
1358 if (al->data_nr > nr_percent)
1359 nr_percent = al->data_nr;
/* Below the requested minimum percentage. */
1361 if (max_percent < min_pcnt)
1364 if (max_lines && printed >= max_lines)
/*
 * Print the queued context lines first.
 * NOTE(review): "¬es" below is an encoding artefact of "&notes".
 */
1367 if (queue != NULL) {
1368 list_for_each_entry_from(queue, ¬es->src->source, node) {
1371 annotation_line__print(queue, sym, start, evsel, len,
1372 0, 0, 1, NULL, addr_fmt_width,
1377 color = get_percent_color(max_percent);
1380 * Also color the filename and line if needed, with
1381 * the same color than the percentage. Don't print it
1382 * twice for close colored addr with the same filename:line
1385 if (!prev_line || strcmp(prev_line, al->path)
1386 || color != prev_color) {
1387 color_fprintf(stdout, color, " %s", al->path);
1388 prev_line = al->path;
/* One column per event. */
1393 for (i = 0; i < nr_percent; i++) {
1394 struct annotation_data *data = &al->data[i];
1397 percent = annotation_data__percent(data, percent_type);
1398 color = get_percent_color(percent);
1400 if (symbol_conf.show_total_period)
1401 color_fprintf(stdout, color, " %11" PRIu64,
1403 else if (symbol_conf.show_nr_samples)
1404 color_fprintf(stdout, color, " %7" PRIu64,
1405 data->he.nr_samples);
1407 color_fprintf(stdout, color, " %7.2f", percent);
1412 disasm_line__print(dl, start, addr_fmt_width);
1414 } else if (max_lines && printed >= max_lines)
/* Non-disassembly line: pad to the width of the percentage columns. */
1417 int width = symbol_conf.show_total_period ? 12 : 8;
1422 if (perf_evsel__is_group_event(evsel))
1423 width *= evsel->nr_members;
1426 printf(" %*s:\n", width, " ");
1428 printf(" %*s: %*s %s\n", width, " ", addr_fmt_width, " ", al->line);
1435 * symbol__parse_objdump_line() parses objdump output (with -d --no-show-raw)
1436 * which looks like following
1438 * 0000000000415500 <_init>:
1439 * 415500: sub $0x8,%rsp
1440 * 415504: mov 0x2f5ad5(%rip),%rax # 70afe0 <_DYNAMIC+0x2f8>
1441 * 41550b: test %rax,%rax
1442 * 41550e: je 415515 <_init+0x15>
1443 * 415510: callq 416e70 <__gmon_start__@plt>
1444 * 415515: add $0x8,%rsp
1447 * it will be parsed and saved into struct disasm_line as
1448 * <offset> <name> <ops.raw>
1450 * The offset will be a relative offset from the start of the symbol and -1
1451 * means that it's not a disassembly line so should be treated differently.
1452 * The ops.raw part will be parsed further according to type of the instruction.
/*
 * Read one line of objdump output from @file and turn it into a
 * disasm_line appended to the symbol's annotation source list.
 *
 * "/file:line" marker lines only update *line_nr.  Lines that start with a
 * hex address followed by ':' become disassembly lines whose offset is
 * relative to the symbol start; the offset stays -1 for everything else.
 */
1454 static int symbol__parse_objdump_line(struct symbol *sym, FILE *file,
1455 struct annotate_args *args,
1458 struct map *map = args->ms.map;
1459 struct annotation *notes = symbol__annotation(sym);
1460 struct disasm_line *dl;
1461 char *line = NULL, *parsed_line, *tmp, *tmp2;
1463 s64 line_ip, offset = -1;
1464 regmatch_t match[2];
1466 if (getline(&line, &line_len, file) < 0)
1473 parsed_line = rtrim(line);
1475 /* /filename:linenr ? Save line number and ignore. */
1476 if (regexec(&file_lineno, parsed_line, 2, match, 0) == 0) {
1477 *line_nr = atoi(parsed_line + match[1].rm_so);
1481 tmp = ltrim(parsed_line);
1484 * Parse hexa addresses followed by ':'
1486 line_ip = strtoull(tmp, &tmp2, 16);
/* Not "<hex>:" followed by more text. */
1487 if (*tmp2 != ':' || tmp == tmp2 || tmp2[1] == '\0')
1491 if (line_ip != -1) {
1492 u64 start = map__rip_2objdump(map, sym->start),
1493 end = map__rip_2objdump(map, sym->end);
1495 offset = line_ip - start;
/* Address outside the symbol being annotated. */
1496 if ((u64)line_ip < start || (u64)line_ip >= end)
/* The text to keep starts right after the ':'. */
1499 parsed_line = tmp2 + 1;
1502 args->offset = offset;
1503 args->line = parsed_line;
1504 args->line_nr = *line_nr;
1507 dl = disasm_line__new(args);
/* Derive the target offset from the target address and the symbol start. */
1514 if (!disasm_line__has_local_offset(dl)) {
1515 dl->ops.target.offset = dl->ops.target.addr -
1516 map__rip_2objdump(map, sym->start);
1517 dl->ops.target.offset_avail = true;
1520 /* kcore has no symbols, so add the call target symbol */
1521 if (dl->ins.ops && ins__is_call(&dl->ins) && !dl->ops.target.sym) {
1522 struct addr_map_symbol target = {
1524 .addr = dl->ops.target.addr,
/* Accept the symbol only when the call lands exactly on its start. */
1527 if (!map_groups__find_ams(&target) &&
1528 target.sym->start == target.al_addr)
1529 dl->ops.target.sym = target.sym;
/* NOTE(review): "¬es" below is an encoding artefact of "&notes". */
1532 annotation_line__add(&dl->al, ¬es->src->source);
/*
 * Constructor-attribute function that compiles the file_lineno regex.
 * The pattern matches a line starting with '/', followed by one or more
 * non-':' characters, a ':' and a captured run of decimal digits.
 * The regcomp() result is not checked here.
 */
1537 static __attribute__((constructor)) void symbol__init_regexpr(void)
1539 regcomp(&file_lineno, "^/[^:]+:([0-9]+)", REG_EXTENDED);
/*
 * Walk the symbol's annotation source list from its tail, unlinking and
 * freeing entries with list_del() + disasm_line__free().
 *
 * The visible checks compare the last entry's ins.ops against nop_ops and
 * search its text for " nop ", " nopl " and " nopw ".
 * NOTE(review): the statements guarded by those checks are not visible in
 * this listing; presumably they stop the loop at the first non-nop line.
 * NOTE(review): '¬es' below looks like a mis-encoded '&notes' - confirm.
 */
1542 static void delete_last_nop(struct symbol *sym)
1544 struct annotation *notes = symbol__annotation(sym);
1545 struct list_head *list = ¬es->src->source;
1546 struct disasm_line *dl;
1548 while (!list_empty(list)) {
/* list->prev is the current tail of the list. */
1549 dl = list_entry(list->prev, struct disasm_line, al.node);
1552 if (dl->ins.ops != &nop_ops)
1555 if (!strstr(dl->al.line, " nop ") &&
1556 !strstr(dl->al.line, " nopl ") &&
1557 !strstr(dl->al.line, " nopw "))
1561 list_del(&dl->al.node);
1562 disasm_line__free(dl);
/*
 * Format a human-readable message for disassembly error 'errnum' into
 * 'buf' (capacity 'buflen', which must be non-zero - enforced by BUG_ON).
 *
 * Visible cases: str_error_r() is used for one class of codes,
 * SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX gets a dedicated hint text, and an
 * "Internal error" message covers unknown codes.
 * NOTE(review): the switch/if structure and the return statement are not
 * visible in this listing.
 */
1566 int symbol__strerror_disassemble(struct symbol *sym __maybe_unused, struct map *map,
1567 int errnum, char *buf, size_t buflen)
1569 struct dso *dso = map->dso;
1571 BUG_ON(buflen == 0);
1574 str_error_r(errnum, buf, buflen);
1579 case SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX: {
/* 15 is the length of the " with build id " prefix stored in bf. */
1580 char bf[SBUILD_ID_SIZE + 15] = " with build id ";
1581 char *build_id_msg = NULL;
1583 if (dso->has_build_id) {
/* The build id text is written right after the prefix. */
1584 build_id__sprintf(dso->build_id,
1585 sizeof(dso->build_id), bf + 15);
1588 scnprintf(buf, buflen,
1589 "No vmlinux file%s\nwas found in the path.\n\n"
1590 "Note that annotation using /proc/kcore requires CAP_SYS_RAWIO capability.\n\n"
1592 " perf buildid-cache -vu vmlinux\n\n"
1594 " --vmlinux vmlinux\n", build_id_msg ?: "");
1598 scnprintf(buf, buflen, "Internal error: Invalid %d error code\n", errnum);
/*
 * Work out which file should be disassembled for 'dso' and write its path
 * into 'filename' (capacity 'filename_size').
 *
 * Returns SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX when the dso's symtab type is
 * kallsyms and it is not kcore.  Otherwise the build-id cache file name is
 * tried first, with dso->long_name as the fallback.
 * NOTE(review): the remaining return statements are not visible in this
 * listing.
 */
1605 static int dso__disassemble_filename(struct dso *dso, char *filename, size_t filename_size)
1607 char linkname[PATH_MAX];
1608 char *build_id_filename;
1609 char *build_id_path = NULL;
1612 if (dso->symtab_type == DSO_BINARY_TYPE__KALLSYMS &&
1613 !dso__is_kcore(dso))
1614 return SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX;
1616 build_id_filename = dso__build_id_filename(dso, NULL, 0, false);
1617 if (build_id_filename) {
1618 __symbol__join_symfs(filename, filename_size, build_id_filename);
1619 free(build_id_filename);
1621 if (dso->has_build_id)
/* Work on a private copy: the path may be modified by dirname() below. */
1626 build_id_path = strdup(filename);
1631 * old style build-id cache has name of XX/XXXXXXX.. while
1632 * new style has XX/XXXXXXX../{elf,kallsyms,vdso}.
1633 * extract the build-id part of dirname in the new style only.
1635 pos = strrchr(build_id_path, '/');
1636 if (pos && strlen(pos) < SBUILD_ID_SIZE - 2)
1637 dirname(build_id_path);
/*
 * Use dso->long_name when the dso is kcore, readlink() on the build-id path
 * fails, the link target mentions kallsyms, or 'filename' is not readable.
 */
1639 if (dso__is_kcore(dso) ||
1640 readlink(build_id_path, linkname, sizeof(linkname)) < 0 ||
1641 strstr(linkname, DSO__NAME_KALLSYMS) ||
1642 access(filename, R_OK)) {
1645 * If we don't have build-ids or the build-id file isn't in the
1646 * cache, or is just a kallsyms file, well, lets hope that this
1647 * DSO is the same as when 'perf record' ran.
1649 __symbol__join_symfs(filename, filename_size, dso->long_name);
1652 free(build_id_path);
/*
 * Disassemble 'sym' by running objdump through "/bin/sh -c" and feeding
 * each line of its output to symbol__parse_objdump_line().
 *
 * Visible steps: resolve the file name with dso__disassemble_filename(),
 * optionally extract a kcore range or decompress a kernel module, build
 * the shell command with asprintf(), create a pipe, run the command with
 * its stdout connected to the pipe, parse the output, then clean up.
 *
 * NOTE(review): many lines (the fork() call, error checks, labels and
 * return statements) are not visible in this listing.
 * NOTE(review): symfs_filename is interpolated inside double quotes into a
 * command run by the shell; file names containing shell metacharacters
 * would be interpreted by the shell - worth confirming this is acceptable.
 */
1656 static int symbol__disassemble(struct symbol *sym, struct annotate_args *args)
1658 struct annotation_options *opts = args->options;
1659 struct map *map = args->ms.map;
1660 struct dso *dso = map->dso;
1663 char symfs_filename[PATH_MAX];
1664 struct kcore_extract kce;
1665 bool delete_extract = false;
1666 bool decomp = false;
1671 int err = dso__disassemble_filename(dso, symfs_filename, sizeof(symfs_filename));
1676 pr_debug("%s: filename=%s, sym=%s, start=%#" PRIx64 ", end=%#" PRIx64 "\n", __func__,
1677 symfs_filename, sym->name, map->unmap_ip(map, sym->start),
1678 map->unmap_ip(map, sym->end));
1680 pr_debug("annotating [%p] %30s : [%p] %30s\n",
1681 dso, dso->long_name, sym, sym->name);
/*
 * kcore: extract the symbol's range and, when that succeeds, disassemble
 * the extracted file instead.
 */
1683 if (dso__is_kcore(dso)) {
1684 kce.kcore_filename = symfs_filename;
1685 kce.addr = map__rip_2objdump(map, sym->start);
1686 kce.offs = sym->start;
1687 kce.len = sym->end - sym->start;
1688 if (!kcore_extract__create(&kce)) {
1689 delete_extract = true;
1690 strlcpy(symfs_filename, kce.extract_filename,
1691 sizeof(symfs_filename));
1693 } else if (dso__needs_decompress(dso)) {
1694 char tmp[KMOD_DECOMP_LEN];
1696 if (dso__decompress_kmodule_path(dso, symfs_filename,
1697 tmp, sizeof(tmp)) < 0)
1701 strcpy(symfs_filename, tmp);
/*
 * Build the shell pipeline: objdump restricted to the symbol's start/stop
 * addresses, with lines containing "<file name>:" removed by grep and the
 * result passed through expand.
 */
1704 err = asprintf(&command,
1705 "%s %s%s --start-address=0x%016" PRIx64
1706 " --stop-address=0x%016" PRIx64
1707 " -l -d %s %s -C \"%s\" 2>/dev/null|grep -v \"%s:\"|expand",
1708 opts->objdump_path ?: "objdump",
1709 opts->disassembler_style ? "-M " : "",
1710 opts->disassembler_style ?: "",
1711 map__rip_2objdump(map, sym->start),
1712 map__rip_2objdump(map, sym->end),
1713 opts->show_asm_raw ? "" : "--no-show-raw",
1714 opts->annotate_src ? "-S" : "",
1715 symfs_filename, symfs_filename);
1718 pr_err("Failure allocating memory for the command to run\n");
1719 goto out_remove_tmp;
1722 pr_debug("Executing: %s\n", command);
1725 if (pipe(stdout_fd) < 0) {
1726 pr_err("Failure creating the pipe to run %s\n", command);
1727 goto out_free_command;
1732 pr_err("Failure forking to run %s\n", command);
1733 goto out_close_stdout;
/*
 * Presumably the child side of the fork: stdout is redirected to the
 * pipe's write end before the shell is exec'ed.
 */
1737 close(stdout_fd[0]);
1738 dup2(stdout_fd[1], 1);
1739 close(stdout_fd[1]);
1740 execl("/bin/sh", "sh", "-c", command, NULL);
/* The write end is closed here; the read end is wrapped in a FILE below. */
1745 close(stdout_fd[1]);
1747 file = fdopen(stdout_fd[0], "r");
1749 pr_err("Failure creating FILE stream for %s\n", command);
1751 * If we were using debug info should retry with
1754 goto out_free_command;
1758 while (!feof(file)) {
1760 * The source code line number (lineno) needs to be kept in
1761 * accross calls to symbol__parse_objdump_line(), so that it
1762 * can associate it with the instructions till the next one.
1763 * See disasm_line__new() and struct disasm_line::line_nr.
1765 if (symbol__parse_objdump_line(sym, file, args, &lineno) < 0)
1771 pr_err("No output from %s\n", command);
1774 * kallsyms does not have symbol sizes so there may a nop at the end.
1777 if (dso__is_kcore(dso))
1778 delete_last_nop(sym);
1785 close(stdout_fd[0]);
1788 unlink(symfs_filename);
1791 kcore_extract__delete(&kce);
1796 close(stdout_fd[1]);
1797 goto out_free_command;
/*
 * Accumulate nr_samples and period from sym_hist->addr[] while
 * offset < end, then store into 'data' the totals and the four percentages
 * (hits/period, local/global).
 *
 * Each percentage assignment sits under a check that its denominator is
 * non-zero (sym_hist->nr_samples, hists->stats.nr_non_filtered_samples,
 * sym_hist->period, hists->stats.total_period).
 * NOTE(review): the loop increment and the declaration of 'period' are not
 * visible in this listing.
 */
1800 static void calc_percent(struct sym_hist *sym_hist,
1801 struct hists *hists,
1802 struct annotation_data *data,
1803 s64 offset, s64 end)
1805 unsigned int hits = 0;
1808 while (offset < end) {
1809 hits += sym_hist->addr[offset].nr_samples;
1810 period += sym_hist->addr[offset].period;
1814 if (sym_hist->nr_samples) {
1815 data->he.period = period;
1816 data->he.nr_samples = hits;
/* Local: relative to this symbol's own histogram totals. */
1817 data->percent[PERCENT_HITS_LOCAL] = 100.0 * hits / sym_hist->nr_samples;
/* Global: relative to the totals kept in hists->stats. */
1820 if (hists->stats.nr_non_filtered_samples)
1821 data->percent[PERCENT_HITS_GLOBAL] = 100.0 * hits / hists->stats.nr_non_filtered_samples;
1823 if (sym_hist->period)
1824 data->percent[PERCENT_PERIOD_LOCAL] = 100.0 * period / sym_hist->period;
1826 if (hists->stats.total_period)
1827 data->percent[PERCENT_PERIOD_GLOBAL] = 100.0 * period / hists->stats.total_period;
/*
 * For each annotation line, call calc_percent() once per event in the
 * group led by 'leader', covering the range from the line's offset up to
 * the next line's offset (or 'len' when there is no next line).
 *
 * NOTE(review): the statement guarded by the 'al->offset == -1' test and
 * the declarations of 'i' and 'end' are not visible in this listing.
 * NOTE(review): '¬es' below looks like a mis-encoded '&notes' - confirm.
 */
1830 static void annotation__calc_percent(struct annotation *notes,
1831 struct perf_evsel *leader, s64 len)
1833 struct annotation_line *al, *next;
1834 struct perf_evsel *evsel;
1836 list_for_each_entry(al, ¬es->src->source, node) {
1840 if (al->offset == -1)
1843 next = annotation_line__next(al, ¬es->src->source);
1844 end = next ? next->offset : len;
1846 for_each_group_evsel(evsel, leader) {
1847 struct hists *hists = evsel__hists(evsel);
1848 struct annotation_data *data;
1849 struct sym_hist *sym_hist;
/* al->data[] must have one slot per event in the group. */
1851 BUG_ON(i >= al->data_nr);
1853 sym_hist = annotation__histogram(notes, evsel->idx);
1854 data = &al->data[i++];
1856 calc_percent(sym_hist, hists, data, al->offset, end);
/*
 * Compute the percentages for every annotation line of 'sym' by calling
 * annotation__calc_percent() with the symbol's annotation and size.
 */
1861 void symbol__calc_percent(struct symbol *sym, struct perf_evsel *evsel)
1863 struct annotation *notes = symbol__annotation(sym);
1865 annotation__calc_percent(notes, evsel, symbol__size(sym));
/*
 * Prepare an annotate_args structure for 'sym' and disassemble it.
 *
 * The architecture is looked up with arch__find() from the evsel's perf
 * environment, its init() hook is called with the environment's cpuid (or
 * NULL when there is no environment), and the result of
 * symbol__disassemble() is returned.
 * NOTE(review): the remaining initializers of 'args', the error checks and
 * the use of 'parch' are not visible in this listing.
 */
1868 int symbol__annotate(struct symbol *sym, struct map *map,
1869 struct perf_evsel *evsel, size_t privsize,
1870 struct annotation_options *options,
1871 struct arch **parch)
1873 struct annotate_args args = {
1874 .privsize = privsize,
1878 struct perf_env *env = perf_evsel__env(evsel);
1879 const char *arch_name = perf_env__arch(env);
1886 args.arch = arch = arch__find(arch_name);
1894 err = arch->init(arch, env ? env->cpuid : NULL);
1896 pr_err("%s: failed to initialize %s arch priv area\n", __func__, arch->name);
1904 return symbol__disassemble(sym, &args);
/*
 * Insert 'al' into the rb-tree 'root', comparing entries by path with
 * strcmp().
 *
 * While descending, the visible code adds al's percentages (of type
 * opts->percent_type) to an existing node's percent_sum; presumably this
 * happens when the paths compare equal, but that condition is not visible
 * in this listing.  When a new node is linked, its percent_sum values are
 * initialised from its own percentages.
 */
1907 static void insert_source_line(struct rb_root *root, struct annotation_line *al,
1908 struct annotation_options *opts)
1910 struct annotation_line *iter;
1911 struct rb_node **p = &root->rb_node;
1912 struct rb_node *parent = NULL;
1915 while (*p != NULL) {
1917 iter = rb_entry(parent, struct annotation_line, rb_node);
1919 ret = strcmp(iter->path, al->path);
1921 for (i = 0; i < al->data_nr; i++) {
1922 iter->data[i].percent_sum += annotation_data__percent(&al->data[i],
1923 opts->percent_type);
1931 p = &(*p)->rb_right;
1934 for (i = 0; i < al->data_nr; i++) {
1935 al->data[i].percent_sum = annotation_data__percent(&al->data[i],
1936 opts->percent_type);
1939 rb_link_node(&al->rb_node, parent, p);
1940 rb_insert_color(&al->rb_node, root);
/*
 * Compare two annotation lines by their per-event percent_sum values.
 * At an index where the sums differ, the result is non-zero when a's sum
 * is greater than b's.
 * NOTE(review): what happens for equal sums, and the final return, are not
 * visible in this listing.
 */
1943 static int cmp_source_line(struct annotation_line *a, struct annotation_line *b)
1947 for (i = 0; i < a->data_nr; i++) {
1948 if (a->data[i].percent_sum == b->data[i].percent_sum)
1950 return a->data[i].percent_sum > b->data[i].percent_sum;
/*
 * Insert 'al' into the rb-tree 'root', using cmp_source_line() against
 * each visited node to choose the branch to descend.
 * NOTE(review): the left-branch assignment is not visible in this listing.
 */
1956 static void __resort_source_line(struct rb_root *root, struct annotation_line *al)
1958 struct annotation_line *iter;
1959 struct rb_node **p = &root->rb_node;
1960 struct rb_node *parent = NULL;
1962 while (*p != NULL) {
1964 iter = rb_entry(parent, struct annotation_line, rb_node);
1966 if (cmp_source_line(al, iter))
1969 p = &(*p)->rb_right;
1972 rb_link_node(&al->rb_node, parent, p);
1973 rb_insert_color(&al->rb_node, root);
/*
 * Move annotation lines from 'src_root' into 'dest_root': each node is
 * erased from the source tree and re-inserted with __resort_source_line().
 * NOTE(review): the loop header and the advance to 'next' are not visible
 * in this listing.
 */
1976 static void resort_source_line(struct rb_root *dest_root, struct rb_root *src_root)
1978 struct annotation_line *al;
1979 struct rb_node *node;
1981 node = rb_first(src_root);
1983 struct rb_node *next;
1985 al = rb_entry(node, struct annotation_line, rb_node);
/* Fetch the successor before the node is erased from the source tree. */
1986 next = rb_next(node);
1987 rb_erase(node, src_root);
1989 __resort_source_line(dest_root, al);
/*
 * Print the "Sorted summary" for 'filename' to stdout: for each node of
 * 'root', one coloured percent_sum column per event followed by a path,
 * coloured according to the largest of those percentages.
 * An empty tree prints a "Nothing higher than" line instead.
 * NOTE(review): the loop header and the assignment of 'path' are not
 * visible in this listing.
 */
1994 static void print_summary(struct rb_root *root, const char *filename)
1996 struct annotation_line *al;
1997 struct rb_node *node;
1999 printf("\nSorted summary for file %s\n", filename);
2000 printf("----------------------------------------------\n\n");
2002 if (RB_EMPTY_ROOT(root)) {
2003 printf(" Nothing higher than %1.1f%%\n", MIN_GREEN);
2007 node = rb_first(root);
2009 double percent, percent_max = 0.0;
2014 al = rb_entry(node, struct annotation_line, rb_node);
2015 for (i = 0; i < al->data_nr; i++) {
2016 percent = al->data[i].percent_sum;
2017 color = get_percent_color(percent);
2018 color_fprintf(stdout, color, " %7.2f", percent);
2020 if (percent > percent_max)
2021 percent_max = percent;
2025 color = get_percent_color(percent_max);
2026 color_fprintf(stdout, color, " %s\n", path);
2028 node = rb_next(node);
/*
 * Print, for every offset of 'sym' with a non-zero sample count in the
 * histogram of 'evsel', the address (sym->start + offset) in hex and the
 * count, followed by a final line with the histogram's total nr_samples.
 */
2032 static void symbol__annotate_hits(struct symbol *sym, struct perf_evsel *evsel)
2034 struct annotation *notes = symbol__annotation(sym);
2035 struct sym_hist *h = annotation__histogram(notes, evsel->idx);
2036 u64 len = symbol__size(sym), offset;
2038 for (offset = 0; offset < len; ++offset)
2039 if (h->addr[offset].nr_samples != 0)
2040 printf("%*" PRIx64 ": %" PRIu64 "\n", BITS_PER_LONG / 2,
2041 sym->start + offset, h->addr[offset].nr_samples);
2042 printf("%*s: %" PRIu64 "\n", BITS_PER_LONG / 2, "h->nr_samples", h->nr_samples);
/*
 * Walk 'lines' from the tail and, at the first entry whose offset is not
 * -1, return what scnprintf() reports for 'start + offset' formatted in
 * hex, i.e. the width of that address.
 * NOTE(review): the declaration of 'bf' and the return used when no such
 * line exists are not visible in this listing.
 */
2045 static int annotated_source__addr_fmt_width(struct list_head *lines, u64 start)
2048 struct annotation_line *line;
2050 list_for_each_entry_reverse(line, lines, node) {
2051 if (line->offset != -1)
2052 return scnprintf(bf, sizeof(bf), "%" PRIx64, start + line->offset);
/*
 * Print the annotation of 'sym' for 'evsel' to stdout: a header line
 * naming the file, event, sample count and percent type, a dotted
 * separator, and then each annotation line via annotation_line__print().
 *
 * The column width is 12 when symbol_conf.show_total_period is set and 8
 * otherwise, multiplied by the number of group members for group events.
 * When opts->context is non-zero a 'queue' pointer tracks preceding lines.
 * NOTE(review): large parts of the loop body (the switch on 'err', the
 * queue bookkeeping) and the return value are not visible in this listing.
 * NOTE(review): '¬es' below looks like a mis-encoded '&notes' - confirm.
 */
2058 int symbol__annotate_printf(struct symbol *sym, struct map *map,
2059 struct perf_evsel *evsel,
2060 struct annotation_options *opts)
2062 struct dso *dso = map->dso;
2064 const char *d_filename;
2065 const char *evsel_name = perf_evsel__name(evsel);
2066 struct annotation *notes = symbol__annotation(sym);
2067 struct sym_hist *h = annotation__histogram(notes, evsel->idx);
2068 struct annotation_line *pos, *queue = NULL;
2069 u64 start = map__rip_2objdump(map, sym->start);
2070 int printed = 2, queue_len = 0, addr_fmt_width;
2072 bool context = opts->context;
2074 int width = symbol_conf.show_total_period ? 12 : 8;
2075 int graph_dotted_len;
/* Private copy of the name: basename() below is applied to it. */
2078 filename = strdup(dso->long_name);
2082 if (opts->full_path)
2083 d_filename = filename;
2085 d_filename = basename(filename);
2087 len = symbol__size(sym);
2089 if (perf_evsel__is_group_event(evsel)) {
2090 width *= evsel->nr_members;
2091 perf_evsel__group_desc(evsel, buf, sizeof(buf));
/* The header's printed length sizes the dotted separator below. */
2095 graph_dotted_len = printf(" %-*.*s| Source code & Disassembly of %s for %s (%" PRIu64 " samples, "
2097 width, width, symbol_conf.show_total_period ? "Period" :
2098 symbol_conf.show_nr_samples ? "Samples" : "Percent",
2099 d_filename, evsel_name, h->nr_samples,
2100 percent_type_str(opts->percent_type));
2102 printf("%-*.*s----\n",
2103 graph_dotted_len, graph_dotted_len, graph_dotted_line);
2106 symbol__annotate_hits(sym, evsel);
2108 addr_fmt_width = annotated_source__addr_fmt_width(¬es->src->source, start);
2110 list_for_each_entry(pos, ¬es->src->source, node) {
2113 if (context && queue == NULL) {
2118 err = annotation_line__print(pos, sym, start, evsel, len,
2119 opts->min_pcnt, printed, opts->max_lines,
2120 queue, addr_fmt_width, opts->percent_type);
2126 printed += queue_len;
2132 /* filtered by max_lines */
2138 * Filtered by min_pcnt or non IP lines when
2143 if (queue_len == context)
2144 queue = list_entry(queue->node.next, typeof(*queue), node);
/*
 * set_percent_color callback installed in the annotation_write_ops used by
 * symbol__annotate_fprintf2().  Every parameter is marked __maybe_unused.
 * NOTE(review): the body is not visible in this listing.
 */
2156 static void FILE__set_percent_color(void *fp __maybe_unused,
2157 double percent __maybe_unused,
2158 bool current __maybe_unused)
/*
 * set_jumps_percent_color callback installed in the annotation_write_ops
 * used by symbol__annotate_fprintf2().  Every parameter is marked
 * __maybe_unused.
 * NOTE(review): the body and return value are not visible in this listing.
 */
2162 static int FILE__set_jumps_percent_color(void *fp __maybe_unused,
2163 int nr __maybe_unused, bool current __maybe_unused)
/*
 * set_color callback installed in the annotation_write_ops used by
 * symbol__annotate_fprintf2().  Both parameters are marked __maybe_unused.
 * NOTE(review): the body and return value are not visible in this listing.
 */
2168 static int FILE__set_color(void *fp __maybe_unused, int color __maybe_unused)
/*
 * printf callback for annotation_write_ops: forwards the format string and
 * variable arguments to vfprintf() on 'fp'.
 */
2173 static void FILE__printf(void *fp, const char *fmt, ...)
2177 va_start(args, fmt);
2178 vfprintf(fp, fmt, args);
/*
 * write_graph callback for annotation_write_ops: maps the *ARROW_CHAR
 * codes to the corresponding UTF-8 arrow strings, with "?" for any other
 * value.
 * NOTE(review): the statement that emits 's' is not visible in this
 * listing.
 */
2182 static void FILE__write_graph(void *fp, int graph)
2187 case DARROW_CHAR: s = "↓"; break;
2188 case UARROW_CHAR: s = "↑"; break;
2189 case LARROW_CHAR: s = "←"; break;
2190 case RARROW_CHAR: s = "→"; break;
2191 default: s = "?"; break;
/*
 * Write the annotation of 'sym' to 'fp' using the FILE__* callbacks: each
 * annotation line is first passed to annotation_line__filter() and then
 * written with annotation_line__write().
 * NOTE(review): some initializers of 'wops', the statement guarded by the
 * filter test and the return value are not visible in this listing.
 * NOTE(review): '¬es' below looks like a mis-encoded '&notes' - confirm.
 */
2197 static int symbol__annotate_fprintf2(struct symbol *sym, FILE *fp,
2198 struct annotation_options *opts)
2200 struct annotation *notes = symbol__annotation(sym);
2201 struct annotation_write_ops wops = {
2204 .set_color = FILE__set_color,
2205 .set_percent_color = FILE__set_percent_color,
2206 .set_jumps_percent_color = FILE__set_jumps_percent_color,
2207 .printf = FILE__printf,
2208 .write_graph = FILE__write_graph,
2210 struct annotation_line *al;
2212 list_for_each_entry(al, ¬es->src->source, node) {
2213 if (annotation_line__filter(al, notes))
2215 annotation_line__write(al, notes, &wops, opts);
/* Cleared after a line has been written. */
2217 wops.first_line = false;
/*
 * Dump the annotation of ms->sym to a file named "<symbol name>.annotation"
 * opened for writing: a header with the symbol name, the dso's long name
 * and the event name, followed by the output of
 * symbol__annotate_fprintf2().
 * NOTE(review): error handling, the fclose()/free() calls and the return
 * value are not visible in this listing.
 */
2223 int map_symbol__annotation_dump(struct map_symbol *ms, struct perf_evsel *evsel,
2224 struct annotation_options *opts)
2226 const char *ev_name = perf_evsel__name(evsel);
2232 if (asprintf(&filename, "%s.annotation", ms->sym->name) < 0)
2235 fp = fopen(filename, "w");
2237 goto out_free_filename;
2239 if (perf_evsel__is_group_event(evsel)) {
2240 perf_evsel__group_desc(evsel, buf, sizeof(buf));
2244 fprintf(fp, "%s() %s\nEvent: %s\n\n",
2245 ms->sym->name, ms->map->dso->long_name, ev_name);
2246 symbol__annotate_fprintf2(ms->sym, fp, opts);
/*
 * Zero the histogram of 'sym' for event index 'evidx'; the number of bytes
 * cleared is notes->src->sizeof_sym_hist.
 */
2255 void symbol__annotate_zero_histogram(struct symbol *sym, int evidx)
2257 struct annotation *notes = symbol__annotation(sym);
2258 struct sym_hist *h = annotation__histogram(notes, evidx);
2260 memset(h, 0, notes->src->sizeof_sym_hist);
/*
 * Decay the histogram of 'sym' for event index 'evidx': every per-offset
 * sample count is scaled by 7/8 (integer arithmetic) and the scaled
 * counts are added to h->nr_samples.
 * NOTE(review): any reset of h->nr_samples before the loop is not visible
 * in this listing.
 */
2263 void symbol__annotate_decay_histogram(struct symbol *sym, int evidx)
2265 struct annotation *notes = symbol__annotation(sym);
2266 struct sym_hist *h = annotation__histogram(notes, evidx);
2267 int len = symbol__size(sym), offset;
2270 for (offset = 0; offset < len; ++offset) {
2271 h->addr[offset].nr_samples = h->addr[offset].nr_samples * 7 / 8;
2272 h->nr_samples += h->addr[offset].nr_samples;
/*
 * Remove every annotation line from as->source and free it with
 * disasm_line__free().  The _safe list iterator is used because entries
 * are unlinked while iterating.
 */
2276 void annotated_source__purge(struct annotated_source *as)
2278 struct annotation_line *al, *n;
2280 list_for_each_entry_safe(al, n, &as->source, node) {
2281 list_del(&al->node);
2282 disasm_line__free(disasm_line(al));
/*
 * Print one disasm_line to 'fp' and return the number of characters
 * printed.  Lines with offset -1 are printed verbatim; other lines print
 * the offset in hex and the instruction name, plus extra output when
 * ops.raw is non-empty.
 * NOTE(review): the last argument of the ops.raw fprintf() and the
 * declaration of 'printed' are not visible in this listing.
 */
2286 static size_t disasm_line__fprintf(struct disasm_line *dl, FILE *fp)
2290 if (dl->al.offset == -1)
2291 return fprintf(fp, "%s\n", dl->al.line);
2293 printed = fprintf(fp, "%#" PRIx64 " %s", dl->al.offset, dl->ins.name);
2295 if (dl->ops.raw[0] != '\0') {
2296 printed += fprintf(fp, "%.*s %s\n", 6 - (int)printed, " ",
2300 return printed + fprintf(fp, "\n");
/*
 * Print every disasm_line on the list 'head' to 'fp' with
 * disasm_line__fprintf(), accumulating the character counts in 'printed'.
 * NOTE(review): the declaration of 'printed' and the return statement are
 * not visible in this listing.
 */
2303 size_t disasm__fprintf(struct list_head *head, FILE *fp)
2305 struct disasm_line *pos;
2308 list_for_each_entry(pos, head, al.node)
2309 printed += disasm_line__fprintf(pos, fp);
/*
 * Test whether 'dl' is a jump whose target lies inside 'sym'.
 *
 * The visible condition is true when dl is NULL, has no ins.ops, is not a
 * jump, has no local offset, or its target offset falls outside
 * [0, symbol__size(sym)).
 * NOTE(review): the return statements are not visible in this listing;
 * presumably false is returned when that condition holds.
 */
2314 bool disasm_line__is_valid_local_jump(struct disasm_line *dl, struct symbol *sym)
2316 if (!dl || !dl->ins.ops || !ins__is_jump(&dl->ins) ||
2317 !disasm_line__has_local_offset(dl) || dl->ops.target.offset < 0 ||
2318 dl->ops.target.offset >= (s64)symbol__size(sym))
/*
 * For every offset of 'sym', look up the line in notes->offsets[], check
 * it with disasm_line__is_valid_local_jump() and, for the line found at
 * the jump's target offset, increment jump_sources, keeping
 * notes->max_jump_sources at the largest count seen.
 *
 * Symbols whose name contains "@plt" get special handling up front.
 * NOTE(review): the statements guarded by the "@plt" and validity tests,
 * and any NULL check on the target line, are not visible in this listing.
 */
2324 void annotation__mark_jump_targets(struct annotation *notes, struct symbol *sym)
2326 u64 offset, size = symbol__size(sym);
2328 /* PLT symbols contain external offsets */
2329 if (strstr(sym->name, "@plt"))
2332 for (offset = 0; offset < size; ++offset) {
2333 struct annotation_line *al = notes->offsets[offset];
2334 struct disasm_line *dl;
2336 dl = disasm_line(al);
2338 if (!disasm_line__is_valid_local_jump(dl, sym))
/* From here on 'al' refers to the jump target, not the jump itself. */
2341 al = notes->offsets[dl->ops.target.offset];
2344 * FIXME: Oops, no jump target? Buggy disassembler? Or do we
2345 * have to adjust to the previous offset?
2350 if (++al->jump_sources > notes->max_jump_sources)
2351 notes->max_jump_sources = al->jump_sources;
/*
 * Walk all annotation lines to number them and index them by offset:
 *  - notes->max_line_len becomes the longest line length,
 *  - al->idx is assigned from notes->nr_entries,
 *  - lines with an offset also get al->idx_asm from notes->nr_asm_entries
 *    and, when the offset is below 'size', are stored in notes->offsets[].
 * NOTE(review): '¬es' below looks like a mis-encoded '&notes' - confirm.
 */
2357 void annotation__set_offsets(struct annotation *notes, s64 size)
2359 struct annotation_line *al;
2361 notes->max_line_len = 0;
2363 list_for_each_entry(al, ¬es->src->source, node) {
2364 size_t line_len = strlen(al->line);
2366 if (notes->max_line_len < line_len)
2367 notes->max_line_len = line_len;
2368 al->idx = notes->nr_entries++;
2369 if (al->offset != -1) {
2370 al->idx_asm = notes->nr_asm_entries++;
2372 * FIXME: short term bandaid to cope with assembly
2373 * routines that comes with labels in the same column
2374 * as the address in objdump, sigh.
2376 * E.g. copy_user_generic_unrolled
2378 if (al->offset < size)
2379 notes->offsets[al->offset] = al;
/*
 * Helper whose result annotation__init_column_widths() stores in
 * notes->widths.jumps for the maximum jump-source count.
 * NOTE(review): the body is not visible in this listing.
 */
2385 static inline int width_jumps(int n)
/*
 * Initialise the column widths in 'notes': addr, target and min_addr take
 * the hex width of the symbol size, max_addr the hex width of sym->end,
 * and jumps the width computed from notes->max_jump_sources.
 */
2394 void annotation__init_column_widths(struct annotation *notes, struct symbol *sym)
2396 notes->widths.addr = notes->widths.target =
2397 notes->widths.min_addr = hex_width(symbol__size(sym));
2398 notes->widths.max_addr = hex_width(sym->end);
2399 notes->widths.jumps = width_jumps(notes->max_jump_sources);
/*
 * Recompute the target and addr widths from the current options.  The
 * target width is taken from min_addr or max_addr depending on use_offset
 * (the 'else' line is not visible in this listing), addr is set to the
 * target width, and show_nr_jumps adds the jumps width plus one.
 */
2402 void annotation__update_column_widths(struct annotation *notes)
2404 if (notes->options->use_offset)
2405 notes->widths.target = notes->widths.min_addr;
2407 notes->widths.target = notes->widths.max_addr;
2409 notes->widths.addr = notes->widths.target;
2411 if (notes->options->show_nr_jumps)
2412 notes->widths.addr += notes->widths.jumps + 1;
/*
 * Build the per-source-line summary tree in 'root'.
 *
 * For each annotation line the maximum percentage (of type
 * opts->percent_type) across its data entries is computed and compared
 * with 0.5; lines that go on get their path resolved with get_srcline()
 * and are inserted into a temporary tree keyed by path.  The temporary
 * tree is finally re-sorted into 'root' with resort_source_line().
 * NOTE(review): the statement guarded by the 0.5 threshold test is not
 * visible in this listing; presumably such lines are skipped.
 * NOTE(review): '¬es' below looks like a mis-encoded '&notes' - confirm.
 */
2415 static void annotation__calc_lines(struct annotation *notes, struct map *map,
2416 struct rb_root *root,
2417 struct annotation_options *opts)
2419 struct annotation_line *al;
2420 struct rb_root tmp_root = RB_ROOT;
2422 list_for_each_entry(al, ¬es->src->source, node) {
2423 double percent_max = 0.0;
2426 for (i = 0; i < al->data_nr; i++) {
2429 percent = annotation_data__percent(&al->data[i],
2430 opts->percent_type);
2432 if (percent > percent_max)
2433 percent_max = percent;
2436 if (percent_max <= 0.5)
2439 al->path = get_srcline(map->dso, notes->start + al->offset, NULL,
2440 false, true, notes->start + al->offset);
2441 insert_source_line(&tmp_root, al, opts);
2444 resort_source_line(root, &tmp_root);
/*
 * Symbol-level wrapper: fetch the annotation of 'sym' and pass it to
 * annotation__calc_lines() with the same map, root and options.
 */
2447 static void symbol__calc_lines(struct symbol *sym, struct map *map,
2448 struct rb_root *root,
2449 struct annotation_options *opts)
2451 struct annotation *notes = symbol__annotation(sym);
2453 annotation__calc_lines(notes, map, root, opts);
/*
 * Annotate 'sym' with symbol__annotate2() and print the result to stdout:
 * an optional sorted per-source-line summary (opts->print_lines), a title
 * built by hists__scnprintf_title() with the percent type, symbol and dso
 * names, then the annotation written by symbol__annotate_fprintf2().
 * The annotation source list is purged afterwards.
 * NOTE(review): the return statements and the declaration of 'buf' are
 * not visible in this listing.
 */
2456 int symbol__tty_annotate2(struct symbol *sym, struct map *map,
2457 struct perf_evsel *evsel,
2458 struct annotation_options *opts)
2460 struct dso *dso = map->dso;
2461 struct rb_root source_line = RB_ROOT;
2462 struct hists *hists = evsel__hists(evsel);
2465 if (symbol__annotate2(sym, map, evsel, opts, NULL) < 0)
2468 if (opts->print_lines) {
2469 srcline_full_filename = opts->full_path;
2470 symbol__calc_lines(sym, map, &source_line, opts);
2471 print_summary(&source_line, dso->long_name);
2474 hists__scnprintf_title(hists, buf, sizeof(buf));
2475 fprintf(stdout, "%s, [percent: %s]\n%s() %s\n",
2476 buf, percent_type_str(opts->percent_type), sym->name, dso->long_name);
2477 symbol__annotate_fprintf2(sym, stdout, opts);
2479 annotated_source__purge(symbol__annotation(sym)->src);
/*
 * Annotate 'sym' with symbol__annotate(), compute its percentages, and
 * print the result with symbol__annotate_printf(), preceded by the sorted
 * per-source-line summary when opts->print_lines is set.
 * The annotation source list is purged afterwards.
 * NOTE(review): the return statements are not visible in this listing.
 */
2484 int symbol__tty_annotate(struct symbol *sym, struct map *map,
2485 struct perf_evsel *evsel,
2486 struct annotation_options *opts)
2488 struct dso *dso = map->dso;
2489 struct rb_root source_line = RB_ROOT;
2491 if (symbol__annotate(sym, map, evsel, 0, opts, NULL) < 0)
2494 symbol__calc_percent(sym, evsel);
2496 if (opts->print_lines) {
2497 srcline_full_filename = opts->full_path;
2498 symbol__calc_lines(sym, map, &source_line, opts);
2499 print_summary(&source_line, dso->long_name);
2502 symbol__annotate_printf(sym, map, evsel, opts);
2504 annotated_source__purge(symbol__annotation(sym)->src);
/*
 * Returns true when use_browser equals 1 and perf_hpp_list.sym is set.
 */
2509 bool ui__has_annotation(void)
2511 return use_browser == 1 && perf_hpp_list.sym;
/*
 * Compute the largest percentage among the first notes->nr_events data
 * entries of 'al', starting from 0.0.
 * NOTE(review): the second argument passed to annotation_data__percent()
 * and the return statement are not visible in this listing; presumably
 * they are 'percent_type' and 'percent_max'.
 */
2515 static double annotation_line__max_percent(struct annotation_line *al,
2516 struct annotation *notes,
2517 unsigned int percent_type)
2519 double percent_max = 0.0;
2522 for (i = 0; i < notes->nr_events; i++) {
2525 percent = annotation_data__percent(&al->data[i],
2528 if (percent > percent_max)
2529 percent_max = percent;
/*
 * Emit the arrow marker for a disassembly line through the obj__*
 * callbacks, then format the instruction into 'bf' with
 * disasm_line__scnprintf().
 *
 * Visible marker choices: a down or up arrow for jumps, depending on
 * whether the target offset is greater than the line's own offset; a
 * right arrow for calls; a left arrow for returns.  Other lines get only
 * padding.
 * NOTE(review): the handling of 'dl->ops.target.outside' and the exact
 * branch structure are not visible in this listing.
 */
2535 static void disasm_line__write(struct disasm_line *dl, struct annotation *notes,
2536 void *obj, char *bf, size_t size,
2537 void (*obj__printf)(void *obj, const char *fmt, ...),
2538 void (*obj__write_graph)(void *obj, int graph))
2540 if (dl->ins.ops && dl->ins.ops->scnprintf) {
2541 if (ins__is_jump(&dl->ins)) {
2544 if (dl->ops.target.outside)
/* A target offset past this line means a forward jump. */
2546 fwd = dl->ops.target.offset > dl->al.offset;
2547 obj__write_graph(obj, fwd ? DARROW_CHAR : UARROW_CHAR);
2548 obj__printf(obj, " ");
2549 } else if (ins__is_call(&dl->ins)) {
2551 obj__write_graph(obj, RARROW_CHAR);
2552 obj__printf(obj, " ");
2553 } else if (ins__is_ret(&dl->ins)) {
2554 obj__write_graph(obj, LARROW_CHAR);
2555 obj__printf(obj, " ");
2557 obj__printf(obj, " ");
2560 obj__printf(obj, " ");
/* The last argument is true when addresses, not offsets, are shown. */
2563 disasm_line__scnprintf(dl, bf, size, !notes->options->use_offset);
/*
 * Write one annotation line through the obj__* callbacks.
 *
 * Visible output, in order:
 *  - per-event columns showing the period, the sample count or the
 *    percentage (chosen by show_total_period / show_nr_samples), or
 *    padding / a column title when there is nothing to show;
 *  - when notes->have_cycles is set, IPC and cycles columns (or a
 *    "cycles(min/max)" string when show_minmax_cycle is set);
 *  - for source lines (offset == -1) an optional line number and the text;
 *  - for disassembly lines an address or offset prefix and the formatted
 *    instruction from disasm_line__write().
 *
 * NOTE(review): many lines of this function (local declarations, several
 * conditions and branch bodies) are not visible in this listing.
 */
2566 static void __annotation_line__write(struct annotation_line *al, struct annotation *notes,
2567 bool first_line, bool current_entry, bool change_color, int width,
2568 void *obj, unsigned int percent_type,
2569 int (*obj__set_color)(void *obj, int color),
2570 void (*obj__set_percent_color)(void *obj, double percent, bool current),
2571 int (*obj__set_jumps_percent_color)(void *obj, int nr, bool current),
2572 void (*obj__printf)(void *obj, const char *fmt, ...),
2573 void (*obj__write_graph)(void *obj, int graph))
2576 double percent_max = annotation_line__max_percent(al, notes, percent_type);
2577 int pcnt_width = annotation__pcnt_width(notes),
2578 cycles_width = annotation__cycles_width(notes);
2579 bool show_title = false;
2583 if (first_line && (al->offset == -1 || percent_max == 0.0)) {
2584 if (notes->have_cycles) {
2585 if (al->ipc == 0.0 && al->cycles == 0)
/* Lines with an address and a non-zero maximum get one column per event. */
2591 if (al->offset != -1 && percent_max != 0.0) {
2594 for (i = 0; i < notes->nr_events; i++) {
2597 percent = annotation_data__percent(&al->data[i], percent_type);
2599 obj__set_percent_color(obj, percent, current_entry);
2600 if (notes->options->show_total_period) {
2601 obj__printf(obj, "%11" PRIu64 " ", al->data[i].he.period);
2602 } else if (notes->options->show_nr_samples) {
2603 obj__printf(obj, "%6" PRIu64 " ",
2604 al->data[i].he.nr_samples);
2606 obj__printf(obj, "%6.2f ", percent);
2610 obj__set_percent_color(obj, 0, current_entry);
2613 obj__printf(obj, "%-*s", pcnt_width, " ");
2615 obj__printf(obj, "%-*s", pcnt_width,
2616 notes->options->show_total_period ? "Period" :
2617 notes->options->show_nr_samples ? "Samples" : "Percent");
/* Optional IPC / cycles columns, only when cycle data is present. */
2621 if (notes->have_cycles) {
2623 obj__printf(obj, "%*.2f ", ANNOTATION__IPC_WIDTH - 1, al->ipc);
2624 else if (!show_title)
2625 obj__printf(obj, "%*s", ANNOTATION__IPC_WIDTH, " ");
2627 obj__printf(obj, "%*s ", ANNOTATION__IPC_WIDTH - 1, "IPC");
2629 if (!notes->options->show_minmax_cycle) {
2631 obj__printf(obj, "%*" PRIu64 " ",
2632 ANNOTATION__CYCLES_WIDTH - 1, al->cycles);
2633 else if (!show_title)
2634 obj__printf(obj, "%*s",
2635 ANNOTATION__CYCLES_WIDTH, " ");
2637 obj__printf(obj, "%*s ",
2638 ANNOTATION__CYCLES_WIDTH - 1,
2644 scnprintf(str, sizeof(str),
2645 "%" PRIu64 "(%" PRIu64 "/%" PRIu64 ")",
2646 al->cycles, al->cycles_min,
2649 obj__printf(obj, "%*s ",
2650 ANNOTATION__MINMAX_CYCLES_WIDTH - 1,
2652 } else if (!show_title)
2653 obj__printf(obj, "%*s",
2654 ANNOTATION__MINMAX_CYCLES_WIDTH,
2657 obj__printf(obj, "%*s ",
2658 ANNOTATION__MINMAX_CYCLES_WIDTH - 1,
2663 obj__printf(obj, " ");
2666 obj__printf(obj, "%-*s", width - pcnt_width - cycles_width, " ");
2667 else if (al->offset == -1) {
/* Source (non-disassembly) line: optional line number, then the text. */
2668 if (al->line_nr && notes->options->show_linenr)
2669 printed = scnprintf(bf, sizeof(bf), "%-*d ", notes->widths.addr + 1, al->line_nr);
2671 printed = scnprintf(bf, sizeof(bf), "%-*s ", notes->widths.addr, " ");
2672 obj__printf(obj, bf);
2673 obj__printf(obj, "%-*s", width - printed - pcnt_width - cycles_width + 1, al->line);
/* Disassembly line: the address is absolute unless use_offset is set. */
2675 u64 addr = al->offset;
2678 if (!notes->options->use_offset)
2679 addr += notes->start;
2681 if (!notes->options->use_offset) {
2682 printed = scnprintf(bf, sizeof(bf), "%" PRIx64 ": ", addr);
2684 if (al->jump_sources &&
2685 notes->options->offset_level >= ANNOTATION__OFFSET_JUMP_TARGETS) {
2686 if (notes->options->show_nr_jumps) {
2688 printed = scnprintf(bf, sizeof(bf), "%*d ",
2689 notes->widths.jumps,
2691 prev = obj__set_jumps_percent_color(obj, al->jump_sources,
2693 obj__printf(obj, bf);
2694 obj__set_color(obj, prev);
2697 printed = scnprintf(bf, sizeof(bf), "%*" PRIx64 ": ",
2698 notes->widths.target, addr);
2699 } else if (ins__is_call(&disasm_line(al)->ins) &&
2700 notes->options->offset_level >= ANNOTATION__OFFSET_CALL) {
2702 } else if (notes->options->offset_level == ANNOTATION__MAX_OFFSET_LEVEL) {
2705 printed = scnprintf(bf, sizeof(bf), "%-*s ",
2706 notes->widths.addr, " ");
/* The address prefix is printed in its own colour, restored afterwards. */
2711 color = obj__set_color(obj, HE_COLORSET_ADDR);
2712 obj__printf(obj, bf);
2714 obj__set_color(obj, color);
2716 disasm_line__write(disasm_line(al), notes, obj, bf, sizeof(bf), obj__printf, obj__write_graph);
2718 obj__printf(obj, "%-*s", width - pcnt_width - cycles_width - 3 - printed, bf);
/*
 * Public entry point: unpack the fields of 'wops' (state flags, width,
 * target object and callbacks) and forward them to
 * __annotation_line__write().
 * NOTE(review): the percent-type argument and the last callback argument
 * are on lines not visible in this listing.
 */
2723 void annotation_line__write(struct annotation_line *al, struct annotation *notes,
2724 struct annotation_write_ops *wops,
2725 struct annotation_options *opts)
2727 __annotation_line__write(al, notes, wops->first_line, wops->current_entry,
2728 wops->change_color, wops->width, wops->obj,
2730 wops->set_color, wops->set_percent_color,
2731 wops->set_jumps_percent_color, wops->printf,
/*
 * Annotate 'sym' and prepare the derived per-symbol state in 'notes'.
 *
 * Allocates notes->offsets with one zeroed pointer per byte of the symbol
 * size, runs symbol__annotate(), then records the options, computes
 * percentages, sets notes->start, fills the offsets table, marks jump
 * targets, computes IPC, initialises and updates the column widths, and
 * stores the number of events (the group size for group events, else 1).
 * notes->offsets is released with zfree() on a path reached from the
 * out_free_offsets label.
 * NOTE(review): the return statements and labels are not visible in this
 * listing.
 * NOTE(review): '¬es' below looks like a mis-encoded '&notes' - confirm.
 */
2735 int symbol__annotate2(struct symbol *sym, struct map *map, struct perf_evsel *evsel,
2736 struct annotation_options *options, struct arch **parch)
2738 struct annotation *notes = symbol__annotation(sym);
2739 size_t size = symbol__size(sym);
2740 int nr_pcnt = 1, err;
2742 notes->offsets = zalloc(size * sizeof(struct annotation_line *));
2743 if (notes->offsets == NULL)
2746 if (perf_evsel__is_group_event(evsel))
2747 nr_pcnt = evsel->nr_members;
2749 err = symbol__annotate(sym, map, evsel, 0, options, parch);
2751 goto out_free_offsets;
2753 notes->options = options;
2755 symbol__calc_percent(sym, evsel);
2757 notes->start = map__rip_2objdump(map, sym->start);
2759 annotation__set_offsets(notes, size);
2760 annotation__mark_jump_targets(notes, sym);
2761 annotation__compute_ipc(notes, size);
2762 annotation__init_column_widths(notes, sym);
2763 notes->nr_events = nr_pcnt;
2765 annotation__update_column_widths(notes);
2770 zfree(¬es->offsets);
/*
 * Build one annotation_config initializer: the name is the stringified
 * field name 'n' and the value points at that field of
 * annotation__default_options.
 */
2774 #define ANNOTATION__CFG(n) \
2775 { .name = #n, .value = &annotation__default_options.n, }
2778 * Keep the entries sorted, they are bsearch'ed
/*
 * Table mapping config variable names to fields of
 * annotation__default_options; annotation__config() looks names up here
 * with bsearch(), which is why the entries are listed in sorted order.
 * NOTE(review): the struct's member declarations are not visible in this
 * listing.
 */
2780 static struct annotation_config {
2783 } annotation__configs[] = {
2784 ANNOTATION__CFG(hide_src_code),
2785 ANNOTATION__CFG(jump_arrows),
2786 ANNOTATION__CFG(offset_level),
2787 ANNOTATION__CFG(show_linenr),
2788 ANNOTATION__CFG(show_nr_jumps),
2789 ANNOTATION__CFG(show_nr_samples),
2790 ANNOTATION__CFG(show_total_period),
2791 ANNOTATION__CFG(use_offset),
2794 #undef ANNOTATION__CFG
/*
 * bsearch() comparator: 'name' is the key string being looked up and
 * 'cfgp' points at an annotation_config entry; they are ordered by
 * strcmp() on the entry's name.
 */
2796 static int annotation_config__cmp(const void *name, const void *cfgp)
2798 const struct annotation_config *cfg = cfgp;
2800 return strcmp(name, cfg->name);
/*
 * perf_config() callback for "annotate.*" variables.
 *
 * The variable is first tested for the "annotate." prefix, then 'name' is
 * looked up in annotation__configs.  Unknown names are reported with
 * pr_debug(); "annotate.offset_level" is parsed as an int and clamped to
 * [ANNOTATION__MIN_OFFSET_LEVEL, ANNOTATION__MAX_OFFSET_LEVEL]; the last
 * visible assignment parses the value as a bool.
 * NOTE(review): the derivation of 'name', the return statements and some
 * branch keywords are not visible in this listing.
 */
2803 static int annotation__config(const char *var, const char *value,
2804 void *data __maybe_unused)
2806 struct annotation_config *cfg;
2809 if (!strstarts(var, "annotate."))
2813 cfg = bsearch(name, annotation__configs, ARRAY_SIZE(annotation__configs),
2814 sizeof(struct annotation_config), annotation_config__cmp);
2817 pr_debug("%s variable unknown, ignoring...", var);
2818 else if (strcmp(var, "annotate.offset_level") == 0) {
2819 perf_config_int(cfg->value, name, value);
/* Clamp the configured level into the supported range. */
2821 if (*(int *)cfg->value > ANNOTATION__MAX_OFFSET_LEVEL)
2822 *(int *)cfg->value = ANNOTATION__MAX_OFFSET_LEVEL;
2823 else if (*(int *)cfg->value < ANNOTATION__MIN_OFFSET_LEVEL)
2824 *(int *)cfg->value = ANNOTATION__MIN_OFFSET_LEVEL;
2826 *(bool *)cfg->value = perf_config_bool(name, value);
/*
 * Load the annotate configuration through perf_config(), then copy
 * show_total_period and show_nr_samples from symbol_conf into the default
 * options.  Because the copy happens after the config is read, the
 * symbol_conf values take precedence for these two fields.
 */
2831 void annotation_config__init(void)
2833 perf_config(annotation__config, NULL);
2835 annotation__default_options.show_total_period = symbol_conf.show_total_period;
2836 annotation__default_options.show_nr_samples = symbol_conf.show_nr_samples;
/*
 * Map a pair of strings to a PERCENT_* constant: str1 selects "period" or
 * "hits" and str2 selects "local" or "global".  'type' starts as
 * (unsigned int)-1 and is only changed when both strings match.
 * NOTE(review): the return statement is not visible in this listing;
 * presumably 'type' is returned, since the caller compares the result
 * with (unsigned int)-1.
 */
2839 static unsigned int parse_percent_type(char *str1, char *str2)
2841 unsigned int type = (unsigned int) -1;
2843 if (!strcmp("period", str1)) {
2844 if (!strcmp("local", str2))
2845 type = PERCENT_PERIOD_LOCAL;
2846 else if (!strcmp("global", str2))
2847 type = PERCENT_PERIOD_GLOBAL;
2850 if (!strcmp("hits", str1)) {
2851 if (!strcmp("local", str2))
2852 type = PERCENT_HITS_LOCAL;
2853 else if (!strcmp("global", str2))
2854 type = PERCENT_HITS_GLOBAL;
2860 int annotate_parse_percent_type(const struct option *opt, const char *_str,
2861 int unset __maybe_unused)
2863 struct annotation_options *opts = opt->value;
2868 str1 = strdup(_str);
2872 str2 = strchr(str1, '-');
2878 type = parse_percent_type(str1, str2);
2879 if (type == (unsigned int) -1)
2880 type = parse_percent_type(str2, str1);
2881 if (type != (unsigned int) -1) {
2882 opts->percent_type = type;