/*
 * File-scope callchain display parameters. The only initializer visible in
 * this excerpt sets the mode to CHAIN_GRAPH_REL; any further fields are not
 * shown here.
 */
7 struct callchain_param callchain_param = {
8 .mode = CHAIN_GRAPH_REL,
/*
 * Add @period to the per-CPU-mode counter of @self selected by @cpumode:
 *   PERF_RECORD_MISC_KERNEL       -> period_sys
 *   PERF_RECORD_MISC_USER         -> period_us
 *   PERF_RECORD_MISC_GUEST_KERNEL -> period_guest_sys
 *   PERF_RECORD_MISC_GUEST_USER   -> period_guest_us
 * NOTE(review): the switch header, the break statements and any default
 * case are not visible in this excerpt.
 */
12 static void hist_entry__add_cpumode_period(struct hist_entry *self,
13 unsigned int cpumode, u64 period)
16 case PERF_RECORD_MISC_KERNEL:
17 self->period_sys += period;
19 case PERF_RECORD_MISC_USER:
20 self->period_us += period;
22 case PERF_RECORD_MISC_GUEST_KERNEL:
23 self->period_guest_sys += period;
25 case PERF_RECORD_MISC_GUEST_USER:
26 self->period_guest_us += period;
34 * histogram, sorted on item, collects periods
/*
 * Allocate a new hist_entry. When symbol_conf.use_callchain is set, room for
 * one struct callchain_node is added to the same allocation and initialised
 * through callchain_init(self->callchain).
 * NOTE(review): how @template is copied into the new entry and how a failed
 * malloc() is handled are not visible in this excerpt -- confirm there is a
 * NULL check before self is dereferenced.
 */
37 static struct hist_entry *hist_entry__new(struct hist_entry *template)
/* Extra bytes are only requested when callchains are in use. */
39 size_t callchain_size = symbol_conf.use_callchain ? sizeof(struct callchain_node) : 0;
40 struct hist_entry *self = malloc(sizeof(*self) + callchain_size);
45 if (symbol_conf.use_callchain)
46 callchain_init(self->callchain);
/*
 * Account @entry in @self: if the entry has a symbol whose name is longer
 * than self->max_sym_namelen, raise max_sym_namelen to that length.
 * NOTE(review): the entry counter update suggested by the function name is
 * not among the lines visible here.
 */
52 static void hists__inc_nr_entries(struct hists *self, struct hist_entry *entry)
54 if (entry->ms.sym && self->max_sym_namelen < entry->ms.sym->namelen)
55 self->max_sym_namelen = entry->ms.sym->namelen;
/*
 * Find or create the histogram entry for a sample in self->entries.
 *
 * A stack-local key entry is compared against existing rb-tree nodes with
 * hist_entry__cmp(). When a new node is needed it is created from the key by
 * hist_entry__new(), linked and rebalanced into self->entries and counted via
 * hists__inc_nr_entries(). The per-CPU-mode period of the resulting entry is
 * then updated from al->cpumode and @period.
 *
 * NOTE(review): the key initializer, the tree-walk loop, the handling of an
 * exact match, the check of hist_entry__new()'s result and the return
 * statement are not visible in this excerpt.
 */
59 struct hist_entry *__hists__add_entry(struct hists *self,
60 struct addr_location *al,
61 struct symbol *sym_parent, u64 period)
63 struct rb_node **p = &self->entries.rb_node;
64 struct rb_node *parent = NULL;
65 struct hist_entry *he;
66 struct hist_entry entry = {
81 he = rb_entry(parent, struct hist_entry, rb_node);
83 cmp = hist_entry__cmp(&entry, he);
/* No match path: materialise the key as a heap entry and insert it. */
97 he = hist_entry__new(&entry);
100 rb_link_node(&he->rb_node, parent, p);
101 rb_insert_color(&he->rb_node, &self->entries);
102 hists__inc_nr_entries(self, he);
104 hist_entry__add_cpumode_period(he, al->cpumode, period);
/*
 * Compare two entries by walking hist_entry__sort_list and calling each sort
 * entry's se_cmp(left, right).
 * NOTE(review): the return type, the early exit on a non-zero result and the
 * return statement are not visible here.
 */
109 hist_entry__cmp(struct hist_entry *left, struct hist_entry *right)
111 struct sort_entry *se;
114 list_for_each_entry(se, &hist_entry__sort_list, list) {
115 cmp = se->se_cmp(left, right);
/*
 * Compare two entries for collapsing: for each sort entry in
 * hist_entry__sort_list use se_collapse when it is set, otherwise fall back
 * to se_cmp (GNU "?:" shorthand), and call it on (left, right).
 * NOTE(review): the return type and the loop exit / return statements are
 * not visible here.
 */
124 hist_entry__collapse(struct hist_entry *left, struct hist_entry *right)
126 struct sort_entry *se;
129 list_for_each_entry(se, &hist_entry__sort_list, list) {
130 int64_t (*f)(struct hist_entry *, struct hist_entry *);
/* Prefer the dedicated collapse comparator, else the regular one. */
132 f = se->se_collapse ?: se->se_cmp;
134 cmp = f(left, right);
/*
 * Dispose of @he. Only the signature is visible in this excerpt; the function
 * is called by collapse__insert_entry() once an entry's period has been
 * merged into an existing node -- presumably it frees the entry, confirm
 * against the full body.
 */
142 void hist_entry__free(struct hist_entry *he)
148 * collapse the histogram
/*
 * Insert @he into the collapse tree @root.
 *
 * Existing nodes are compared with hist_entry__collapse(iter, he). The
 * visible merge path adds he->period to the existing node and releases @he
 * with hist_entry__free(); otherwise @he is linked and rebalanced into @root.
 *
 * NOTE(review): the loop, the branch conditions and the bool return values
 * are not visible here. The caller counts the entry only when this returns
 * true, which suggests true means "inserted as a new node" -- confirm.
 */
151 static bool collapse__insert_entry(struct rb_root *root, struct hist_entry *he)
153 struct rb_node **p = &root->rb_node;
154 struct rb_node *parent = NULL;
155 struct hist_entry *iter;
160 iter = rb_entry(parent, struct hist_entry, rb_node);
162 cmp = hist_entry__collapse(iter, he);
/* Merge path: fold the period into the existing node and drop @he. */
165 iter->period += he->period;
166 hist_entry__free(he);
176 rb_link_node(&he->rb_node, parent, p);
177 rb_insert_color(&he->rb_node, root);
/*
 * Rebuild self->entries with collapsible entries merged.
 *
 * Guarded by sort__need_collapse (the guarded statement is not visible;
 * presumably an early return). nr_entries and max_sym_namelen are reset, then
 * every node is erased from self->entries and offered to
 * collapse__insert_entry() on a temporary tree; entries for which that call
 * returns true are re-counted with hists__inc_nr_entries().
 *
 * NOTE(review): the declaration of tmp, the loop header and the final
 * assignment of the temporary tree back to self->entries are not visible.
 */
181 void hists__collapse_resort(struct hists *self)
184 struct rb_node *next;
185 struct hist_entry *n;
187 if (!sort__need_collapse)
191 next = rb_first(&self->entries);
192 self->nr_entries = 0;
193 self->max_sym_namelen = 0;
196 n = rb_entry(next, struct hist_entry, rb_node);
/* Fetch the successor before the node is unlinked from the tree. */
197 next = rb_next(&n->rb_node);
199 rb_erase(&n->rb_node, &self->entries);
200 if (collapse__insert_entry(&tmp, n))
201 hists__inc_nr_entries(self, n);
208 * reverse the map, sort on period.
/*
 * Insert @he into the output tree @entries, ordered by period.
 *
 * When callchains are enabled, the entry's callchain is first sorted into
 * he->sorted_chain through the callchain_param.sort callback, passing
 * @min_callchain_hits and the global callchain_param.
 *
 * NOTE(review): the tree-walk loop and which child is taken when
 * he->period > iter->period are not visible in this excerpt.
 */
211 static void __hists__insert_output_entry(struct rb_root *entries,
212 struct hist_entry *he,
213 u64 min_callchain_hits)
215 struct rb_node **p = &entries->rb_node;
216 struct rb_node *parent = NULL;
217 struct hist_entry *iter;
219 if (symbol_conf.use_callchain)
220 callchain_param.sort(&he->sorted_chain, he->callchain,
221 min_callchain_hits, &callchain_param);
225 iter = rb_entry(parent, struct hist_entry, rb_node);
227 if (he->period > iter->period)
233 rb_link_node(&he->rb_node, parent, p);
234 rb_insert_color(&he->rb_node, entries);
/*
 * Re-sort all entries of @self for output.
 *
 * Computes the callchain hit threshold from the total period and
 * callchain_param.min_percent, resets nr_entries and max_sym_namelen, then
 * moves every node from self->entries into a temporary tree with
 * __hists__insert_output_entry() and re-counts it.
 *
 * NOTE(review): the declaration of tmp, the loop header and the final
 * assignment back to self->entries are not visible here.
 */
237 void hists__output_resort(struct hists *self)
240 struct rb_node *next;
241 struct hist_entry *n;
242 u64 min_callchain_hits;
/*
 * NOTE(review): if min_percent has an integer type, "min_percent / 100"
 * truncates to 0 for values below 100 -- confirm it is floating point.
 */
244 min_callchain_hits = self->stats.total_period * (callchain_param.min_percent / 100);
247 next = rb_first(&self->entries);
249 self->nr_entries = 0;
250 self->max_sym_namelen = 0;
253 n = rb_entry(next, struct hist_entry, rb_node);
/* Fetch the successor before the node is unlinked from the tree. */
254 next = rb_next(&n->rb_node);
256 rb_erase(&n->rb_node, &self->entries);
257 __hists__insert_output_entry(&tmp, n, min_callchain_hits);
258 hists__inc_nr_entries(self, n);
/*
 * Print the left margin of a callchain line to @fp: one fixed prefix string
 * followed by @left_margin repetitions of a padding string. The fprintf()
 * return values are accumulated in ret.
 * NOTE(review): the declaration of i and the return statement are not
 * visible in this excerpt.
 */
264 static size_t callchain__fprintf_left_margin(FILE *fp, int left_margin)
267 int ret = fprintf(fp, " ");
269 for (i = 0; i < left_margin; i++)
270 ret += fprintf(fp, " ");
/*
 * Print one separator line of the callchain graph: the left margin, then for
 * each of the @depth levels either a pipe column (when bit i of @depth_mask
 * is set) or a blank column, then a newline.
 * NOTE(review): the remaining parameters, the else keyword and the return
 * statement are not visible here.
 */
275 static size_t ipchain__fprintf_graph_line(FILE *fp, int depth, int depth_mask,
279 size_t ret = callchain__fprintf_left_margin(fp, left_margin);
281 for (i = 0; i < depth; i++)
/* Bit i of the mask says whether level i still has a pipe to draw. */
282 if (depth_mask & (1 << i))
283 ret += fprintf(fp, "| ");
285 ret += fprintf(fp, " ");
287 ret += fprintf(fp, "\n");
/*
 * Print one callchain entry of the graph.
 *
 * After the left margin, a pipe or blank is printed per depth level
 * according to @depth_mask. On the last level (i == depth - 1), when @period
 * is zero, the share hits * 100.0 / total_samples is printed with
 * percent_color_fprintf(). The line ends with either the symbol name of
 * @chain or its raw ip formatted with %p.
 *
 * NOTE(review): the remaining parameters, the else branches and the
 * condition choosing between symbol name and raw ip are not visible here.
 * NOTE(review): total_samples == 0 would make the percentage non-finite --
 * confirm callers never pass 0.
 */
292 static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain,
293 int depth, int depth_mask, int period,
294 u64 total_samples, int hits,
300 ret += callchain__fprintf_left_margin(fp, left_margin);
301 for (i = 0; i < depth; i++) {
302 if (depth_mask & (1 << i))
303 ret += fprintf(fp, "|");
305 ret += fprintf(fp, " ");
306 if (!period && i == depth - 1) {
309 percent = hits * 100.0 / total_samples;
310 ret += percent_color_fprintf(fp, "--%2.2f%%-- ", percent);
312 ret += fprintf(fp, "%s", " ");
315 ret += fprintf(fp, "%s\n", chain->ms.sym->name);
317 ret += fprintf(fp, "%p\n", (void *)(long)chain->ip);
/*
 * Placeholder used when printing the remaining (not individually listed)
 * hits of a callchain level: rem_sq_bracket is a heap-allocated symbol named
 * "[...]" and rem_hits is the callchain_list entry whose ms.sym points at it.
 * Both are set up by init_rem_hits().
 */
322 static struct symbol *rem_sq_bracket;
323 static struct callchain_list rem_hits;
/*
 * Allocate the "[...]" placeholder symbol and attach it to rem_hits.
 * On allocation failure a message is written to stderr.
 * NOTE(review): the statement following the error message (presumably an
 * early return) is not visible in this excerpt.
 */
325 static void init_rem_hits(void)
/* 6 extra bytes: the five characters of "[...]" plus the terminating NUL. */
327 rem_sq_bracket = malloc(sizeof(*rem_sq_bracket) + 6);
328 if (!rem_sq_bracket) {
329 fprintf(stderr, "Not enough memory to display remaining hits\n");
333 strcpy(rem_sq_bracket->name, "[...]");
334 rem_hits.ms.sym = rem_sq_bracket;
/*
 * Recursively print the children of callchain node @self as a graph.
 *
 * The reference total is self->children_hit in CHAIN_GRAPH_REL mode and
 * @total_samples otherwise; "remaining" starts at that total. Each child in
 * self->rb_root is printed: a separator line with the old depth mask, then
 * one ipchain__fprintf_graph() line per entry of child->val, then a recursive
 * call on the child with the bit for the current depth added to the mask.
 * Output stops once callchain_param.print_limit entries have been printed.
 * In CHAIN_GRAPH_REL mode, if some but not all of the total is left in
 * "remaining", a final "[...]" line is printed through rem_hits.
 *
 * NOTE(review): the loop header, how cumul is subtracted from remaining, the
 * full argument lists of the nested calls and the return statement are not
 * visible in this excerpt.
 */
337 static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
338 u64 total_samples, int depth,
339 int depth_mask, int left_margin)
341 struct rb_node *node, *next;
342 struct callchain_node *child;
343 struct callchain_list *chain;
344 int new_depth_mask = depth_mask;
349 uint entries_printed = 0;
351 if (callchain_param.mode == CHAIN_GRAPH_REL)
352 new_total = self->children_hit;
354 new_total = total_samples;
356 remaining = new_total;
358 node = rb_first(&self->rb_root);
362 child = rb_entry(node, struct callchain_node, rb_node);
363 cumul = cumul_hits(child);
367 * The depth mask manages the output of pipes that show
368 * the depth. We don't want to keep the pipes of the current
369 * level for the last child of this depth.
370 * Except if we have remaining filtered hits. They will
371 * supersede the last child
373 next = rb_next(node);
374 if (!next && (callchain_param.mode != CHAIN_GRAPH_REL || !remaining))
375 new_depth_mask &= ~(1 << (depth - 1));
378 * But we keep the older depth mask for the line separator
379 * to keep the level link until we reach the last child
381 ret += ipchain__fprintf_graph_line(fp, depth, depth_mask,
384 list_for_each_entry(chain, &child->val, list) {
385 ret += ipchain__fprintf_graph(fp, chain, depth,
391 ret += __callchain__fprintf_graph(fp, child, new_total,
393 new_depth_mask | (1 << depth),
396 if (++entries_printed == callchain_param.print_limit)
400 if (callchain_param.mode == CHAIN_GRAPH_REL &&
401 remaining && remaining != new_total) {
/* The "[...]" line is the last one at this level: drop its pipe. */
406 new_depth_mask &= ~(1 << (depth - 1));
408 ret += ipchain__fprintf_graph(fp, &rem_hits, depth,
409 new_depth_mask, 0, new_total,
410 remaining, left_margin);
/*
 * Print a callchain in graph form starting at root node @self.
 *
 * The entries of self->val are printed first (symbol name, or raw ip with
 * %p), preceded once by a "|" line and a "---" connector; printing stops
 * after callchain_param.print_limit entries. The children are then printed
 * by __callchain__fprintf_graph() with depth 1 and depth mask 1.
 *
 * NOTE(review): the first entry gets special treatment when
 * sort__first_dimension == SORT_SYM (presumably it is skipped); the guarded
 * statement, the use of "printed" and the return statement are not visible.
 */
416 static size_t callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
417 u64 total_samples, int left_margin)
419 struct callchain_list *chain;
420 bool printed = false;
423 u32 entries_printed = 0;
425 list_for_each_entry(chain, &self->val, list) {
426 if (!i++ && sort__first_dimension == SORT_SYM)
430 ret += callchain__fprintf_left_margin(fp, left_margin);
431 ret += fprintf(fp, "|\n");
432 ret += callchain__fprintf_left_margin(fp, left_margin);
433 ret += fprintf(fp, "---");
438 ret += callchain__fprintf_left_margin(fp, left_margin);
441 ret += fprintf(fp, " %s\n", chain->ms.sym->name);
443 ret += fprintf(fp, " %p\n", (void *)(long)chain->ip);
445 if (++entries_printed == callchain_param.print_limit)
449 ret += __callchain__fprintf_graph(fp, self, total_samples, 1, 1, left_margin);
/*
 * Print a callchain in flat form: recurse into self->parent first, then
 * print every entry of self->val as a symbol name or as a raw ip (%p).
 * Entries whose ip is >= PERF_CONTEXT_MAX are tested separately.
 * NOTE(review): the recursion guard, the statement taken for context
 * markers (presumably "continue") and the return are not visible here.
 */
454 static size_t callchain__fprintf_flat(FILE *fp, struct callchain_node *self,
457 struct callchain_list *chain;
463 ret += callchain__fprintf_flat(fp, self->parent, total_samples);
466 list_for_each_entry(chain, &self->val, list) {
467 if (chain->ip >= PERF_CONTEXT_MAX)
470 ret += fprintf(fp, " %s\n", chain->ms.sym->name);
472 ret += fprintf(fp, " %p\n",
473 (void *)(long)chain->ip);
/*
 * Print the sorted callchains of hist entry @self.
 *
 * Each node of self->sorted_chain is printed according to
 * callchain_param.mode: the flat mode prints the node's share
 * (chain->hit * 100.0 / total_samples) followed by
 * callchain__fprintf_flat(); both graph modes call
 * callchain__fprintf_graph(). A blank line follows each chain, and output
 * stops after callchain_param.print_limit chains.
 *
 * NOTE(review): the loop header, the flat-mode case label, the remaining
 * switch cases and the return statement are not visible here.
 */
479 static size_t hist_entry_callchain__fprintf(FILE *fp, struct hist_entry *self,
480 u64 total_samples, int left_margin)
482 struct rb_node *rb_node;
483 struct callchain_node *chain;
485 u32 entries_printed = 0;
487 rb_node = rb_first(&self->sorted_chain);
491 chain = rb_entry(rb_node, struct callchain_node, rb_node);
492 percent = chain->hit * 100.0 / total_samples;
493 switch (callchain_param.mode) {
495 ret += percent_color_fprintf(fp, " %6.2f%%\n",
497 ret += callchain__fprintf_flat(fp, chain, total_samples);
499 case CHAIN_GRAPH_ABS: /* Falldown */
500 case CHAIN_GRAPH_REL:
501 ret += callchain__fprintf_graph(fp, chain, total_samples,
507 ret += fprintf(fp, "\n");
508 if (++entries_printed == callchain_param.print_limit)
510 rb_node = rb_next(rb_node);
/*
 * Format one histogram line for @self into the buffer @s of @size bytes.
 *
 * Two sources for the numbers are visible: the paired entry (self->pair,
 * with 0 when there is no pair, and pair_hists->stats.total_period as total)
 * or the entry itself with @session_total as total. The line is built from:
 *   - the overhead percentage (coloured or plain), or the raw period;
 *   - with symbol_conf.show_cpu_utilization, the sys / us / guest sys /
 *     guest us percentages;
 *   - with symbol_conf.show_nr_samples, the period as a count column;
 *   - a delta column (new percentage minus old percentage, shown only when
 *     its magnitude is at least 0.01);
 *   - with @show_displacement, the displacement column;
 *   - one column per entry of hist_entry__sort_list via se_snprintf().
 * With a field separator (symbol_conf.field_sep) the compact formats are
 * used; otherwise fixed-width formats are used.
 *
 * NOTE(review): many branch conditions (including the one choosing between
 * the pair and own numbers), the declaration of bf and the return statement
 * are not visible in this excerpt.
 * NOTE(review): ret accumulates snprintf() results, which report the length
 * that would have been written; after a truncation "size - ret" could wrap
 * around as size_t -- confirm the buffer is always large enough.
 * NOTE(review): period is u64 but is printed with %lld -- confirm the
 * project-wide type/format convention.
 */
516 int hist_entry__snprintf(struct hist_entry *self, char *s, size_t size,
517 struct hists *pair_hists, bool show_displacement,
518 long displacement, bool color, u64 session_total)
520 struct sort_entry *se;
521 u64 period, total, period_sys, period_us, period_guest_sys, period_guest_us;
522 const char *sep = symbol_conf.field_sep;
525 if (symbol_conf.exclude_other && !self->parent)
/* Numbers taken from the paired entry; zero when there is no pair. */
529 period = self->pair ? self->pair->period : 0;
530 total = pair_hists->stats.total_period;
531 period_sys = self->pair ? self->pair->period_sys : 0;
532 period_us = self->pair ? self->pair->period_us : 0;
533 period_guest_sys = self->pair ? self->pair->period_guest_sys : 0;
534 period_guest_us = self->pair ? self->pair->period_guest_us : 0;
/* Numbers taken from this entry itself. */
536 period = self->period;
537 total = session_total;
538 period_sys = self->period_sys;
539 period_us = self->period_us;
540 period_guest_sys = self->period_guest_sys;
541 period_guest_us = self->period_guest_us;
546 ret = percent_color_snprintf(s, size,
547 sep ? "%.2f" : " %6.2f%%",
548 (period * 100.0) / total);
550 ret = snprintf(s, size, sep ? "%.2f" : " %6.2f%%",
551 (period * 100.0) / total);
552 if (symbol_conf.show_cpu_utilization) {
553 ret += percent_color_snprintf(s + ret, size - ret,
554 sep ? "%.2f" : " %6.2f%%",
555 (period_sys * 100.0) / total);
556 ret += percent_color_snprintf(s + ret, size - ret,
557 sep ? "%.2f" : " %6.2f%%",
558 (period_us * 100.0) / total);
560 ret += percent_color_snprintf(s + ret,
562 sep ? "%.2f" : " %6.2f%%",
563 (period_guest_sys * 100.0) /
565 ret += percent_color_snprintf(s + ret,
567 sep ? "%.2f" : " %6.2f%%",
568 (period_guest_us * 100.0) /
573 ret = snprintf(s, size, sep ? "%lld" : "%12lld ", period);
575 if (symbol_conf.show_nr_samples) {
577 ret += snprintf(s + ret, size - ret, "%c%lld", *sep, period);
579 ret += snprintf(s + ret, size - ret, "%11lld", period);
584 double old_percent = 0, new_percent = 0, diff;
587 old_percent = (period * 100.0) / total;
588 if (session_total > 0)
589 new_percent = (self->period * 100.0) / session_total;
591 diff = new_percent - old_percent;
/* Deltas smaller than 0.01 are shown as a blank column. */
593 if (fabs(diff) >= 0.01)
594 snprintf(bf, sizeof(bf), "%+4.2F%%", diff);
596 snprintf(bf, sizeof(bf), " ");
599 ret += snprintf(s + ret, size - ret, "%c%s", *sep, bf);
601 ret += snprintf(s + ret, size - ret, "%11.11s", bf);
603 if (show_displacement) {
605 snprintf(bf, sizeof(bf), "%+4ld", displacement);
607 snprintf(bf, sizeof(bf), " ");
610 ret += snprintf(s + ret, size - ret, "%c%s", *sep, bf);
612 ret += snprintf(s + ret, size - ret, "%6.6s", bf);
616 list_for_each_entry(se, &hist_entry__sort_list, list) {
620 ret += snprintf(s + ret, size - ret, "%s", sep ?: " ");
/* A sort entry without a width pointer is formatted with width 0. */
621 ret += se->se_snprintf(self, s + ret, size - ret,
622 se->se_width ? *se->se_width : 0);
/*
 * Format @self with hist_entry__snprintf() (colour enabled) into the local
 * buffer bf and write it to @fp followed by a newline. Returns the fprintf()
 * result.
 * NOTE(review): the last parameter(s) and the declaration of bf are not
 * visible in this excerpt.
 */
628 int hist_entry__fprintf(struct hist_entry *self, struct hists *pair_hists,
629 bool show_displacement, long displacement, FILE *fp,
633 hist_entry__snprintf(self, bf, sizeof(bf), pair_hists,
634 show_displacement, displacement,
635 true, session_total);
636 return fprintf(fp, "%s\n", bf);
/*
 * Print the callchains of @self to @fp via hist_entry_callchain__fprintf().
 * When the first sort dimension is SORT_COMM, the left margin is the width
 * of the first sort column (0 when it has no width pointer) minus the length
 * of the thread's comm.
 * NOTE(review): the remaining parameter(s) and the initial value of
 * left_margin are not visible here.
 */
639 static size_t hist_entry__fprintf_callchain(struct hist_entry *self, FILE *fp,
644 if (sort__first_dimension == SORT_COMM) {
645 struct sort_entry *se = list_first_entry(&hist_entry__sort_list,
647 left_margin = se->se_width ? *se->se_width : 0;
648 left_margin -= thread__comm_len(self->thread);
651 return hist_entry_callchain__fprintf(fp, self, session_total,
/*
 * Print the whole histogram @self to @fp.
 *
 * Visible steps:
 *   1. Header line: "Baseline" when @pair is given, otherwise "Overhead";
 *      then optional Samples, sys/us/guest columns, Delta and Displacement
 *      headers, then one header per sort entry. Column widths may be taken
 *      from the comma-separated symbol_conf.col_width_list_str, and each
 *      column is at least as wide as its header.
 *   2. A dotted underline row matching the columns.
 *   3. One line per entry of self->entries (hist_entry__fprintf), followed
 *      by its callchain when symbol_conf.use_callchain is set, and by the
 *      thread's function maps when the entry has no map and verbose > 1.
 *   4. free(rem_sq_bracket) at the end.
 *
 * NOTE(review): many conditions (separator vs. fixed-width branches, the
 * pair checks, filtering of entries), the init_rem_hits() call that would
 * match the final free, and the return statement are not visible here.
 * NOTE(review): atoi() gives no error indication for malformed width lists.
 */
655 size_t hists__fprintf(struct hists *self, struct hists *pair,
656 bool show_displacement, FILE *fp)
658 struct sort_entry *se;
661 unsigned long position = 1;
662 long displacement = 0;
664 const char *sep = symbol_conf.field_sep;
665 const char *col_width = symbol_conf.col_width_list_str;
669 fprintf(fp, "# %s", pair ? "Baseline" : "Overhead");
671 if (symbol_conf.show_nr_samples) {
673 fprintf(fp, "%cSamples", *sep);
675 fputs(" Samples ", fp);
678 if (symbol_conf.show_cpu_utilization) {
680 ret += fprintf(fp, "%csys", *sep);
681 ret += fprintf(fp, "%cus", *sep);
683 ret += fprintf(fp, "%cguest sys", *sep);
684 ret += fprintf(fp, "%cguest us", *sep);
687 ret += fprintf(fp, " sys ");
688 ret += fprintf(fp, " us ");
690 ret += fprintf(fp, " guest sys ");
691 ret += fprintf(fp, " guest us ");
698 ret += fprintf(fp, "%cDelta", *sep);
700 ret += fprintf(fp, " Delta ");
702 if (show_displacement) {
704 ret += fprintf(fp, "%cDisplacement", *sep);
706 ret += fprintf(fp, " Displ");
710 list_for_each_entry(se, &hist_entry__sort_list, list) {
714 fprintf(fp, "%c%s", *sep, se->se_header);
717 width = strlen(se->se_header);
719 if (symbol_conf.col_width_list_str) {
/* Consume one width from the user-supplied comma-separated list. */
721 *se->se_width = atoi(col_width);
722 col_width = strchr(col_width, ',');
/* Never make a column narrower than its header text. */
727 width = *se->se_width = max(*se->se_width, width);
729 fprintf(fp, " %*s", width, se->se_header);
736 fprintf(fp, "# ........");
737 if (symbol_conf.show_nr_samples)
738 fprintf(fp, " ..........");
740 fprintf(fp, " ..........");
741 if (show_displacement)
742 fprintf(fp, " .....");
744 list_for_each_entry(se, &hist_entry__sort_list, list) {
752 width = *se->se_width;
754 width = strlen(se->se_header);
755 for (i = 0; i < width; i++)
759 fprintf(fp, "\n#\n");
762 for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) {
763 struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node);
765 if (show_displacement) {
767 displacement = ((long)h->pair->position -
773 ret += hist_entry__fprintf(h, pair, show_displacement,
774 displacement, fp, self->stats.total_period);
776 if (symbol_conf.use_callchain)
777 ret += hist_entry__fprintf_callchain(h, fp, self->stats.total_period);
779 if (h->ms.map == NULL && verbose > 1) {
780 __map_groups__fprintf_maps(&h->thread->mg,
781 MAP__FUNCTION, verbose, fp);
782 fprintf(fp, "%.10s end\n", graph_dotted_line);
786 free(rem_sq_bracket);
/*
 * Apply (or clear, when @dso is NULL) the DSO filter on every entry of @self
 * and recompute the aggregate statistics.
 *
 * nr_entries, stats.total_period, the PERF_RECORD_SAMPLE event count and
 * max_sym_namelen are reset first. An entry with no map, or with a map whose
 * dso differs from @dso, gets the HIST_FILTER__DSO bit set in h->filtered;
 * otherwise the bit is cleared and the entry's period, event count and
 * symbol name length are folded back into the statistics.
 *
 * NOTE(review): the statements following the exclude_other test and the
 * filtered branch (presumably "continue"), any check of other filter bits
 * and the nr_entries increment are not visible in this excerpt.
 */
796 void hists__filter_by_dso(struct hists *self, const struct dso *dso)
800 self->nr_entries = self->stats.total_period = 0;
801 self->stats.nr_events[PERF_RECORD_SAMPLE] = 0;
802 self->max_sym_namelen = 0;
804 for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) {
805 struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node);
807 if (symbol_conf.exclude_other && !h->parent)
810 if (dso != NULL && (h->ms.map == NULL || h->ms.map->dso != dso)) {
811 h->filtered |= (1 << HIST_FILTER__DSO);
815 h->filtered &= ~(1 << HIST_FILTER__DSO);
818 self->stats.total_period += h->period;
819 self->stats.nr_events[PERF_RECORD_SAMPLE] += h->nr_events;
821 self->max_sym_namelen < h->ms.sym->namelen)
822 self->max_sym_namelen = h->ms.sym->namelen;
/*
 * Apply (or clear, when @thread is NULL) the thread filter on every entry of
 * @self and recompute the aggregate statistics.
 *
 * nr_entries, stats.total_period, the PERF_RECORD_SAMPLE event count and
 * max_sym_namelen are reset first. An entry whose thread differs from
 * @thread gets the HIST_FILTER__THREAD bit set in h->filtered; otherwise the
 * bit is cleared and the entry's period, event count and symbol name length
 * are folded back into the statistics.
 *
 * NOTE(review): the statement following the filtered branch (presumably
 * "continue"), any check of other filter bits and the nr_entries increment
 * are not visible in this excerpt.
 */
827 void hists__filter_by_thread(struct hists *self, const struct thread *thread)
831 self->nr_entries = self->stats.total_period = 0;
832 self->stats.nr_events[PERF_RECORD_SAMPLE] = 0;
833 self->max_sym_namelen = 0;
835 for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) {
836 struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node);
838 if (thread != NULL && h->thread != thread) {
839 h->filtered |= (1 << HIST_FILTER__THREAD);
842 h->filtered &= ~(1 << HIST_FILTER__THREAD);
845 self->stats.total_period += h->period;
846 self->stats.nr_events[PERF_RECORD_SAMPLE] += h->nr_events;
848 self->max_sym_namelen < h->ms.sym->namelen)
849 self->max_sym_namelen = h->ms.sym->namelen;
/*
 * Allocate the zero-filled per-address histogram of symbol @self: the
 * histogram header plus one u64 slot per byte of the symbol's address range
 * (end - start). The result is stored in the symbol's private area.
 *
 * Returns 0 on success, -1 when zalloc() fails.
 *
 * NOTE(review): the byte count is computed in a wider type but stored in a
 * "const int"; a very large symbol range could truncate or go negative
 * before being passed to zalloc() -- consider size_t.
 */
854 static int symbol__alloc_hist(struct symbol *self)
856 struct sym_priv *priv = symbol__priv(self);
857 const int size = (sizeof(*priv->hist) +
858 (self->end - self->start) * sizeof(u64));
860 priv->hist = zalloc(size);
861 return priv->hist == NULL ? -1 : 0;
/*
 * Record a sample at address @ip in the per-address histogram of the symbol
 * that @self resolves to.
 *
 * Entries without a symbol or map are tested first. The symbol's histogram
 * is allocated on first use via symbol__alloc_hist(). The slot index is
 * ip - sym->start, which is range-checked against the symbol size.
 *
 * NOTE(review): the return values, the declaration of h and the actual
 * counter increments are not visible in this excerpt.
 * NOTE(review): sym_size and offset are unsigned int while the operands look
 * 64-bit; confirm the narrowing cannot defeat the "offset >= sym_size" check.
 */
864 int hist_entry__inc_addr_samples(struct hist_entry *self, u64 ip)
866 unsigned int sym_size, offset;
867 struct symbol *sym = self->ms.sym;
868 struct sym_priv *priv;
871 if (!sym || !self->ms.map)
874 priv = symbol__priv(sym);
/* Lazily allocate the histogram the first time the symbol is hit. */
875 if (priv->hist == NULL && symbol__alloc_hist(sym) < 0)
878 sym_size = sym->end - sym->start;
879 offset = ip - sym->start;
881 pr_debug3("%s: ip=%#Lx\n", __func__, self->ms.map->unmap_ip(self->ms.map, ip));
883 if (offset >= sym_size)
890 pr_debug3("%#Lx %s: period++ [ip: %#Lx, %#Lx] => %Ld\n", self->ms.sym->start,
891 self->ms.sym->name, ip, ip - self->ms.sym->start, h->ip[offset]);
/*
 * Allocate an objdump_line and store @offset in it.
 * NOTE(review): the NULL check on malloc(), what is done with @line (and
 * who owns that string afterwards) and the return statement are not visible
 * in this excerpt.
 */
895 static struct objdump_line *objdump_line__new(s64 offset, char *line)
897 struct objdump_line *self = malloc(sizeof(*self));
900 self->offset = offset;
/*
 * Dispose of an objdump_line. Only the signature is visible in this excerpt;
 * presumably it releases what objdump_line__new() allocated -- confirm
 * against the full body.
 */
907 void objdump_line__free(struct objdump_line *self)
/* Append @line to the tail of the list @head, keeping lines in read order. */
913 static void objdump__add_line(struct list_head *head, struct objdump_line *line)
915 list_add_tail(&line->node, head);
/*
 * Continue iterating the list @head after @pos and look for the next line
 * whose offset is >= 0. Lines created with offset -1 (the initial value used
 * by hist_entry__parse_objdump_line() when no address was parsed) do not
 * match.
 * NOTE(review): the return statements (match and not-found) are not visible
 * in this excerpt.
 */
918 struct objdump_line *objdump__get_next_ip_line(struct list_head *head,
919 struct objdump_line *pos)
921 list_for_each_entry_continue(pos, head, node)
922 if (pos->offset >= 0)
/*
 * Read one line of objdump output from @file and append it to @head.
 *
 * The line is read with getline(), trailing whitespace and a newline are
 * trimmed, leading spaces are skipped and a hexadecimal address is parsed
 * with strtoull(). When an address was recognised, offset becomes that
 * address minus the objdump-relative start of the symbol; otherwise it keeps
 * its initial value of -1. The line is wrapped by objdump_line__new() and
 * appended with objdump__add_line().
 *
 * NOTE(review): the return values, the condition accepting the parsed
 * address and the cleanup on allocation failure are not visible here.
 * NOTE(review): the second argument of getline() receives the buffer
 * capacity, not the string length; the trimming loop below indexes the
 * buffer with that value -- confirm this is intended (the getline() return
 * value is the actual length).
 */
928 static int hist_entry__parse_objdump_line(struct hist_entry *self, FILE *file,
929 struct list_head *head)
931 struct symbol *sym = self->ms.sym;
932 struct objdump_line *objdump_line;
933 char *line = NULL, *tmp, *tmp2, *c;
935 s64 line_ip, offset = -1;
937 if (getline(&line, &line_len, file) < 0)
943 while (line_len != 0 && isspace(line[line_len - 1]))
944 line[--line_len] = '\0';
946 c = strchr(line, '\n');
953 * Strip leading spaces:
964 * Parse hexa addresses followed by ':'
966 line_ip = strtoull(tmp, &tmp2, 16);
/* Convert the absolute objdump address into an offset inside the symbol. */
972 u64 start = map__rip_2objdump(self->ms.map, sym->start);
973 offset = line_ip - start;
976 objdump_line = objdump_line__new(offset, line);
977 if (objdump_line == NULL) {
981 objdump__add_line(head, objdump_line);
/*
 * Disassemble the symbol of @self with objdump and collect the output lines
 * into the list @head.
 *
 * For a DSO whose origin is DSO__ORIG_KERNEL, the visible lines warn once
 * per DSO (annotate_warned) that no vmlinux file was found and print the
 * searched vmlinux path to stderr. Otherwise an
 * "objdump --start-address=... --stop-address=... -dS" pipeline, filtered
 * through grep and expand, is built for the symbol's objdump-relative
 * address range, run with popen(), and its output is parsed line by line
 * with hist_entry__parse_objdump_line().
 *
 * NOTE(review): the conditions around the kernel warning, the popen()
 * failure handling, the read loop, pclose() and the return values are not
 * visible in this excerpt.
 * NOTE(review): the DSO file name is inserted unquoted into a shell command
 * line; a path containing spaces or shell metacharacters would be
 * misinterpreted by the shell -- consider quoting or avoiding the shell.
 * NOTE(review): self->ms.map is dereferenced in the initializers without a
 * visible NULL check -- confirm callers guarantee a map.
 */
986 int hist_entry__annotate(struct hist_entry *self, struct list_head *head)
988 struct symbol *sym = self->ms.sym;
989 struct map *map = self->ms.map;
990 struct dso *dso = map->dso;
991 const char *filename = dso->long_name;
992 char command[PATH_MAX * 2];
999 if (dso->origin == DSO__ORIG_KERNEL) {
/* Only warn once per DSO. */
1000 if (dso->annotate_warned)
1002 dso->annotate_warned = 1;
1003 pr_err("Can't annotate %s: No vmlinux file was found in the "
1004 "path:\n", sym->name);
1005 vmlinux_path__fprintf(stderr);
1009 pr_debug("%s: filename=%s, sym=%s, start=%#Lx, end=%#Lx\n", __func__,
1010 filename, sym->name, map->unmap_ip(map, sym->start),
1011 map->unmap_ip(map, sym->end));
1013 len = sym->end - sym->start;
1015 pr_debug("annotating [%p] %30s : [%p] %30s\n",
1016 dso, dso->long_name, sym, sym->name);
1018 snprintf(command, sizeof(command),
1019 "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s|expand",
1020 map__rip_2objdump(map, sym->start),
1021 map__rip_2objdump(map, sym->end),
1022 filename, filename);
1024 pr_debug("Executing: %s\n", command);
1026 file = popen(command, "r");
1031 if (hist_entry__parse_objdump_line(self, file, head) < 0)
/*
 * Count one event of @type in @self: increments both slot 0 of
 * stats.nr_events and the slot indexed by @type.
 * NOTE(review): slot 0 appears to serve as an overall total -- confirm.
 * @type is used as an array index without a visible bounds check.
 */
1038 void hists__inc_nr_events(struct hists *self, u32 type)
1040 ++self->stats.nr_events[0];
1041 ++self->stats.nr_events[type];
/*
 * Print the per-type event counters of @self to @fp, one
 * "<name> events: <count>" line for each index below PERF_RECORD_HEADER_MAX
 * that has an entry in event__name[].
 * NOTE(review): the statement taken for nameless indexes (presumably
 * "continue"), the declarations of i and ret and the return statement are
 * not visible in this excerpt.
 */
1044 size_t hists__fprintf_nr_events(struct hists *self, FILE *fp)
1049 for (i = 0; i < PERF_RECORD_HEADER_MAX; ++i) {
1050 if (!event__name[i])
1052 ret += fprintf(fp, "%10s events: %10d\n",
1053 event__name[i], self->stats.nr_events[i]);