]> git.proxmox.com Git - mirror_ubuntu-bionic-kernel.git/blob - tools/perf/util/hist.c
perf: Fix orphan callchain branches
[mirror_ubuntu-bionic-kernel.git] / tools / perf / util / hist.c
1 #include "hist.h"
2 #include "session.h"
3 #include "sort.h"
4 #include <math.h>
5
6 struct callchain_param callchain_param = {
7 .mode = CHAIN_GRAPH_REL,
8 .min_percent = 0.5
9 };
10
11 /*
12 * histogram, sorted on item, collects counts
13 */
14
15 struct hist_entry *__perf_session__add_hist_entry(struct rb_root *hists,
16 struct addr_location *al,
17 struct symbol *sym_parent,
18 u64 count, bool *hit)
19 {
20 struct rb_node **p = &hists->rb_node;
21 struct rb_node *parent = NULL;
22 struct hist_entry *he;
23 struct hist_entry entry = {
24 .thread = al->thread,
25 .map = al->map,
26 .sym = al->sym,
27 .ip = al->addr,
28 .level = al->level,
29 .count = count,
30 .parent = sym_parent,
31 };
32 int cmp;
33
34 while (*p != NULL) {
35 parent = *p;
36 he = rb_entry(parent, struct hist_entry, rb_node);
37
38 cmp = hist_entry__cmp(&entry, he);
39
40 if (!cmp) {
41 *hit = true;
42 return he;
43 }
44
45 if (cmp < 0)
46 p = &(*p)->rb_left;
47 else
48 p = &(*p)->rb_right;
49 }
50
51 he = malloc(sizeof(*he));
52 if (!he)
53 return NULL;
54 *he = entry;
55 rb_link_node(&he->rb_node, parent, p);
56 rb_insert_color(&he->rb_node, hists);
57 *hit = false;
58 return he;
59 }
60
61 int64_t
62 hist_entry__cmp(struct hist_entry *left, struct hist_entry *right)
63 {
64 struct sort_entry *se;
65 int64_t cmp = 0;
66
67 list_for_each_entry(se, &hist_entry__sort_list, list) {
68 cmp = se->cmp(left, right);
69 if (cmp)
70 break;
71 }
72
73 return cmp;
74 }
75
76 int64_t
77 hist_entry__collapse(struct hist_entry *left, struct hist_entry *right)
78 {
79 struct sort_entry *se;
80 int64_t cmp = 0;
81
82 list_for_each_entry(se, &hist_entry__sort_list, list) {
83 int64_t (*f)(struct hist_entry *, struct hist_entry *);
84
85 f = se->collapse ?: se->cmp;
86
87 cmp = f(left, right);
88 if (cmp)
89 break;
90 }
91
92 return cmp;
93 }
94
/* Release the memory of a single histogram entry via free(). */
void hist_entry__free(struct hist_entry *he)
{
	free(he);
}
99
100 /*
101 * collapse the histogram
102 */
103
104 static void collapse__insert_entry(struct rb_root *root, struct hist_entry *he)
105 {
106 struct rb_node **p = &root->rb_node;
107 struct rb_node *parent = NULL;
108 struct hist_entry *iter;
109 int64_t cmp;
110
111 while (*p != NULL) {
112 parent = *p;
113 iter = rb_entry(parent, struct hist_entry, rb_node);
114
115 cmp = hist_entry__collapse(iter, he);
116
117 if (!cmp) {
118 iter->count += he->count;
119 hist_entry__free(he);
120 return;
121 }
122
123 if (cmp < 0)
124 p = &(*p)->rb_left;
125 else
126 p = &(*p)->rb_right;
127 }
128
129 rb_link_node(&he->rb_node, parent, p);
130 rb_insert_color(&he->rb_node, root);
131 }
132
133 void perf_session__collapse_resort(struct rb_root *hists)
134 {
135 struct rb_root tmp;
136 struct rb_node *next;
137 struct hist_entry *n;
138
139 if (!sort__need_collapse)
140 return;
141
142 tmp = RB_ROOT;
143 next = rb_first(hists);
144
145 while (next) {
146 n = rb_entry(next, struct hist_entry, rb_node);
147 next = rb_next(&n->rb_node);
148
149 rb_erase(&n->rb_node, hists);
150 collapse__insert_entry(&tmp, n);
151 }
152
153 *hists = tmp;
154 }
155
156 /*
157 * reverse the map, sort on count.
158 */
159
160 static void perf_session__insert_output_hist_entry(struct rb_root *root,
161 struct hist_entry *he,
162 u64 min_callchain_hits)
163 {
164 struct rb_node **p = &root->rb_node;
165 struct rb_node *parent = NULL;
166 struct hist_entry *iter;
167
168 if (symbol_conf.use_callchain)
169 callchain_param.sort(&he->sorted_chain, &he->callchain,
170 min_callchain_hits, &callchain_param);
171
172 while (*p != NULL) {
173 parent = *p;
174 iter = rb_entry(parent, struct hist_entry, rb_node);
175
176 if (he->count > iter->count)
177 p = &(*p)->rb_left;
178 else
179 p = &(*p)->rb_right;
180 }
181
182 rb_link_node(&he->rb_node, parent, p);
183 rb_insert_color(&he->rb_node, root);
184 }
185
186 void perf_session__output_resort(struct rb_root *hists, u64 total_samples)
187 {
188 struct rb_root tmp;
189 struct rb_node *next;
190 struct hist_entry *n;
191 u64 min_callchain_hits;
192
193 min_callchain_hits =
194 total_samples * (callchain_param.min_percent / 100);
195
196 tmp = RB_ROOT;
197 next = rb_first(hists);
198
199 while (next) {
200 n = rb_entry(next, struct hist_entry, rb_node);
201 next = rb_next(&n->rb_node);
202
203 rb_erase(&n->rb_node, hists);
204 perf_session__insert_output_hist_entry(&tmp, n,
205 min_callchain_hits);
206 }
207
208 *hists = tmp;
209 }
210
/*
 * Print the fixed leading pad followed by one more pad per unit of
 * @left_margin (nothing extra when @left_margin is zero or negative).
 *
 * Returns the accumulated fprintf() return values.
 */
static size_t callchain__fprintf_left_margin(FILE *fp, int left_margin)
{
	int printed = fprintf(fp, " ");
	int remaining = left_margin;

	while (remaining > 0) {
		printed += fprintf(fp, " ");
		remaining--;
	}

	return printed;
}
221
/*
 * Print a separator line for the callchain graph: the left margin, then for
 * each of the @depth levels either a pipe column (bit set in @depth_mask)
 * or a blank column, then a newline.
 *
 * Returns the accumulated fprintf() return values.
 */
static size_t ipchain__fprintf_graph_line(FILE *fp, int depth, int depth_mask,
					  int left_margin)
{
	size_t printed = callchain__fprintf_left_margin(fp, left_margin);
	int level = 0;

	while (level < depth) {
		int has_pipe = depth_mask & (1 << level);

		if (has_pipe) {
			printed += fprintf(fp, "| ");
		} else {
			printed += fprintf(fp, " ");
		}
		level++;
	}

	printed += fprintf(fp, "\n");

	return printed;
}
238
239 static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain,
240 int depth, int depth_mask, int count,
241 u64 total_samples, int hits,
242 int left_margin)
243 {
244 int i;
245 size_t ret = 0;
246
247 ret += callchain__fprintf_left_margin(fp, left_margin);
248 for (i = 0; i < depth; i++) {
249 if (depth_mask & (1 << i))
250 ret += fprintf(fp, "|");
251 else
252 ret += fprintf(fp, " ");
253 if (!count && i == depth - 1) {
254 double percent;
255
256 percent = hits * 100.0 / total_samples;
257 ret += percent_color_fprintf(fp, "--%2.2f%%-- ", percent);
258 } else
259 ret += fprintf(fp, "%s", " ");
260 }
261 if (chain->sym)
262 ret += fprintf(fp, "%s\n", chain->sym->name);
263 else
264 ret += fprintf(fp, "%p\n", (void *)(long)chain->ip);
265
266 return ret;
267 }
268
269 static struct symbol *rem_sq_bracket;
270 static struct callchain_list rem_hits;
271
272 static void init_rem_hits(void)
273 {
274 rem_sq_bracket = malloc(sizeof(*rem_sq_bracket) + 6);
275 if (!rem_sq_bracket) {
276 fprintf(stderr, "Not enough memory to display remaining hits\n");
277 return;
278 }
279
280 strcpy(rem_sq_bracket->name, "[...]");
281 rem_hits.sym = rem_sq_bracket;
282 }
283
284 static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
285 u64 total_samples, int depth,
286 int depth_mask, int left_margin)
287 {
288 struct rb_node *node, *next;
289 struct callchain_node *child;
290 struct callchain_list *chain;
291 int new_depth_mask = depth_mask;
292 u64 new_total;
293 u64 remaining;
294 size_t ret = 0;
295 int i;
296
297 if (callchain_param.mode == CHAIN_GRAPH_REL)
298 new_total = self->children_hit;
299 else
300 new_total = total_samples;
301
302 remaining = new_total;
303
304 node = rb_first(&self->rb_root);
305 while (node) {
306 u64 cumul;
307
308 child = rb_entry(node, struct callchain_node, rb_node);
309 cumul = cumul_hits(child);
310 remaining -= cumul;
311
312 /*
313 * The depth mask manages the output of pipes that show
314 * the depth. We don't want to keep the pipes of the current
315 * level for the last child of this depth.
316 * Except if we have remaining filtered hits. They will
317 * supersede the last child
318 */
319 next = rb_next(node);
320 if (!next && (callchain_param.mode != CHAIN_GRAPH_REL || !remaining))
321 new_depth_mask &= ~(1 << (depth - 1));
322
323 /*
324 * But we keep the older depth mask for the line separator
325 * to keep the level link until we reach the last child
326 */
327 ret += ipchain__fprintf_graph_line(fp, depth, depth_mask,
328 left_margin);
329 i = 0;
330 list_for_each_entry(chain, &child->val, list) {
331 ret += ipchain__fprintf_graph(fp, chain, depth,
332 new_depth_mask, i++,
333 new_total,
334 cumul,
335 left_margin);
336 }
337 ret += __callchain__fprintf_graph(fp, child, new_total,
338 depth + 1,
339 new_depth_mask | (1 << depth),
340 left_margin);
341 node = next;
342 }
343
344 if (callchain_param.mode == CHAIN_GRAPH_REL &&
345 remaining && remaining != new_total) {
346
347 if (!rem_sq_bracket)
348 return ret;
349
350 new_depth_mask &= ~(1 << (depth - 1));
351
352 ret += ipchain__fprintf_graph(fp, &rem_hits, depth,
353 new_depth_mask, 0, new_total,
354 remaining, left_margin);
355 }
356
357 return ret;
358 }
359
360 static size_t callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
361 u64 total_samples, int left_margin)
362 {
363 struct callchain_list *chain;
364 bool printed = false;
365 int i = 0;
366 int ret = 0;
367
368 list_for_each_entry(chain, &self->val, list) {
369 if (!i++ && sort__first_dimension == SORT_SYM)
370 continue;
371
372 if (!printed) {
373 ret += callchain__fprintf_left_margin(fp, left_margin);
374 ret += fprintf(fp, "|\n");
375 ret += callchain__fprintf_left_margin(fp, left_margin);
376 ret += fprintf(fp, "---");
377
378 left_margin += 3;
379 printed = true;
380 } else
381 ret += callchain__fprintf_left_margin(fp, left_margin);
382
383 if (chain->sym)
384 ret += fprintf(fp, " %s\n", chain->sym->name);
385 else
386 ret += fprintf(fp, " %p\n", (void *)(long)chain->ip);
387 }
388
389 ret += __callchain__fprintf_graph(fp, self, total_samples, 1, 1, left_margin);
390
391 return ret;
392 }
393
394 static size_t callchain__fprintf_flat(FILE *fp, struct callchain_node *self,
395 u64 total_samples)
396 {
397 struct callchain_list *chain;
398 size_t ret = 0;
399
400 if (!self)
401 return 0;
402
403 ret += callchain__fprintf_flat(fp, self->parent, total_samples);
404
405
406 list_for_each_entry(chain, &self->val, list) {
407 if (chain->ip >= PERF_CONTEXT_MAX)
408 continue;
409 if (chain->sym)
410 ret += fprintf(fp, " %s\n", chain->sym->name);
411 else
412 ret += fprintf(fp, " %p\n",
413 (void *)(long)chain->ip);
414 }
415
416 return ret;
417 }
418
419 static size_t hist_entry_callchain__fprintf(FILE *fp, struct hist_entry *self,
420 u64 total_samples, int left_margin)
421 {
422 struct rb_node *rb_node;
423 struct callchain_node *chain;
424 size_t ret = 0;
425
426 rb_node = rb_first(&self->sorted_chain);
427 while (rb_node) {
428 double percent;
429
430 chain = rb_entry(rb_node, struct callchain_node, rb_node);
431 percent = chain->hit * 100.0 / total_samples;
432 switch (callchain_param.mode) {
433 case CHAIN_FLAT:
434 ret += percent_color_fprintf(fp, " %6.2f%%\n",
435 percent);
436 ret += callchain__fprintf_flat(fp, chain, total_samples);
437 break;
438 case CHAIN_GRAPH_ABS: /* Falldown */
439 case CHAIN_GRAPH_REL:
440 ret += callchain__fprintf_graph(fp, chain, total_samples,
441 left_margin);
442 case CHAIN_NONE:
443 default:
444 break;
445 }
446 ret += fprintf(fp, "\n");
447 rb_node = rb_next(rb_node);
448 }
449
450 return ret;
451 }
452
453 size_t hist_entry__fprintf(struct hist_entry *self,
454 struct perf_session *pair_session,
455 bool show_displacement,
456 long displacement, FILE *fp,
457 u64 session_total)
458 {
459 struct sort_entry *se;
460 u64 count, total;
461 const char *sep = symbol_conf.field_sep;
462 size_t ret;
463
464 if (symbol_conf.exclude_other && !self->parent)
465 return 0;
466
467 if (pair_session) {
468 count = self->pair ? self->pair->count : 0;
469 total = pair_session->events_stats.total;
470 } else {
471 count = self->count;
472 total = session_total;
473 }
474
475 if (total)
476 ret = percent_color_fprintf(fp, sep ? "%.2f" : " %6.2f%%",
477 (count * 100.0) / total);
478 else
479 ret = fprintf(fp, sep ? "%lld" : "%12lld ", count);
480
481 if (symbol_conf.show_nr_samples) {
482 if (sep)
483 ret += fprintf(fp, "%c%lld", *sep, count);
484 else
485 ret += fprintf(fp, "%11lld", count);
486 }
487
488 if (pair_session) {
489 char bf[32];
490 double old_percent = 0, new_percent = 0, diff;
491
492 if (total > 0)
493 old_percent = (count * 100.0) / total;
494 if (session_total > 0)
495 new_percent = (self->count * 100.0) / session_total;
496
497 diff = new_percent - old_percent;
498
499 if (fabs(diff) >= 0.01)
500 snprintf(bf, sizeof(bf), "%+4.2F%%", diff);
501 else
502 snprintf(bf, sizeof(bf), " ");
503
504 if (sep)
505 ret += fprintf(fp, "%c%s", *sep, bf);
506 else
507 ret += fprintf(fp, "%11.11s", bf);
508
509 if (show_displacement) {
510 if (displacement)
511 snprintf(bf, sizeof(bf), "%+4ld", displacement);
512 else
513 snprintf(bf, sizeof(bf), " ");
514
515 if (sep)
516 ret += fprintf(fp, "%c%s", *sep, bf);
517 else
518 ret += fprintf(fp, "%6.6s", bf);
519 }
520 }
521
522 list_for_each_entry(se, &hist_entry__sort_list, list) {
523 if (se->elide)
524 continue;
525
526 ret += fprintf(fp, "%s", sep ?: " ");
527 ret += se->print(fp, self, se->width ? *se->width : 0);
528 }
529
530 return ret + fprintf(fp, "\n");
531 }
532
533 static size_t hist_entry__fprintf_callchain(struct hist_entry *self, FILE *fp,
534 u64 session_total)
535 {
536 int left_margin = 0;
537
538 if (sort__first_dimension == SORT_COMM) {
539 struct sort_entry *se = list_first_entry(&hist_entry__sort_list,
540 typeof(*se), list);
541 left_margin = se->width ? *se->width : 0;
542 left_margin -= thread__comm_len(self->thread);
543 }
544
545 return hist_entry_callchain__fprintf(fp, self, session_total,
546 left_margin);
547 }
548
549 size_t perf_session__fprintf_hists(struct rb_root *hists,
550 struct perf_session *pair,
551 bool show_displacement, FILE *fp,
552 u64 session_total)
553 {
554 struct sort_entry *se;
555 struct rb_node *nd;
556 size_t ret = 0;
557 unsigned long position = 1;
558 long displacement = 0;
559 unsigned int width;
560 const char *sep = symbol_conf.field_sep;
561 char *col_width = symbol_conf.col_width_list_str;
562
563 init_rem_hits();
564
565 fprintf(fp, "# %s", pair ? "Baseline" : "Overhead");
566
567 if (symbol_conf.show_nr_samples) {
568 if (sep)
569 fprintf(fp, "%cSamples", *sep);
570 else
571 fputs(" Samples ", fp);
572 }
573
574 if (pair) {
575 if (sep)
576 ret += fprintf(fp, "%cDelta", *sep);
577 else
578 ret += fprintf(fp, " Delta ");
579
580 if (show_displacement) {
581 if (sep)
582 ret += fprintf(fp, "%cDisplacement", *sep);
583 else
584 ret += fprintf(fp, " Displ");
585 }
586 }
587
588 list_for_each_entry(se, &hist_entry__sort_list, list) {
589 if (se->elide)
590 continue;
591 if (sep) {
592 fprintf(fp, "%c%s", *sep, se->header);
593 continue;
594 }
595 width = strlen(se->header);
596 if (se->width) {
597 if (symbol_conf.col_width_list_str) {
598 if (col_width) {
599 *se->width = atoi(col_width);
600 col_width = strchr(col_width, ',');
601 if (col_width)
602 ++col_width;
603 }
604 }
605 width = *se->width = max(*se->width, width);
606 }
607 fprintf(fp, " %*s", width, se->header);
608 }
609 fprintf(fp, "\n");
610
611 if (sep)
612 goto print_entries;
613
614 fprintf(fp, "# ........");
615 if (symbol_conf.show_nr_samples)
616 fprintf(fp, " ..........");
617 if (pair) {
618 fprintf(fp, " ..........");
619 if (show_displacement)
620 fprintf(fp, " .....");
621 }
622 list_for_each_entry(se, &hist_entry__sort_list, list) {
623 unsigned int i;
624
625 if (se->elide)
626 continue;
627
628 fprintf(fp, " ");
629 if (se->width)
630 width = *se->width;
631 else
632 width = strlen(se->header);
633 for (i = 0; i < width; i++)
634 fprintf(fp, ".");
635 }
636
637 fprintf(fp, "\n#\n");
638
639 print_entries:
640 for (nd = rb_first(hists); nd; nd = rb_next(nd)) {
641 struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node);
642
643 if (show_displacement) {
644 if (h->pair != NULL)
645 displacement = ((long)h->pair->position -
646 (long)position);
647 else
648 displacement = 0;
649 ++position;
650 }
651 ret += hist_entry__fprintf(h, pair, show_displacement,
652 displacement, fp, session_total);
653
654 if (symbol_conf.use_callchain)
655 ret += hist_entry__fprintf_callchain(h, fp, session_total);
656
657 if (h->map == NULL && verbose > 1) {
658 __map_groups__fprintf_maps(&h->thread->mg,
659 MAP__FUNCTION, fp);
660 fprintf(fp, "%.10s end\n", graph_dotted_line);
661 }
662 }
663
664 free(rem_sq_bracket);
665
666 return ret;
667 }