]> Pileus Git - ~andy/linux/blob - tools/perf/builtin-report.c
perf tools: Bind callchains to the first sort dimension column
[~andy/linux] / tools / perf / builtin-report.c
1 /*
2  * builtin-report.c
3  *
4  * Builtin report command: Analyze the perf.data input file,
5  * look up and read DSOs and symbol information and display
6  * a histogram of results, along various sorting keys.
7  */
8 #include "builtin.h"
9
10 #include "util/util.h"
11
12 #include "util/color.h"
13 #include <linux/list.h>
14 #include "util/cache.h"
15 #include <linux/rbtree.h>
16 #include "util/symbol.h"
17 #include "util/string.h"
18 #include "util/callchain.h"
19 #include "util/strlist.h"
20 #include "util/values.h"
21
22 #include "perf.h"
23 #include "util/debug.h"
24 #include "util/header.h"
25
26 #include "util/parse-options.h"
27 #include "util/parse-events.h"
28
29 #include "util/data_map.h"
30 #include "util/thread.h"
31 #include "util/sort.h"
32 #include "util/hist.h"
33
34 static char             const *input_name = "perf.data";
35
36 static char             *dso_list_str, *comm_list_str, *sym_list_str,
37                         *col_width_list_str;
38 static struct strlist   *dso_list, *comm_list, *sym_list;
39
40 static int              force;
41
42 static int              full_paths;
43 static int              show_nr_samples;
44
45 static int              show_threads;
46 static struct perf_read_values  show_threads_values;
47
48 static char             default_pretty_printing_style[] = "normal";
49 static char             *pretty_printing_style = default_pretty_printing_style;
50
51 static int              exclude_other = 1;
52
53 static char             callchain_default_opt[] = "fractal,0.5";
54
55 static char             *cwd;
56 static int              cwdlen;
57
58 static struct perf_header *header;
59
60 static u64              sample_type;
61
62
/*
 * Write the fixed indentation that starts every callchain line, followed by
 * left_margin additional blanks (none when left_margin is <= 0).
 *
 * Returns the number of characters written.
 */
static size_t
callchain__fprintf_left_margin(FILE *fp, int left_margin)
{
	int printed = fprintf(fp, "            ");
	int pad = 0;

	while (pad < left_margin) {
		printed += fprintf(fp, " ");
		pad++;
	}

	return printed;
}
76
/*
 * Print one separator row of the callchain graph: the left margin, then for
 * each of the depth levels either a pipe column (bit set in depth_mask) or a
 * blank column, and finally a newline.
 *
 * Returns the number of characters written.
 */
static size_t ipchain__fprintf_graph_line(FILE *fp, int depth, int depth_mask,
					  int left_margin)
{
	size_t printed = callchain__fprintf_left_margin(fp, left_margin);
	int level;

	for (level = 0; level < depth; level++) {
		const char *column;

		if (depth_mask & (1 << level))
			column = "|          ";
		else
			column = "           ";

		printed += fprintf(fp, "%s", column);
	}

	printed += fprintf(fp, "\n");

	return printed;
}
95 static size_t
96 ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain, int depth,
97                        int depth_mask, int count, u64 total_samples,
98                        int hits, int left_margin)
99 {
100         int i;
101         size_t ret = 0;
102
103         ret += callchain__fprintf_left_margin(fp, left_margin);
104         for (i = 0; i < depth; i++) {
105                 if (depth_mask & (1 << i))
106                         ret += fprintf(fp, "|");
107                 else
108                         ret += fprintf(fp, " ");
109                 if (!count && i == depth - 1) {
110                         double percent;
111
112                         percent = hits * 100.0 / total_samples;
113                         ret += percent_color_fprintf(fp, "--%2.2f%%-- ", percent);
114                 } else
115                         ret += fprintf(fp, "%s", "          ");
116         }
117         if (chain->sym)
118                 ret += fprintf(fp, "%s\n", chain->sym->name);
119         else
120                 ret += fprintf(fp, "%p\n", (void *)(long)chain->ip);
121
122         return ret;
123 }
124
125 static struct symbol *rem_sq_bracket;
126 static struct callchain_list rem_hits;
127
128 static void init_rem_hits(void)
129 {
130         rem_sq_bracket = malloc(sizeof(*rem_sq_bracket) + 6);
131         if (!rem_sq_bracket) {
132                 fprintf(stderr, "Not enough memory to display remaining hits\n");
133                 return;
134         }
135
136         strcpy(rem_sq_bracket->name, "[...]");
137         rem_hits.sym = rem_sq_bracket;
138 }
139
140 static size_t
141 __callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
142                            u64 total_samples, int depth, int depth_mask,
143                            int left_margin)
144 {
145         struct rb_node *node, *next;
146         struct callchain_node *child;
147         struct callchain_list *chain;
148         int new_depth_mask = depth_mask;
149         u64 new_total;
150         u64 remaining;
151         size_t ret = 0;
152         int i;
153
154         if (callchain_param.mode == CHAIN_GRAPH_REL)
155                 new_total = self->children_hit;
156         else
157                 new_total = total_samples;
158
159         remaining = new_total;
160
161         node = rb_first(&self->rb_root);
162         while (node) {
163                 u64 cumul;
164
165                 child = rb_entry(node, struct callchain_node, rb_node);
166                 cumul = cumul_hits(child);
167                 remaining -= cumul;
168
169                 /*
170                  * The depth mask manages the output of pipes that show
171                  * the depth. We don't want to keep the pipes of the current
172                  * level for the last child of this depth.
173                  * Except if we have remaining filtered hits. They will
174                  * supersede the last child
175                  */
176                 next = rb_next(node);
177                 if (!next && (callchain_param.mode != CHAIN_GRAPH_REL || !remaining))
178                         new_depth_mask &= ~(1 << (depth - 1));
179
180                 /*
181                  * But we keep the older depth mask for the line seperator
182                  * to keep the level link until we reach the last child
183                  */
184                 ret += ipchain__fprintf_graph_line(fp, depth, depth_mask,
185                                                    left_margin);
186                 i = 0;
187                 list_for_each_entry(chain, &child->val, list) {
188                         if (chain->ip >= PERF_CONTEXT_MAX)
189                                 continue;
190                         ret += ipchain__fprintf_graph(fp, chain, depth,
191                                                       new_depth_mask, i++,
192                                                       new_total,
193                                                       cumul,
194                                                       left_margin);
195                 }
196                 ret += __callchain__fprintf_graph(fp, child, new_total,
197                                                   depth + 1,
198                                                   new_depth_mask | (1 << depth),
199                                                   left_margin);
200                 node = next;
201         }
202
203         if (callchain_param.mode == CHAIN_GRAPH_REL &&
204                 remaining && remaining != new_total) {
205
206                 if (!rem_sq_bracket)
207                         return ret;
208
209                 new_depth_mask &= ~(1 << (depth - 1));
210
211                 ret += ipchain__fprintf_graph(fp, &rem_hits, depth,
212                                               new_depth_mask, 0, new_total,
213                                               remaining, left_margin);
214         }
215
216         return ret;
217 }
218
219
220 static size_t
221 callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
222                          u64 total_samples, int left_margin)
223 {
224         struct callchain_list *chain;
225         bool printed = false;
226         int i = 0;
227         int ret = 0;
228
229         list_for_each_entry(chain, &self->val, list) {
230                 if (chain->ip >= PERF_CONTEXT_MAX)
231                         continue;
232
233                 if (!i++ && sort__first_dimension == SORT_SYM)
234                         continue;
235
236                 if (!printed) {
237                         ret += callchain__fprintf_left_margin(fp, left_margin);
238                         ret += fprintf(fp, "|\n");
239                         ret += callchain__fprintf_left_margin(fp, left_margin);
240                         ret += fprintf(fp, "---");
241
242                         left_margin += 3;
243                         printed = true;
244                 } else
245                         ret += callchain__fprintf_left_margin(fp, left_margin);
246
247                 if (chain->sym)
248                         ret += fprintf(fp, " %s\n", chain->sym->name);
249                 else
250                         ret += fprintf(fp, " %p\n", (void *)(long)chain->ip);
251         }
252
253         ret += __callchain__fprintf_graph(fp, self, total_samples, 1, 1, left_margin);
254
255         return ret;
256 }
257
258 static size_t
259 callchain__fprintf_flat(FILE *fp, struct callchain_node *self,
260                         u64 total_samples)
261 {
262         struct callchain_list *chain;
263         size_t ret = 0;
264
265         if (!self)
266                 return 0;
267
268         ret += callchain__fprintf_flat(fp, self->parent, total_samples);
269
270
271         list_for_each_entry(chain, &self->val, list) {
272                 if (chain->ip >= PERF_CONTEXT_MAX)
273                         continue;
274                 if (chain->sym)
275                         ret += fprintf(fp, "                %s\n", chain->sym->name);
276                 else
277                         ret += fprintf(fp, "                %p\n",
278                                         (void *)(long)chain->ip);
279         }
280
281         return ret;
282 }
283
284 static size_t
285 hist_entry_callchain__fprintf(FILE *fp, struct hist_entry *self,
286                               u64 total_samples, int left_margin)
287 {
288         struct rb_node *rb_node;
289         struct callchain_node *chain;
290         size_t ret = 0;
291
292         rb_node = rb_first(&self->sorted_chain);
293         while (rb_node) {
294                 double percent;
295
296                 chain = rb_entry(rb_node, struct callchain_node, rb_node);
297                 percent = chain->hit * 100.0 / total_samples;
298                 switch (callchain_param.mode) {
299                 case CHAIN_FLAT:
300                         ret += percent_color_fprintf(fp, "           %6.2f%%\n",
301                                                      percent);
302                         ret += callchain__fprintf_flat(fp, chain, total_samples);
303                         break;
304                 case CHAIN_GRAPH_ABS: /* Falldown */
305                 case CHAIN_GRAPH_REL:
306                         ret += callchain__fprintf_graph(fp, chain, total_samples,
307                                                         left_margin);
308                 case CHAIN_NONE:
309                 default:
310                         break;
311                 }
312                 ret += fprintf(fp, "\n");
313                 rb_node = rb_next(rb_node);
314         }
315
316         return ret;
317 }
318
319 static size_t
320 hist_entry__fprintf(FILE *fp, struct hist_entry *self, u64 total_samples)
321 {
322         struct sort_entry *se;
323         size_t ret;
324
325         if (exclude_other && !self->parent)
326                 return 0;
327
328         if (total_samples)
329                 ret = percent_color_fprintf(fp,
330                                             field_sep ? "%.2f" : "   %6.2f%%",
331                                         (self->count * 100.0) / total_samples);
332         else
333                 ret = fprintf(fp, field_sep ? "%lld" : "%12lld ", self->count);
334
335         if (show_nr_samples) {
336                 if (field_sep)
337                         fprintf(fp, "%c%lld", *field_sep, self->count);
338                 else
339                         fprintf(fp, "%11lld", self->count);
340         }
341
342         list_for_each_entry(se, &hist_entry__sort_list, list) {
343                 if (se->elide)
344                         continue;
345
346                 fprintf(fp, "%s", field_sep ?: "  ");
347                 ret += se->print(fp, self, se->width ? *se->width : 0);
348         }
349
350         ret += fprintf(fp, "\n");
351
352         if (callchain) {
353                 int left_margin = 0;
354
355                 if (sort__first_dimension == SORT_COMM) {
356                         se = list_first_entry(&hist_entry__sort_list, typeof(*se),
357                                                 list);
358                         left_margin = se->width ? *se->width : 0;
359                         left_margin -= thread__comm_len(self->thread);
360                 }
361
362                 hist_entry_callchain__fprintf(fp, self, total_samples,
363                                               left_margin);
364         }
365
366         return ret;
367 }
368
369 /*
370  *
371  */
372
373 static void dso__calc_col_width(struct dso *self)
374 {
375         if (!col_width_list_str && !field_sep &&
376             (!dso_list || strlist__has_entry(dso_list, self->name))) {
377                 unsigned int slen = strlen(self->name);
378                 if (slen > dsos__col_width)
379                         dsos__col_width = slen;
380         }
381
382         self->slen_calculated = 1;
383 }
384
385 static void thread__comm_adjust(struct thread *self)
386 {
387         char *comm = self->comm;
388
389         if (!col_width_list_str && !field_sep &&
390             (!comm_list || strlist__has_entry(comm_list, comm))) {
391                 unsigned int slen = strlen(comm);
392
393                 if (slen > comms__col_width) {
394                         comms__col_width = slen;
395                         threads__col_width = slen + 6;
396                 }
397         }
398 }
399
/*
 * Set the comm of @self and, on success, update the column widths.
 *
 * Returns 0 on success, or the non-zero result of thread__set_comm().
 */
static int thread__set_comm_adjust(struct thread *self, const char *comm)
{
	int err = thread__set_comm(self, comm);

	if (!err)
		thread__comm_adjust(self);

	return err;
}
411
412
413 static struct symbol *
414 resolve_symbol(struct thread *thread, struct map **mapp, u64 *ipp)
415 {
416         struct map *map = mapp ? *mapp : NULL;
417         u64 ip = *ipp;
418
419         if (map)
420                 goto got_map;
421
422         if (!thread)
423                 return NULL;
424
425         map = thread__find_map(thread, ip);
426         if (map != NULL) {
427                 /*
428                  * We have to do this here as we may have a dso
429                  * with no symbol hit that has a name longer than
430                  * the ones with symbols sampled.
431                  */
432                 if (!sort_dso.elide && !map->dso->slen_calculated)
433                         dso__calc_col_width(map->dso);
434
435                 if (mapp)
436                         *mapp = map;
437 got_map:
438                 ip = map->map_ip(map, ip);
439         } else {
440                 /*
441                  * If this is outside of all known maps,
442                  * and is a negative address, try to look it
443                  * up in the kernel dso, as it might be a
444                  * vsyscall or vdso (which executes in user-mode).
445                  *
446                  * XXX This is nasty, we should have a symbol list in
447                  * the "[vdso]" dso, but for now lets use the old
448                  * trick of looking in the whole kernel symbol list.
449                  */
450                 if ((long long)ip < 0)
451                         return kernel_maps__find_symbol(ip, mapp);
452         }
453         dump_printf(" ...... dso: %s\n",
454                     map ? map->dso->long_name : "<not found>");
455         dump_printf(" ...... map: %Lx -> %Lx\n", *ipp, ip);
456         *ipp  = ip;
457
458         return map ? map->dso->find_symbol(map->dso, ip) : NULL;
459 }
460
461 static int call__match(struct symbol *sym)
462 {
463         if (sym->name && !regexec(&parent_regex, sym->name, 0, NULL, 0))
464                 return 1;
465
466         return 0;
467 }
468
469 static struct symbol **resolve_callchain(struct thread *thread, struct map *map,
470                                          struct ip_callchain *chain,
471                                          struct symbol **parent)
472 {
473         u64 context = PERF_CONTEXT_MAX;
474         struct symbol **syms = NULL;
475         unsigned int i;
476
477         if (callchain) {
478                 syms = calloc(chain->nr, sizeof(*syms));
479                 if (!syms) {
480                         fprintf(stderr, "Can't allocate memory for symbols\n");
481                         exit(-1);
482                 }
483         }
484
485         for (i = 0; i < chain->nr; i++) {
486                 u64 ip = chain->ips[i];
487                 struct symbol *sym = NULL;
488
489                 if (ip >= PERF_CONTEXT_MAX) {
490                         context = ip;
491                         continue;
492                 }
493
494                 switch (context) {
495                 case PERF_CONTEXT_HV:
496                         break;
497                 case PERF_CONTEXT_KERNEL:
498                         sym = kernel_maps__find_symbol(ip, &map);
499                         break;
500                 default:
501                         sym = resolve_symbol(thread, &map, &ip);
502                         break;
503                 }
504
505                 if (sym) {
506                         if (sort__has_parent && !*parent && call__match(sym))
507                                 *parent = sym;
508                         if (!callchain)
509                                 break;
510                         syms[i] = sym;
511                 }
512         }
513
514         return syms;
515 }
516
517 /*
518  * collect histogram counts
519  */
520
521 static int
522 hist_entry__add(struct thread *thread, struct map *map,
523                 struct symbol *sym, u64 ip, struct ip_callchain *chain,
524                 char level, u64 count)
525 {
526         struct symbol **syms = NULL, *parent = NULL;
527         bool hit;
528         struct hist_entry *he;
529
530         if ((sort__has_parent || callchain) && chain)
531                 syms = resolve_callchain(thread, map, chain, &parent);
532
533         he = __hist_entry__add(thread, map, sym, parent,
534                                ip, count, level, &hit);
535         if (he == NULL)
536                 return -ENOMEM;
537
538         if (hit)
539                 he->count += count;
540
541         if (callchain) {
542                 if (!hit)
543                         callchain_init(&he->callchain);
544                 append_chain(&he->callchain, chain, syms);
545                 free(syms);
546         }
547
548         return 0;
549 }
550
551 static size_t output__fprintf(FILE *fp, u64 total_samples)
552 {
553         struct hist_entry *pos;
554         struct sort_entry *se;
555         struct rb_node *nd;
556         size_t ret = 0;
557         unsigned int width;
558         char *col_width = col_width_list_str;
559         int raw_printing_style;
560
561         raw_printing_style = !strcmp(pretty_printing_style, "raw");
562
563         init_rem_hits();
564
565         fprintf(fp, "# Samples: %Ld\n", (u64)total_samples);
566         fprintf(fp, "#\n");
567
568         fprintf(fp, "# Overhead");
569         if (show_nr_samples) {
570                 if (field_sep)
571                         fprintf(fp, "%cSamples", *field_sep);
572                 else
573                         fputs("  Samples  ", fp);
574         }
575         list_for_each_entry(se, &hist_entry__sort_list, list) {
576                 if (se->elide)
577                         continue;
578                 if (field_sep) {
579                         fprintf(fp, "%c%s", *field_sep, se->header);
580                         continue;
581                 }
582                 width = strlen(se->header);
583                 if (se->width) {
584                         if (col_width_list_str) {
585                                 if (col_width) {
586                                         *se->width = atoi(col_width);
587                                         col_width = strchr(col_width, ',');
588                                         if (col_width)
589                                                 ++col_width;
590                                 }
591                         }
592                         width = *se->width = max(*se->width, width);
593                 }
594                 fprintf(fp, "  %*s", width, se->header);
595         }
596         fprintf(fp, "\n");
597
598         if (field_sep)
599                 goto print_entries;
600
601         fprintf(fp, "# ........");
602         if (show_nr_samples)
603                 fprintf(fp, " ..........");
604         list_for_each_entry(se, &hist_entry__sort_list, list) {
605                 unsigned int i;
606
607                 if (se->elide)
608                         continue;
609
610                 fprintf(fp, "  ");
611                 if (se->width)
612                         width = *se->width;
613                 else
614                         width = strlen(se->header);
615                 for (i = 0; i < width; i++)
616                         fprintf(fp, ".");
617         }
618         fprintf(fp, "\n");
619
620         fprintf(fp, "#\n");
621
622 print_entries:
623         for (nd = rb_first(&output_hists); nd; nd = rb_next(nd)) {
624                 pos = rb_entry(nd, struct hist_entry, rb_node);
625                 ret += hist_entry__fprintf(fp, pos, total_samples);
626         }
627
628         if (sort_order == default_sort_order &&
629                         parent_pattern == default_parent_pattern) {
630                 fprintf(fp, "#\n");
631                 fprintf(fp, "# (For a higher level overview, try: perf report --sort comm,dso)\n");
632                 fprintf(fp, "#\n");
633         }
634         fprintf(fp, "\n");
635
636         free(rem_sq_bracket);
637
638         if (show_threads)
639                 perf_read_values_display(fp, &show_threads_values,
640                                          raw_printing_style);
641
642         return ret;
643 }
644
645 static int validate_chain(struct ip_callchain *chain, event_t *event)
646 {
647         unsigned int chain_size;
648
649         chain_size = event->header.size;
650         chain_size -= (unsigned long)&event->ip.__more_data - (unsigned long)event;
651
652         if (chain->nr*sizeof(u64) > chain_size)
653                 return -1;
654
655         return 0;
656 }
657
658 static int
659 process_sample_event(event_t *event, unsigned long offset, unsigned long head)
660 {
661         char level;
662         struct symbol *sym = NULL;
663         u64 ip = event->ip.ip;
664         u64 period = 1;
665         struct map *map = NULL;
666         void *more_data = event->ip.__more_data;
667         struct ip_callchain *chain = NULL;
668         int cpumode;
669         struct thread *thread = threads__findnew(event->ip.pid);
670
671         if (sample_type & PERF_SAMPLE_PERIOD) {
672                 period = *(u64 *)more_data;
673                 more_data += sizeof(u64);
674         }
675
676         dump_printf("%p [%p]: PERF_RECORD_SAMPLE (IP, %d): %d/%d: %p period: %Ld\n",
677                 (void *)(offset + head),
678                 (void *)(long)(event->header.size),
679                 event->header.misc,
680                 event->ip.pid, event->ip.tid,
681                 (void *)(long)ip,
682                 (long long)period);
683
684         if (sample_type & PERF_SAMPLE_CALLCHAIN) {
685                 unsigned int i;
686
687                 chain = (void *)more_data;
688
689                 dump_printf("... chain: nr:%Lu\n", chain->nr);
690
691                 if (validate_chain(chain, event) < 0) {
692                         eprintf("call-chain problem with event, skipping it.\n");
693                         return 0;
694                 }
695
696                 if (dump_trace) {
697                         for (i = 0; i < chain->nr; i++)
698                                 dump_printf("..... %2d: %016Lx\n", i, chain->ips[i]);
699                 }
700         }
701
702         if (thread == NULL) {
703                 eprintf("problem processing %d event, skipping it.\n",
704                         event->header.type);
705                 return -1;
706         }
707
708         dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid);
709
710         if (comm_list && !strlist__has_entry(comm_list, thread->comm))
711                 return 0;
712
713         cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
714
715         if (cpumode == PERF_RECORD_MISC_KERNEL) {
716                 level = 'k';
717                 sym = kernel_maps__find_symbol(ip, &map);
718                 dump_printf(" ...... dso: %s\n",
719                             map ? map->dso->long_name : "<not found>");
720         } else if (cpumode == PERF_RECORD_MISC_USER) {
721                 level = '.';
722                 sym = resolve_symbol(thread, &map, &ip);
723
724         } else {
725                 level = 'H';
726                 dump_printf(" ...... dso: [hypervisor]\n");
727         }
728
729         if (dso_list &&
730             (!map || !map->dso ||
731              !(strlist__has_entry(dso_list, map->dso->short_name) ||
732                (map->dso->short_name != map->dso->long_name &&
733                 strlist__has_entry(dso_list, map->dso->long_name)))))
734                 return 0;
735
736         if (sym_list && sym && !strlist__has_entry(sym_list, sym->name))
737                 return 0;
738
739         if (hist_entry__add(thread, map, sym, ip,
740                             chain, level, period)) {
741                 eprintf("problem incrementing symbol count, skipping event\n");
742                 return -1;
743         }
744
745         total += period;
746
747         return 0;
748 }
749
750 static int
751 process_mmap_event(event_t *event, unsigned long offset, unsigned long head)
752 {
753         struct map *map = map__new(&event->mmap, cwd, cwdlen, 0, NULL, verbose);
754         struct thread *thread = threads__findnew(event->mmap.pid);
755
756         dump_printf("%p [%p]: PERF_RECORD_MMAP %d/%d: [%p(%p) @ %p]: %s\n",
757                 (void *)(offset + head),
758                 (void *)(long)(event->header.size),
759                 event->mmap.pid,
760                 event->mmap.tid,
761                 (void *)(long)event->mmap.start,
762                 (void *)(long)event->mmap.len,
763                 (void *)(long)event->mmap.pgoff,
764                 event->mmap.filename);
765
766         if (thread == NULL || map == NULL) {
767                 dump_printf("problem processing PERF_RECORD_MMAP, skipping event.\n");
768                 return 0;
769         }
770
771         thread__insert_map(thread, map);
772         total_mmap++;
773
774         return 0;
775 }
776
777 static int
778 process_comm_event(event_t *event, unsigned long offset, unsigned long head)
779 {
780         struct thread *thread = threads__findnew(event->comm.pid);
781
782         dump_printf("%p [%p]: PERF_RECORD_COMM: %s:%d\n",
783                 (void *)(offset + head),
784                 (void *)(long)(event->header.size),
785                 event->comm.comm, event->comm.pid);
786
787         if (thread == NULL ||
788             thread__set_comm_adjust(thread, event->comm.comm)) {
789                 dump_printf("problem processing PERF_RECORD_COMM, skipping event.\n");
790                 return -1;
791         }
792         total_comm++;
793
794         return 0;
795 }
796
797 static int
798 process_task_event(event_t *event, unsigned long offset, unsigned long head)
799 {
800         struct thread *thread = threads__findnew(event->fork.pid);
801         struct thread *parent = threads__findnew(event->fork.ppid);
802
803         dump_printf("%p [%p]: PERF_RECORD_%s: (%d:%d):(%d:%d)\n",
804                 (void *)(offset + head),
805                 (void *)(long)(event->header.size),
806                 event->header.type == PERF_RECORD_FORK ? "FORK" : "EXIT",
807                 event->fork.pid, event->fork.tid,
808                 event->fork.ppid, event->fork.ptid);
809
810         /*
811          * A thread clone will have the same PID for both
812          * parent and child.
813          */
814         if (thread == parent)
815                 return 0;
816
817         if (event->header.type == PERF_RECORD_EXIT)
818                 return 0;
819
820         if (!thread || !parent || thread__fork(thread, parent)) {
821                 dump_printf("problem processing PERF_RECORD_FORK, skipping event.\n");
822                 return -1;
823         }
824         total_fork++;
825
826         return 0;
827 }
828
829 static int
830 process_lost_event(event_t *event, unsigned long offset, unsigned long head)
831 {
832         dump_printf("%p [%p]: PERF_RECORD_LOST: id:%Ld: lost:%Ld\n",
833                 (void *)(offset + head),
834                 (void *)(long)(event->header.size),
835                 event->lost.id,
836                 event->lost.lost);
837
838         total_lost += event->lost.lost;
839
840         return 0;
841 }
842
843 static int
844 process_read_event(event_t *event, unsigned long offset, unsigned long head)
845 {
846         struct perf_event_attr *attr;
847
848         attr = perf_header__find_attr(event->read.id, header);
849
850         if (show_threads) {
851                 const char *name = attr ? __event_name(attr->type, attr->config)
852                                    : "unknown";
853                 perf_read_values_add_value(&show_threads_values,
854                                            event->read.pid, event->read.tid,
855                                            event->read.id,
856                                            name,
857                                            event->read.value);
858         }
859
860         dump_printf("%p [%p]: PERF_RECORD_READ: %d %d %s %Lu\n",
861                         (void *)(offset + head),
862                         (void *)(long)(event->header.size),
863                         event->read.pid,
864                         event->read.tid,
865                         attr ? __event_name(attr->type, attr->config)
866                              : "FAIL",
867                         event->read.value);
868
869         return 0;
870 }
871
872 static int sample_type_check(u64 type)
873 {
874         sample_type = type;
875
876         if (!(sample_type & PERF_SAMPLE_CALLCHAIN)) {
877                 if (sort__has_parent) {
878                         fprintf(stderr, "selected --sort parent, but no"
879                                         " callchain data. Did you call"
880                                         " perf record without -g?\n");
881                         return -1;
882                 }
883                 if (callchain) {
884                         fprintf(stderr, "selected -g but no callchain data."
885                                         " Did you call perf record without"
886                                         " -g?\n");
887                         return -1;
888                 }
889         } else if (callchain_param.mode != CHAIN_NONE && !callchain) {
890                         callchain = 1;
891                         if (register_callchain_param(&callchain_param) < 0) {
892                                 fprintf(stderr, "Can't register callchain"
893                                                 " params\n");
894                                 return -1;
895                         }
896         }
897
898         return 0;
899 }
900
901 static struct perf_file_handler file_handler = {
902         .process_sample_event   = process_sample_event,
903         .process_mmap_event     = process_mmap_event,
904         .process_comm_event     = process_comm_event,
905         .process_exit_event     = process_task_event,
906         .process_fork_event     = process_task_event,
907         .process_lost_event     = process_lost_event,
908         .process_read_event     = process_read_event,
909         .sample_type_check      = sample_type_check,
910 };
911
912
913 static int __cmd_report(void)
914 {
915         struct thread *idle;
916         int ret;
917
918         idle = register_idle_thread();
919         thread__comm_adjust(idle);
920
921         if (show_threads)
922                 perf_read_values_init(&show_threads_values);
923
924         register_perf_file_handler(&file_handler);
925
926         ret = mmap_dispatch_perf_file(&header, input_name, force, full_paths,
927                                       &cwdlen, &cwd);
928         if (ret)
929                 return ret;
930
931         dump_printf("      IP events: %10ld\n", total);
932         dump_printf("    mmap events: %10ld\n", total_mmap);
933         dump_printf("    comm events: %10ld\n", total_comm);
934         dump_printf("    fork events: %10ld\n", total_fork);
935         dump_printf("    lost events: %10ld\n", total_lost);
936         dump_printf(" unknown events: %10ld\n", file_handler.total_unknown);
937
938         if (dump_trace)
939                 return 0;
940
941         if (verbose > 3)
942                 threads__fprintf(stdout);
943
944         if (verbose > 2)
945                 dsos__fprintf(stdout);
946
947         collapse__resort();
948         output__resort(total);
949         output__fprintf(stdout, total);
950
951         if (show_threads)
952                 perf_read_values_destroy(&show_threads_values);
953
954         return ret;
955 }
956
957 static int
958 parse_callchain_opt(const struct option *opt __used, const char *arg,
959                     int unset __used)
960 {
961         char *tok;
962         char *endptr;
963
964         callchain = 1;
965
966         if (!arg)
967                 return 0;
968
969         tok = strtok((char *)arg, ",");
970         if (!tok)
971                 return -1;
972
973         /* get the output mode */
974         if (!strncmp(tok, "graph", strlen(arg)))
975                 callchain_param.mode = CHAIN_GRAPH_ABS;
976
977         else if (!strncmp(tok, "flat", strlen(arg)))
978                 callchain_param.mode = CHAIN_FLAT;
979
980         else if (!strncmp(tok, "fractal", strlen(arg)))
981                 callchain_param.mode = CHAIN_GRAPH_REL;
982
983         else if (!strncmp(tok, "none", strlen(arg))) {
984                 callchain_param.mode = CHAIN_NONE;
985                 callchain = 0;
986
987                 return 0;
988         }
989
990         else
991                 return -1;
992
993         /* get the min percentage */
994         tok = strtok(NULL, ",");
995         if (!tok)
996                 goto setup;
997
998         callchain_param.min_percent = strtod(tok, &endptr);
999         if (tok == endptr)
1000                 return -1;
1001
1002 setup:
1003         if (register_callchain_param(&callchain_param) < 0) {
1004                 fprintf(stderr, "Can't register callchain params\n");
1005                 return -1;
1006         }
1007         return 0;
1008 }
1009
/*
 * Usage strings handed to parse_options() and usage_with_options().
 *
 * NOTE(review): a "static" qualifier was commented out on this array,
 * leaving it with external linkage -- presumably something outside this
 * file refers to it; confirm before narrowing the linkage again.
 */
const char * const report_usage[] = {
	"perf report [<options>] <command>",
	NULL,
};
1015
1016 static const struct option options[] = {
1017         OPT_STRING('i', "input", &input_name, "file",
1018                     "input file name"),
1019         OPT_BOOLEAN('v', "verbose", &verbose,
1020                     "be more verbose (show symbol address, etc)"),
1021         OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
1022                     "dump raw trace in ASCII"),
1023         OPT_STRING('k', "vmlinux", &vmlinux_name, "file", "vmlinux pathname"),
1024         OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
1025         OPT_BOOLEAN('m', "modules", &modules,
1026                     "load module symbols - WARNING: use only with -k and LIVE kernel"),
1027         OPT_BOOLEAN('n', "show-nr-samples", &show_nr_samples,
1028                     "Show a column with the number of samples"),
1029         OPT_BOOLEAN('T', "threads", &show_threads,
1030                     "Show per-thread event counters"),
1031         OPT_STRING(0, "pretty", &pretty_printing_style, "key",
1032                    "pretty printing style key: normal raw"),
1033         OPT_STRING('s', "sort", &sort_order, "key[,key2...]",
1034                    "sort by key(s): pid, comm, dso, symbol, parent"),
1035         OPT_BOOLEAN('P', "full-paths", &full_paths,
1036                     "Don't shorten the pathnames taking into account the cwd"),
1037         OPT_STRING('p', "parent", &parent_pattern, "regex",
1038                    "regex filter to identify parent, see: '--sort parent'"),
1039         OPT_BOOLEAN('x', "exclude-other", &exclude_other,
1040                     "Only display entries with parent-match"),
1041         OPT_CALLBACK_DEFAULT('g', "call-graph", NULL, "output_type,min_percent",
1042                      "Display callchains using output_type and min percent threshold. "
1043                      "Default: fractal,0.5", &parse_callchain_opt, callchain_default_opt),
1044         OPT_STRING('d', "dsos", &dso_list_str, "dso[,dso...]",
1045                    "only consider symbols in these dsos"),
1046         OPT_STRING('C', "comms", &comm_list_str, "comm[,comm...]",
1047                    "only consider symbols in these comms"),
1048         OPT_STRING('S', "symbols", &sym_list_str, "symbol[,symbol...]",
1049                    "only consider these symbols"),
1050         OPT_STRING('w', "column-widths", &col_width_list_str,
1051                    "width[,width...]",
1052                    "don't try to adjust column width, use these fixed values"),
1053         OPT_STRING('t', "field-separator", &field_sep, "separator",
1054                    "separator for columns, no spaces will be added between "
1055                    "columns '.' is reserved."),
1056         OPT_END()
1057 };
1058
1059 static void setup_sorting(void)
1060 {
1061         char *tmp, *tok, *str = strdup(sort_order);
1062
1063         for (tok = strtok_r(str, ", ", &tmp);
1064                         tok; tok = strtok_r(NULL, ", ", &tmp)) {
1065                 if (sort_dimension__add(tok) < 0) {
1066                         error("Unknown --sort key: `%s'", tok);
1067                         usage_with_options(report_usage, options);
1068                 }
1069         }
1070
1071         free(str);
1072 }
1073
1074 static void setup_list(struct strlist **list, const char *list_str,
1075                        struct sort_entry *se, const char *list_name,
1076                        FILE *fp)
1077 {
1078         if (list_str) {
1079                 *list = strlist__new(true, list_str);
1080                 if (!*list) {
1081                         fprintf(stderr, "problems parsing %s list\n",
1082                                 list_name);
1083                         exit(129);
1084                 }
1085                 if (strlist__nr_entries(*list) == 1) {
1086                         fprintf(fp, "# %s: %s\n", list_name,
1087                                 strlist__entry(*list, 0)->s);
1088                         se->elide = true;
1089                 }
1090         }
1091 }
1092
1093 int cmd_report(int argc, const char **argv, const char *prefix __used)
1094 {
1095         symbol__init();
1096
1097         argc = parse_options(argc, argv, options, report_usage, 0);
1098
1099         setup_sorting();
1100
1101         if (parent_pattern != default_parent_pattern) {
1102                 sort_dimension__add("parent");
1103                 sort_parent.elide = 1;
1104         } else
1105                 exclude_other = 0;
1106
1107         /*
1108          * Any (unrecognized) arguments left?
1109          */
1110         if (argc)
1111                 usage_with_options(report_usage, options);
1112
1113         setup_pager();
1114
1115         setup_list(&dso_list, dso_list_str, &sort_dso, "dso", stdout);
1116         setup_list(&comm_list, comm_list_str, &sort_comm, "comm", stdout);
1117         setup_list(&sym_list, sym_list_str, &sort_sym, "symbol", stdout);
1118
1119         if (field_sep && *field_sep == '.') {
1120                 fputs("'.' is the only non valid --field-separator argument\n",
1121                       stderr);
1122                 exit(129);
1123         }
1124
1125         return __cmd_report();
1126 }