b75ea770d44316f48e13e2556bbba17ba873fe0d
[cascardo/linux.git] / tools / perf / builtin-diff.c
1 /*
2  * builtin-diff.c
3  *
4  * Builtin diff command: Analyze two perf.data input files, look up and read
5  * DSOs and symbol information, sort them and produce a diff.
6  */
7 #include "builtin.h"
8
9 #include "util/debug.h"
10 #include "util/event.h"
11 #include "util/hist.h"
12 #include "util/evsel.h"
13 #include "util/evlist.h"
14 #include "util/session.h"
15 #include "util/tool.h"
16 #include "util/sort.h"
17 #include "util/symbol.h"
18 #include "util/util.h"
19 #include "util/data.h"
20
21 #include <stdlib.h>
22 #include <math.h>
23
/*
 * Output columns that exist only for 'perf diff'.  The values are used as
 * array indices (columns[], data__file::fmt[]), so
 * PERF_HPP_DIFF__MAX_INDEX has to stay last: it is the column count.
 */
enum {
        PERF_HPP_DIFF__BASELINE = 0,
        PERF_HPP_DIFF__PERIOD,
        PERF_HPP_DIFF__PERIOD_BASELINE,
        PERF_HPP_DIFF__DELTA,
        PERF_HPP_DIFF__RATIO,
        PERF_HPP_DIFF__WEIGHTED_DIFF,
        PERF_HPP_DIFF__FORMULA,

        /* Number of columns, not a column itself. */
        PERF_HPP_DIFF__MAX_INDEX,
};
36
37 struct diff_hpp_fmt {
38         struct perf_hpp_fmt      fmt;
39         int                      idx;
40         char                    *header;
41         int                      header_width;
42 };
43
44 struct data__file {
45         struct perf_session     *session;
46         struct perf_data_file   file;
47         int                      idx;
48         struct hists            *hists;
49         struct diff_hpp_fmt      fmt[PERF_HPP_DIFF__MAX_INDEX];
50 };
51
/* Array of all input files and its length. */
static struct data__file *data__files;
static int data__files_cnt;

/*
 * Iterate over data__files[] starting at index @s.
 *
 * @i: integer lvalue used as the running index
 * @d: 'struct data__file *' lvalue pointing at the current element
 * @s: first index to visit
 *
 * The arguments are parenthesized so that arbitrary expressions can be
 * passed without precedence surprises.
 */
#define data__for_each_file_start(i, d, s)              \
        for ((i) = (s), (d) = &data__files[(s)];        \
             (i) < data__files_cnt;                     \
             (i)++, (d) = &data__files[(i)])

/* Visit every file, baseline (index 0) included. */
#define data__for_each_file(i, d) data__for_each_file_start(i, d, 0)
/* Visit every file except the baseline. */
#define data__for_each_file_new(i, d) data__for_each_file_start(i, d, 1)
62
63 static bool force;
64 static bool show_period;
65 static bool show_formula;
66 static bool show_baseline_only;
67 static unsigned int sort_compute;
68
69 static s64 compute_wdiff_w1;
70 static s64 compute_wdiff_w2;
71
/*
 * Differential computation methods selectable with -c/--compute.
 * COMPUTE_MAX is the number of methods and sizes the lookup tables.
 */
enum {
        COMPUTE_DELTA = 0,
        COMPUTE_RATIO,
        COMPUTE_WEIGHTED_DIFF,

        COMPUTE_MAX,
};
78
79 const char *compute_names[COMPUTE_MAX] = {
80         [COMPUTE_DELTA] = "delta",
81         [COMPUTE_RATIO] = "ratio",
82         [COMPUTE_WEIGHTED_DIFF] = "wdiff",
83 };
84
85 static int compute;
86
87 static int compute_2_hpp[COMPUTE_MAX] = {
88         [COMPUTE_DELTA]         = PERF_HPP_DIFF__DELTA,
89         [COMPUTE_RATIO]         = PERF_HPP_DIFF__RATIO,
90         [COMPUTE_WEIGHTED_DIFF] = PERF_HPP_DIFF__WEIGHTED_DIFF,
91 };
92
93 #define MAX_COL_WIDTH 70
94
95 static struct header_column {
96         const char *name;
97         int width;
98 } columns[PERF_HPP_DIFF__MAX_INDEX] = {
99         [PERF_HPP_DIFF__BASELINE] = {
100                 .name  = "Baseline",
101         },
102         [PERF_HPP_DIFF__PERIOD] = {
103                 .name  = "Period",
104                 .width = 14,
105         },
106         [PERF_HPP_DIFF__PERIOD_BASELINE] = {
107                 .name  = "Base period",
108                 .width = 14,
109         },
110         [PERF_HPP_DIFF__DELTA] = {
111                 .name  = "Delta",
112                 .width = 7,
113         },
114         [PERF_HPP_DIFF__RATIO] = {
115                 .name  = "Ratio",
116                 .width = 14,
117         },
118         [PERF_HPP_DIFF__WEIGHTED_DIFF] = {
119                 .name  = "Weighted diff",
120                 .width = 14,
121         },
122         [PERF_HPP_DIFF__FORMULA] = {
123                 .name  = "Formula",
124                 .width = MAX_COL_WIDTH,
125         }
126 };
127
128 static int setup_compute_opt_wdiff(char *opt)
129 {
130         char *w1_str = opt;
131         char *w2_str;
132
133         int ret = -EINVAL;
134
135         if (!opt)
136                 goto out;
137
138         w2_str = strchr(opt, ',');
139         if (!w2_str)
140                 goto out;
141
142         *w2_str++ = 0x0;
143         if (!*w2_str)
144                 goto out;
145
146         compute_wdiff_w1 = strtol(w1_str, NULL, 10);
147         compute_wdiff_w2 = strtol(w2_str, NULL, 10);
148
149         if (!compute_wdiff_w1 || !compute_wdiff_w2)
150                 goto out;
151
152         pr_debug("compute wdiff w1(%" PRId64 ") w2(%" PRId64 ")\n",
153                   compute_wdiff_w1, compute_wdiff_w2);
154
155         ret = 0;
156
157  out:
158         if (ret)
159                 pr_err("Failed: wrong weight data, use 'wdiff:w1,w2'\n");
160
161         return ret;
162 }
163
164 static int setup_compute_opt(char *opt)
165 {
166         if (compute == COMPUTE_WEIGHTED_DIFF)
167                 return setup_compute_opt_wdiff(opt);
168
169         if (opt) {
170                 pr_err("Failed: extra option specified '%s'", opt);
171                 return -EINVAL;
172         }
173
174         return 0;
175 }
176
177 static int setup_compute(const struct option *opt, const char *str,
178                          int unset __maybe_unused)
179 {
180         int *cp = (int *) opt->value;
181         char *cstr = (char *) str;
182         char buf[50];
183         unsigned i;
184         char *option;
185
186         if (!str) {
187                 *cp = COMPUTE_DELTA;
188                 return 0;
189         }
190
191         option = strchr(str, ':');
192         if (option) {
193                 unsigned len = option++ - str;
194
195                 /*
196                  * The str data are not writeable, so we need
197                  * to use another buffer.
198                  */
199
200                 /* No option value is longer. */
201                 if (len >= sizeof(buf))
202                         return -EINVAL;
203
204                 strncpy(buf, str, len);
205                 buf[len] = 0x0;
206                 cstr = buf;
207         }
208
209         for (i = 0; i < COMPUTE_MAX; i++)
210                 if (!strcmp(cstr, compute_names[i])) {
211                         *cp = i;
212                         return setup_compute_opt(option);
213                 }
214
215         pr_err("Failed: '%s' is not computation method "
216                "(use 'delta','ratio' or 'wdiff')\n", str);
217         return -EINVAL;
218 }
219
220 static double period_percent(struct hist_entry *he, u64 period)
221 {
222         u64 total = hists__total_period(he->hists);
223
224         return (period * 100.0) / total;
225 }
226
227 static double compute_delta(struct hist_entry *he, struct hist_entry *pair)
228 {
229         double old_percent = period_percent(he, he->stat.period);
230         double new_percent = period_percent(pair, pair->stat.period);
231
232         pair->diff.period_ratio_delta = new_percent - old_percent;
233         pair->diff.computed = true;
234         return pair->diff.period_ratio_delta;
235 }
236
237 static double compute_ratio(struct hist_entry *he, struct hist_entry *pair)
238 {
239         double old_period = he->stat.period ?: 1;
240         double new_period = pair->stat.period;
241
242         pair->diff.computed = true;
243         pair->diff.period_ratio = new_period / old_period;
244         return pair->diff.period_ratio;
245 }
246
247 static s64 compute_wdiff(struct hist_entry *he, struct hist_entry *pair)
248 {
249         u64 old_period = he->stat.period;
250         u64 new_period = pair->stat.period;
251
252         pair->diff.computed = true;
253         pair->diff.wdiff = new_period * compute_wdiff_w2 -
254                            old_period * compute_wdiff_w1;
255
256         return pair->diff.wdiff;
257 }
258
259 static int formula_delta(struct hist_entry *he, struct hist_entry *pair,
260                          char *buf, size_t size)
261 {
262         u64 he_total = he->hists->stats.total_period;
263         u64 pair_total = pair->hists->stats.total_period;
264
265         if (symbol_conf.filter_relative) {
266                 he_total = he->hists->stats.total_non_filtered_period;
267                 pair_total = pair->hists->stats.total_non_filtered_period;
268         }
269         return scnprintf(buf, size,
270                          "(%" PRIu64 " * 100 / %" PRIu64 ") - "
271                          "(%" PRIu64 " * 100 / %" PRIu64 ")",
272                          pair->stat.period, pair_total,
273                          he->stat.period, he_total);
274 }
275
276 static int formula_ratio(struct hist_entry *he, struct hist_entry *pair,
277                          char *buf, size_t size)
278 {
279         double old_period = he->stat.period;
280         double new_period = pair->stat.period;
281
282         return scnprintf(buf, size, "%.0F / %.0F", new_period, old_period);
283 }
284
285 static int formula_wdiff(struct hist_entry *he, struct hist_entry *pair,
286                          char *buf, size_t size)
287 {
288         u64 old_period = he->stat.period;
289         u64 new_period = pair->stat.period;
290
291         return scnprintf(buf, size,
292                   "(%" PRIu64 " * " "%" PRId64 ") - (%" PRIu64 " * " "%" PRId64 ")",
293                   new_period, compute_wdiff_w2, old_period, compute_wdiff_w1);
294 }
295
296 static int formula_fprintf(struct hist_entry *he, struct hist_entry *pair,
297                            char *buf, size_t size)
298 {
299         switch (compute) {
300         case COMPUTE_DELTA:
301                 return formula_delta(he, pair, buf, size);
302         case COMPUTE_RATIO:
303                 return formula_ratio(he, pair, buf, size);
304         case COMPUTE_WEIGHTED_DIFF:
305                 return formula_wdiff(he, pair, buf, size);
306         default:
307                 BUG_ON(1);
308         }
309
310         return -1;
311 }
312
313 static int hists__add_entry(struct hists *hists,
314                             struct addr_location *al,
315                             struct perf_sample *sample)
316 {
317         if (__hists__add_entry(hists, al, NULL, NULL, NULL,
318                                sample, true) != NULL)
319                 return 0;
320         return -ENOMEM;
321 }
322
323 static int diff__process_sample_event(struct perf_tool *tool __maybe_unused,
324                                       union perf_event *event,
325                                       struct perf_sample *sample,
326                                       struct perf_evsel *evsel,
327                                       struct machine *machine)
328 {
329         struct addr_location al;
330         struct hists *hists = evsel__hists(evsel);
331         int ret = -1;
332
333         if (machine__resolve(machine, &al, sample) < 0) {
334                 pr_warning("problem processing %d event, skipping it.\n",
335                            event->header.type);
336                 return -1;
337         }
338
339         if (hists__add_entry(hists, &al, sample)) {
340                 pr_warning("problem incrementing symbol period, skipping event\n");
341                 goto out_put;
342         }
343
344         /*
345          * The total_period is updated here before going to the output
346          * tree since normally only the baseline hists will call
347          * hists__output_resort() and precompute needs the total
348          * period in order to sort entries by percentage delta.
349          */
350         hists->stats.total_period += sample->period;
351         if (!al.filtered)
352                 hists->stats.total_non_filtered_period += sample->period;
353         ret = 0;
354 out_put:
355         addr_location__put(&al);
356         return ret;
357 }
358
359 static struct perf_tool tool = {
360         .sample = diff__process_sample_event,
361         .mmap   = perf_event__process_mmap,
362         .mmap2  = perf_event__process_mmap2,
363         .comm   = perf_event__process_comm,
364         .exit   = perf_event__process_exit,
365         .fork   = perf_event__process_fork,
366         .lost   = perf_event__process_lost,
367         .ordered_events = true,
368         .ordering_requires_timestamps = true,
369 };
370
371 static struct perf_evsel *evsel_match(struct perf_evsel *evsel,
372                                       struct perf_evlist *evlist)
373 {
374         struct perf_evsel *e;
375
376         evlist__for_each(evlist, e) {
377                 if (perf_evsel__match2(evsel, e))
378                         return e;
379         }
380
381         return NULL;
382 }
383
384 static void perf_evlist__collapse_resort(struct perf_evlist *evlist)
385 {
386         struct perf_evsel *evsel;
387
388         evlist__for_each(evlist, evsel) {
389                 struct hists *hists = evsel__hists(evsel);
390
391                 hists__collapse_resort(hists, NULL);
392         }
393 }
394
395 static struct data__file *fmt_to_data_file(struct perf_hpp_fmt *fmt)
396 {
397         struct diff_hpp_fmt *dfmt = container_of(fmt, struct diff_hpp_fmt, fmt);
398         void *ptr = dfmt - dfmt->idx;
399         struct data__file *d = container_of(ptr, struct data__file, fmt);
400
401         return d;
402 }
403
404 static struct hist_entry*
405 get_pair_data(struct hist_entry *he, struct data__file *d)
406 {
407         if (hist_entry__has_pairs(he)) {
408                 struct hist_entry *pair;
409
410                 list_for_each_entry(pair, &he->pairs.head, pairs.node)
411                         if (pair->hists == d->hists)
412                                 return pair;
413         }
414
415         return NULL;
416 }
417
418 static struct hist_entry*
419 get_pair_fmt(struct hist_entry *he, struct diff_hpp_fmt *dfmt)
420 {
421         struct data__file *d = fmt_to_data_file(&dfmt->fmt);
422
423         return get_pair_data(he, d);
424 }
425
426 static void hists__baseline_only(struct hists *hists)
427 {
428         struct rb_root *root;
429         struct rb_node *next;
430
431         if (hists__has(hists, need_collapse))
432                 root = &hists->entries_collapsed;
433         else
434                 root = hists->entries_in;
435
436         next = rb_first(root);
437         while (next != NULL) {
438                 struct hist_entry *he = rb_entry(next, struct hist_entry, rb_node_in);
439
440                 next = rb_next(&he->rb_node_in);
441                 if (!hist_entry__next_pair(he)) {
442                         rb_erase(&he->rb_node_in, root);
443                         hist_entry__delete(he);
444                 }
445         }
446 }
447
448 static void hists__precompute(struct hists *hists)
449 {
450         struct rb_root *root;
451         struct rb_node *next;
452
453         if (hists__has(hists, need_collapse))
454                 root = &hists->entries_collapsed;
455         else
456                 root = hists->entries_in;
457
458         next = rb_first(root);
459         while (next != NULL) {
460                 struct hist_entry *he, *pair;
461                 struct data__file *d;
462                 int i;
463
464                 he   = rb_entry(next, struct hist_entry, rb_node_in);
465                 next = rb_next(&he->rb_node_in);
466
467                 data__for_each_file_new(i, d) {
468                         pair = get_pair_data(he, d);
469                         if (!pair)
470                                 continue;
471
472                         switch (compute) {
473                         case COMPUTE_DELTA:
474                                 compute_delta(he, pair);
475                                 break;
476                         case COMPUTE_RATIO:
477                                 compute_ratio(he, pair);
478                                 break;
479                         case COMPUTE_WEIGHTED_DIFF:
480                                 compute_wdiff(he, pair);
481                                 break;
482                         default:
483                                 BUG_ON(1);
484                         }
485                 }
486         }
487 }
488
/*
 * Three-way comparison of two doubles in descending order:
 * -1 when @l is greater, 1 when @l is smaller, 0 otherwise (which
 * includes the case where the values are unordered).
 */
static int64_t cmp_doubles(double l, double r)
{
        return (l < r) - (l > r);
}
498
499 static int64_t
500 __hist_entry__cmp_compute(struct hist_entry *left, struct hist_entry *right,
501                         int c)
502 {
503         switch (c) {
504         case COMPUTE_DELTA:
505         {
506                 double l = left->diff.period_ratio_delta;
507                 double r = right->diff.period_ratio_delta;
508
509                 return cmp_doubles(l, r);
510         }
511         case COMPUTE_RATIO:
512         {
513                 double l = left->diff.period_ratio;
514                 double r = right->diff.period_ratio;
515
516                 return cmp_doubles(l, r);
517         }
518         case COMPUTE_WEIGHTED_DIFF:
519         {
520                 s64 l = left->diff.wdiff;
521                 s64 r = right->diff.wdiff;
522
523                 return r - l;
524         }
525         default:
526                 BUG_ON(1);
527         }
528
529         return 0;
530 }
531
532 static int64_t
533 hist_entry__cmp_compute(struct hist_entry *left, struct hist_entry *right,
534                         int c, int sort_idx)
535 {
536         bool pairs_left  = hist_entry__has_pairs(left);
537         bool pairs_right = hist_entry__has_pairs(right);
538         struct hist_entry *p_right, *p_left;
539
540         if (!pairs_left && !pairs_right)
541                 return 0;
542
543         if (!pairs_left || !pairs_right)
544                 return pairs_left ? -1 : 1;
545
546         p_left  = get_pair_data(left,  &data__files[sort_idx]);
547         p_right = get_pair_data(right, &data__files[sort_idx]);
548
549         if (!p_left && !p_right)
550                 return 0;
551
552         if (!p_left || !p_right)
553                 return p_left ? -1 : 1;
554
555         /*
556          * We have 2 entries of same kind, let's
557          * make the data comparison.
558          */
559         return __hist_entry__cmp_compute(p_left, p_right, c);
560 }
561
562 static int64_t
563 hist_entry__cmp_compute_idx(struct hist_entry *left, struct hist_entry *right,
564                             int c, int sort_idx)
565 {
566         struct hist_entry *p_right, *p_left;
567
568         p_left  = get_pair_data(left,  &data__files[sort_idx]);
569         p_right = get_pair_data(right, &data__files[sort_idx]);
570
571         if (!p_left && !p_right)
572                 return 0;
573
574         if (!p_left || !p_right)
575                 return p_left ? -1 : 1;
576
577         if (c != COMPUTE_DELTA) {
578                 /*
579                  * The delta can be computed without the baseline, but
580                  * others are not.  Put those entries which have no
581                  * values below.
582                  */
583                 if (left->dummy && right->dummy)
584                         return 0;
585
586                 if (left->dummy || right->dummy)
587                         return left->dummy ? 1 : -1;
588         }
589
590         return __hist_entry__cmp_compute(p_left, p_right, c);
591 }
592
593 static int64_t
594 hist_entry__cmp_nop(struct perf_hpp_fmt *fmt __maybe_unused,
595                     struct hist_entry *left __maybe_unused,
596                     struct hist_entry *right __maybe_unused)
597 {
598         return 0;
599 }
600
601 static int64_t
602 hist_entry__cmp_baseline(struct perf_hpp_fmt *fmt __maybe_unused,
603                          struct hist_entry *left, struct hist_entry *right)
604 {
605         if (left->stat.period == right->stat.period)
606                 return 0;
607         return left->stat.period > right->stat.period ? 1 : -1;
608 }
609
610 static int64_t
611 hist_entry__cmp_delta(struct perf_hpp_fmt *fmt,
612                       struct hist_entry *left, struct hist_entry *right)
613 {
614         struct data__file *d = fmt_to_data_file(fmt);
615
616         return hist_entry__cmp_compute(right, left, COMPUTE_DELTA, d->idx);
617 }
618
619 static int64_t
620 hist_entry__cmp_ratio(struct perf_hpp_fmt *fmt,
621                       struct hist_entry *left, struct hist_entry *right)
622 {
623         struct data__file *d = fmt_to_data_file(fmt);
624
625         return hist_entry__cmp_compute(right, left, COMPUTE_RATIO, d->idx);
626 }
627
628 static int64_t
629 hist_entry__cmp_wdiff(struct perf_hpp_fmt *fmt,
630                       struct hist_entry *left, struct hist_entry *right)
631 {
632         struct data__file *d = fmt_to_data_file(fmt);
633
634         return hist_entry__cmp_compute(right, left, COMPUTE_WEIGHTED_DIFF, d->idx);
635 }
636
637 static int64_t
638 hist_entry__cmp_delta_idx(struct perf_hpp_fmt *fmt __maybe_unused,
639                           struct hist_entry *left, struct hist_entry *right)
640 {
641         return hist_entry__cmp_compute_idx(right, left, COMPUTE_DELTA,
642                                            sort_compute);
643 }
644
645 static int64_t
646 hist_entry__cmp_ratio_idx(struct perf_hpp_fmt *fmt __maybe_unused,
647                           struct hist_entry *left, struct hist_entry *right)
648 {
649         return hist_entry__cmp_compute_idx(right, left, COMPUTE_RATIO,
650                                            sort_compute);
651 }
652
653 static int64_t
654 hist_entry__cmp_wdiff_idx(struct perf_hpp_fmt *fmt __maybe_unused,
655                           struct hist_entry *left, struct hist_entry *right)
656 {
657         return hist_entry__cmp_compute_idx(right, left, COMPUTE_WEIGHTED_DIFF,
658                                            sort_compute);
659 }
660
661 static void hists__process(struct hists *hists)
662 {
663         if (show_baseline_only)
664                 hists__baseline_only(hists);
665
666         hists__precompute(hists);
667         hists__output_resort(hists, NULL);
668
669         hists__fprintf(hists, true, 0, 0, 0, stdout,
670                        symbol_conf.use_callchain);
671 }
672
673 static void data__fprintf(void)
674 {
675         struct data__file *d;
676         int i;
677
678         fprintf(stdout, "# Data files:\n");
679
680         data__for_each_file(i, d)
681                 fprintf(stdout, "#  [%d] %s %s\n",
682                         d->idx, d->file.path,
683                         !d->idx ? "(Baseline)" : "");
684
685         fprintf(stdout, "#\n");
686 }
687
688 static void data_process(void)
689 {
690         struct perf_evlist *evlist_base = data__files[0].session->evlist;
691         struct perf_evsel *evsel_base;
692         bool first = true;
693
694         evlist__for_each(evlist_base, evsel_base) {
695                 struct hists *hists_base = evsel__hists(evsel_base);
696                 struct data__file *d;
697                 int i;
698
699                 data__for_each_file_new(i, d) {
700                         struct perf_evlist *evlist = d->session->evlist;
701                         struct perf_evsel *evsel;
702                         struct hists *hists;
703
704                         evsel = evsel_match(evsel_base, evlist);
705                         if (!evsel)
706                                 continue;
707
708                         hists = evsel__hists(evsel);
709                         d->hists = hists;
710
711                         hists__match(hists_base, hists);
712
713                         if (!show_baseline_only)
714                                 hists__link(hists_base, hists);
715                 }
716
717                 fprintf(stdout, "%s# Event '%s'\n#\n", first ? "" : "\n",
718                         perf_evsel__name(evsel_base));
719
720                 first = false;
721
722                 if (verbose || data__files_cnt > 2)
723                         data__fprintf();
724
725                 /* Don't sort callchain for perf diff */
726                 perf_evsel__reset_sample_bit(evsel_base, CALLCHAIN);
727
728                 hists__process(hists_base);
729         }
730 }
731
732 static void data__free(struct data__file *d)
733 {
734         int col;
735
736         for (col = 0; col < PERF_HPP_DIFF__MAX_INDEX; col++) {
737                 struct diff_hpp_fmt *fmt = &d->fmt[col];
738
739                 zfree(&fmt->header);
740         }
741 }
742
743 static int __cmd_diff(void)
744 {
745         struct data__file *d;
746         int ret = -EINVAL, i;
747
748         data__for_each_file(i, d) {
749                 d->session = perf_session__new(&d->file, false, &tool);
750                 if (!d->session) {
751                         pr_err("Failed to open %s\n", d->file.path);
752                         ret = -1;
753                         goto out_delete;
754                 }
755
756                 ret = perf_session__process_events(d->session);
757                 if (ret) {
758                         pr_err("Failed to process %s\n", d->file.path);
759                         goto out_delete;
760                 }
761
762                 perf_evlist__collapse_resort(d->session->evlist);
763         }
764
765         data_process();
766
767  out_delete:
768         data__for_each_file(i, d) {
769                 if (d->session)
770                         perf_session__delete(d->session);
771
772                 data__free(d);
773         }
774
775         free(data__files);
776         return ret;
777 }
778
/* Usage lines for the command, terminated by a NULL entry. */
static const char * const diff_usage[] = {
        [0] = "perf diff [<options>] [old_file] [new_file]",
        [1] = NULL,
};
783
784 static const struct option options[] = {
785         OPT_INCR('v', "verbose", &verbose,
786                     "be more verbose (show symbol address, etc)"),
787         OPT_BOOLEAN('b', "baseline-only", &show_baseline_only,
788                     "Show only items with match in baseline"),
789         OPT_CALLBACK('c', "compute", &compute,
790                      "delta,ratio,wdiff:w1,w2 (default delta)",
791                      "Entries differential computation selection",
792                      setup_compute),
793         OPT_BOOLEAN('p', "period", &show_period,
794                     "Show period values."),
795         OPT_BOOLEAN('F', "formula", &show_formula,
796                     "Show formula."),
797         OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
798                     "dump raw trace in ASCII"),
799         OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
800         OPT_STRING(0, "kallsyms", &symbol_conf.kallsyms_name,
801                    "file", "kallsyms pathname"),
802         OPT_BOOLEAN('m', "modules", &symbol_conf.use_modules,
803                     "load module symbols - WARNING: use only with -k and LIVE kernel"),
804         OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]",
805                    "only consider symbols in these dsos"),
806         OPT_STRING('C', "comms", &symbol_conf.comm_list_str, "comm[,comm...]",
807                    "only consider symbols in these comms"),
808         OPT_STRING('S', "symbols", &symbol_conf.sym_list_str, "symbol[,symbol...]",
809                    "only consider these symbols"),
810         OPT_STRING('s', "sort", &sort_order, "key[,key2...]",
811                    "sort by key(s): pid, comm, dso, symbol, parent, cpu, srcline, ..."
812                    " Please refer the man page for the complete list."),
813         OPT_STRING_NOEMPTY('t', "field-separator", &symbol_conf.field_sep, "separator",
814                    "separator for columns, no spaces will be added between "
815                    "columns '.' is reserved."),
816         OPT_CALLBACK(0, "symfs", NULL, "directory",
817                      "Look for files with symbols relative to this directory",
818                      symbol__config_symfs),
819         OPT_UINTEGER('o', "order", &sort_compute, "Specify compute sorting."),
820         OPT_CALLBACK(0, "percentage", NULL, "relative|absolute",
821                      "How to display percentage of filtered entries", parse_filter_percentage),
822         OPT_END()
823 };
824
825 static double baseline_percent(struct hist_entry *he)
826 {
827         u64 total = hists__total_period(he->hists);
828
829         return 100.0 * he->stat.period / total;
830 }
831
832 static int hpp__color_baseline(struct perf_hpp_fmt *fmt,
833                                struct perf_hpp *hpp, struct hist_entry *he)
834 {
835         struct diff_hpp_fmt *dfmt =
836                 container_of(fmt, struct diff_hpp_fmt, fmt);
837         double percent = baseline_percent(he);
838         char pfmt[20] = " ";
839
840         if (!he->dummy) {
841                 scnprintf(pfmt, 20, "%%%d.2f%%%%", dfmt->header_width - 1);
842                 return percent_color_snprintf(hpp->buf, hpp->size,
843                                               pfmt, percent);
844         } else
845                 return scnprintf(hpp->buf, hpp->size, "%*s",
846                                  dfmt->header_width, pfmt);
847 }
848
849 static int hpp__entry_baseline(struct hist_entry *he, char *buf, size_t size)
850 {
851         double percent = baseline_percent(he);
852         const char *fmt = symbol_conf.field_sep ? "%.2f" : "%6.2f%%";
853         int ret = 0;
854
855         if (!he->dummy)
856                 ret = scnprintf(buf, size, fmt, percent);
857
858         return ret;
859 }
860
861 static int __hpp__color_compare(struct perf_hpp_fmt *fmt,
862                                 struct perf_hpp *hpp, struct hist_entry *he,
863                                 int comparison_method)
864 {
865         struct diff_hpp_fmt *dfmt =
866                 container_of(fmt, struct diff_hpp_fmt, fmt);
867         struct hist_entry *pair = get_pair_fmt(he, dfmt);
868         double diff;
869         s64 wdiff;
870         char pfmt[20] = " ";
871
872         if (!pair)
873                 goto no_print;
874
875         switch (comparison_method) {
876         case COMPUTE_DELTA:
877                 if (pair->diff.computed)
878                         diff = pair->diff.period_ratio_delta;
879                 else
880                         diff = compute_delta(he, pair);
881
882                 scnprintf(pfmt, 20, "%%%+d.2f%%%%", dfmt->header_width - 1);
883                 return percent_color_snprintf(hpp->buf, hpp->size,
884                                         pfmt, diff);
885         case COMPUTE_RATIO:
886                 if (he->dummy)
887                         goto dummy_print;
888                 if (pair->diff.computed)
889                         diff = pair->diff.period_ratio;
890                 else
891                         diff = compute_ratio(he, pair);
892
893                 scnprintf(pfmt, 20, "%%%d.6f", dfmt->header_width);
894                 return value_color_snprintf(hpp->buf, hpp->size,
895                                         pfmt, diff);
896         case COMPUTE_WEIGHTED_DIFF:
897                 if (he->dummy)
898                         goto dummy_print;
899                 if (pair->diff.computed)
900                         wdiff = pair->diff.wdiff;
901                 else
902                         wdiff = compute_wdiff(he, pair);
903
904                 scnprintf(pfmt, 20, "%%14ld", dfmt->header_width);
905                 return color_snprintf(hpp->buf, hpp->size,
906                                 get_percent_color(wdiff),
907                                 pfmt, wdiff);
908         default:
909                 BUG_ON(1);
910         }
911 dummy_print:
912         return scnprintf(hpp->buf, hpp->size, "%*s",
913                         dfmt->header_width, "N/A");
914 no_print:
915         return scnprintf(hpp->buf, hpp->size, "%*s",
916                         dfmt->header_width, pfmt);
917 }
918
919 static int hpp__color_delta(struct perf_hpp_fmt *fmt,
920                         struct perf_hpp *hpp, struct hist_entry *he)
921 {
922         return __hpp__color_compare(fmt, hpp, he, COMPUTE_DELTA);
923 }
924
925 static int hpp__color_ratio(struct perf_hpp_fmt *fmt,
926                         struct perf_hpp *hpp, struct hist_entry *he)
927 {
928         return __hpp__color_compare(fmt, hpp, he, COMPUTE_RATIO);
929 }
930
931 static int hpp__color_wdiff(struct perf_hpp_fmt *fmt,
932                         struct perf_hpp *hpp, struct hist_entry *he)
933 {
934         return __hpp__color_compare(fmt, hpp, he, COMPUTE_WEIGHTED_DIFF);
935 }
936
937 static void
938 hpp__entry_unpair(struct hist_entry *he, int idx, char *buf, size_t size)
939 {
940         switch (idx) {
941         case PERF_HPP_DIFF__PERIOD_BASELINE:
942                 scnprintf(buf, size, "%" PRIu64, he->stat.period);
943                 break;
944
945         default:
946                 break;
947         }
948 }
949
950 static void
951 hpp__entry_pair(struct hist_entry *he, struct hist_entry *pair,
952                 int idx, char *buf, size_t size)
953 {
954         double diff;
955         double ratio;
956         s64 wdiff;
957
958         switch (idx) {
959         case PERF_HPP_DIFF__DELTA:
960                 if (pair->diff.computed)
961                         diff = pair->diff.period_ratio_delta;
962                 else
963                         diff = compute_delta(he, pair);
964
965                 scnprintf(buf, size, "%+4.2F%%", diff);
966                 break;
967
968         case PERF_HPP_DIFF__RATIO:
969                 /* No point for ratio number if we are dummy.. */
970                 if (he->dummy) {
971                         scnprintf(buf, size, "N/A");
972                         break;
973                 }
974
975                 if (pair->diff.computed)
976                         ratio = pair->diff.period_ratio;
977                 else
978                         ratio = compute_ratio(he, pair);
979
980                 if (ratio > 0.0)
981                         scnprintf(buf, size, "%14.6F", ratio);
982                 break;
983
984         case PERF_HPP_DIFF__WEIGHTED_DIFF:
985                 /* No point for wdiff number if we are dummy.. */
986                 if (he->dummy) {
987                         scnprintf(buf, size, "N/A");
988                         break;
989                 }
990
991                 if (pair->diff.computed)
992                         wdiff = pair->diff.wdiff;
993                 else
994                         wdiff = compute_wdiff(he, pair);
995
996                 if (wdiff != 0)
997                         scnprintf(buf, size, "%14ld", wdiff);
998                 break;
999
1000         case PERF_HPP_DIFF__FORMULA:
1001                 formula_fprintf(he, pair, buf, size);
1002                 break;
1003
1004         case PERF_HPP_DIFF__PERIOD:
1005                 scnprintf(buf, size, "%" PRIu64, pair->stat.period);
1006                 break;
1007
1008         default:
1009                 BUG_ON(1);
1010         };
1011 }
1012
1013 static void
1014 __hpp__entry_global(struct hist_entry *he, struct diff_hpp_fmt *dfmt,
1015                     char *buf, size_t size)
1016 {
1017         struct hist_entry *pair = get_pair_fmt(he, dfmt);
1018         int idx = dfmt->idx;
1019
1020         /* baseline is special */
1021         if (idx == PERF_HPP_DIFF__BASELINE)
1022                 hpp__entry_baseline(he, buf, size);
1023         else {
1024                 if (pair)
1025                         hpp__entry_pair(he, pair, idx, buf, size);
1026                 else
1027                         hpp__entry_unpair(he, idx, buf, size);
1028         }
1029 }
1030
1031 static int hpp__entry_global(struct perf_hpp_fmt *_fmt, struct perf_hpp *hpp,
1032                              struct hist_entry *he)
1033 {
1034         struct diff_hpp_fmt *dfmt =
1035                 container_of(_fmt, struct diff_hpp_fmt, fmt);
1036         char buf[MAX_COL_WIDTH] = " ";
1037
1038         __hpp__entry_global(he, dfmt, buf, MAX_COL_WIDTH);
1039
1040         if (symbol_conf.field_sep)
1041                 return scnprintf(hpp->buf, hpp->size, "%s", buf);
1042         else
1043                 return scnprintf(hpp->buf, hpp->size, "%*s",
1044                                  dfmt->header_width, buf);
1045 }
1046
1047 static int hpp__header(struct perf_hpp_fmt *fmt, struct perf_hpp *hpp,
1048                        struct hists *hists __maybe_unused)
1049 {
1050         struct diff_hpp_fmt *dfmt =
1051                 container_of(fmt, struct diff_hpp_fmt, fmt);
1052
1053         BUG_ON(!dfmt->header);
1054         return scnprintf(hpp->buf, hpp->size, dfmt->header);
1055 }
1056
1057 static int hpp__width(struct perf_hpp_fmt *fmt,
1058                       struct perf_hpp *hpp __maybe_unused,
1059                       struct perf_evsel *evsel __maybe_unused)
1060 {
1061         struct diff_hpp_fmt *dfmt =
1062                 container_of(fmt, struct diff_hpp_fmt, fmt);
1063
1064         BUG_ON(dfmt->header_width <= 0);
1065         return dfmt->header_width;
1066 }
1067
1068 static void init_header(struct data__file *d, struct diff_hpp_fmt *dfmt)
1069 {
1070 #define MAX_HEADER_NAME 100
1071         char buf_indent[MAX_HEADER_NAME];
1072         char buf[MAX_HEADER_NAME];
1073         const char *header = NULL;
1074         int width = 0;
1075
1076         BUG_ON(dfmt->idx >= PERF_HPP_DIFF__MAX_INDEX);
1077         header = columns[dfmt->idx].name;
1078         width  = columns[dfmt->idx].width;
1079
1080         /* Only our defined HPP fmts should appear here. */
1081         BUG_ON(!header);
1082
1083         if (data__files_cnt > 2)
1084                 scnprintf(buf, MAX_HEADER_NAME, "%s/%d", header, d->idx);
1085
1086 #define NAME (data__files_cnt > 2 ? buf : header)
1087         dfmt->header_width = width;
1088         width = (int) strlen(NAME);
1089         if (dfmt->header_width < width)
1090                 dfmt->header_width = width;
1091
1092         scnprintf(buf_indent, MAX_HEADER_NAME, "%*s",
1093                   dfmt->header_width, NAME);
1094
1095         dfmt->header = strdup(buf_indent);
1096 #undef MAX_HEADER_NAME
1097 #undef NAME
1098 }
1099
1100 static void data__hpp_register(struct data__file *d, int idx)
1101 {
1102         struct diff_hpp_fmt *dfmt = &d->fmt[idx];
1103         struct perf_hpp_fmt *fmt = &dfmt->fmt;
1104
1105         dfmt->idx = idx;
1106
1107         fmt->header = hpp__header;
1108         fmt->width  = hpp__width;
1109         fmt->entry  = hpp__entry_global;
1110         fmt->cmp    = hist_entry__cmp_nop;
1111         fmt->collapse = hist_entry__cmp_nop;
1112
1113         /* TODO more colors */
1114         switch (idx) {
1115         case PERF_HPP_DIFF__BASELINE:
1116                 fmt->color = hpp__color_baseline;
1117                 fmt->sort  = hist_entry__cmp_baseline;
1118                 break;
1119         case PERF_HPP_DIFF__DELTA:
1120                 fmt->color = hpp__color_delta;
1121                 fmt->sort  = hist_entry__cmp_delta;
1122                 break;
1123         case PERF_HPP_DIFF__RATIO:
1124                 fmt->color = hpp__color_ratio;
1125                 fmt->sort  = hist_entry__cmp_ratio;
1126                 break;
1127         case PERF_HPP_DIFF__WEIGHTED_DIFF:
1128                 fmt->color = hpp__color_wdiff;
1129                 fmt->sort  = hist_entry__cmp_wdiff;
1130                 break;
1131         default:
1132                 fmt->sort  = hist_entry__cmp_nop;
1133                 break;
1134         }
1135
1136         init_header(d, dfmt);
1137         perf_hpp__column_register(fmt);
1138         perf_hpp__register_sort_field(fmt);
1139 }
1140
1141 static int ui_init(void)
1142 {
1143         struct data__file *d;
1144         struct perf_hpp_fmt *fmt;
1145         int i;
1146
1147         data__for_each_file(i, d) {
1148
1149                 /*
1150                  * Baseline or compute realted columns:
1151                  *
1152                  *   PERF_HPP_DIFF__BASELINE
1153                  *   PERF_HPP_DIFF__DELTA
1154                  *   PERF_HPP_DIFF__RATIO
1155                  *   PERF_HPP_DIFF__WEIGHTED_DIFF
1156                  */
1157                 data__hpp_register(d, i ? compute_2_hpp[compute] :
1158                                           PERF_HPP_DIFF__BASELINE);
1159
1160                 /*
1161                  * And the rest:
1162                  *
1163                  * PERF_HPP_DIFF__FORMULA
1164                  * PERF_HPP_DIFF__PERIOD
1165                  * PERF_HPP_DIFF__PERIOD_BASELINE
1166                  */
1167                 if (show_formula && i)
1168                         data__hpp_register(d, PERF_HPP_DIFF__FORMULA);
1169
1170                 if (show_period)
1171                         data__hpp_register(d, i ? PERF_HPP_DIFF__PERIOD :
1172                                                   PERF_HPP_DIFF__PERIOD_BASELINE);
1173         }
1174
1175         if (!sort_compute)
1176                 return 0;
1177
1178         /*
1179          * Prepend an fmt to sort on columns at 'sort_compute' first.
1180          * This fmt is added only to the sort list but not to the
1181          * output fields list.
1182          *
1183          * Note that this column (data) can be compared twice - one
1184          * for this 'sort_compute' fmt and another for the normal
1185          * diff_hpp_fmt.  But it shouldn't a problem as most entries
1186          * will be sorted out by first try or baseline and comparing
1187          * is not a costly operation.
1188          */
1189         fmt = zalloc(sizeof(*fmt));
1190         if (fmt == NULL) {
1191                 pr_err("Memory allocation failed\n");
1192                 return -1;
1193         }
1194
1195         fmt->cmp      = hist_entry__cmp_nop;
1196         fmt->collapse = hist_entry__cmp_nop;
1197
1198         switch (compute) {
1199         case COMPUTE_DELTA:
1200                 fmt->sort = hist_entry__cmp_delta_idx;
1201                 break;
1202         case COMPUTE_RATIO:
1203                 fmt->sort = hist_entry__cmp_ratio_idx;
1204                 break;
1205         case COMPUTE_WEIGHTED_DIFF:
1206                 fmt->sort = hist_entry__cmp_wdiff_idx;
1207                 break;
1208         default:
1209                 BUG_ON(1);
1210         }
1211
1212         perf_hpp__register_sort_field(fmt);
1213         return 0;
1214 }
1215
1216 static int data_init(int argc, const char **argv)
1217 {
1218         struct data__file *d;
1219         static const char *defaults[] = {
1220                 "perf.data.old",
1221                 "perf.data",
1222         };
1223         bool use_default = true;
1224         int i;
1225
1226         data__files_cnt = 2;
1227
1228         if (argc) {
1229                 if (argc == 1)
1230                         defaults[1] = argv[0];
1231                 else {
1232                         data__files_cnt = argc;
1233                         use_default = false;
1234                 }
1235         } else if (perf_guest) {
1236                 defaults[0] = "perf.data.host";
1237                 defaults[1] = "perf.data.guest";
1238         }
1239
1240         if (sort_compute >= (unsigned int) data__files_cnt) {
1241                 pr_err("Order option out of limit.\n");
1242                 return -EINVAL;
1243         }
1244
1245         data__files = zalloc(sizeof(*data__files) * data__files_cnt);
1246         if (!data__files)
1247                 return -ENOMEM;
1248
1249         data__for_each_file(i, d) {
1250                 struct perf_data_file *file = &d->file;
1251
1252                 file->path  = use_default ? defaults[i] : argv[i];
1253                 file->mode  = PERF_DATA_MODE_READ,
1254                 file->force = force,
1255
1256                 d->idx  = i;
1257         }
1258
1259         return 0;
1260 }
1261
1262 int cmd_diff(int argc, const char **argv, const char *prefix __maybe_unused)
1263 {
1264         int ret = hists__init();
1265
1266         if (ret < 0)
1267                 return ret;
1268
1269         argc = parse_options(argc, argv, options, diff_usage, 0);
1270
1271         if (symbol__init(NULL) < 0)
1272                 return -1;
1273
1274         if (data_init(argc, argv) < 0)
1275                 return -1;
1276
1277         if (ui_init() < 0)
1278                 return -1;
1279
1280         sort__mode = SORT_MODE__DIFF;
1281
1282         if (setup_sorting(NULL) < 0)
1283                 usage_with_options(diff_usage, options);
1284
1285         setup_pager();
1286
1287         sort__setup_elide(NULL);
1288
1289         return __cmd_diff();
1290 }