Re: [PATCH v6 7/7] perf diff: Support hot streams comparison

From: Arnaldo Carvalho de Melo
Date: Thu Sep 17 2020 - 16:26:14 EST


Em Fri, Sep 11, 2020 at 04:03:53PM +0800, Jin Yao escreveu:
> This patch enables perf-diff with "--stream" option.
>
> "--stream": Enable hot streams comparison
>
> Now let's see examples.
>
> perf record -b ... Generate perf.data.old with branch data
> perf record -b ... Generate perf.data with branch data
> perf diff --stream
>
> [ Matched hot streams ]
>
> hot chain pair 1:
> cycles: 1, hits: 27.77% cycles: 1, hits: 9.24%
> --------------------------- --------------------------
> main div.c:39 main div.c:39
> main div.c:44 main div.c:44
>
> hot chain pair 2:
> cycles: 34, hits: 20.06% cycles: 27, hits: 16.98%
> --------------------------- --------------------------
> __random_r random_r.c:360 __random_r random_r.c:360

Would it be interesting to get the associated source code and show right below
these file:number lines?

- Arnaldo

> __random_r random_r.c:388 __random_r random_r.c:388
> __random_r random_r.c:388 __random_r random_r.c:388
> __random_r random_r.c:380 __random_r random_r.c:380
> __random_r random_r.c:357 __random_r random_r.c:357
> __random random.c:293 __random random.c:293
> __random random.c:293 __random random.c:293
> __random random.c:291 __random random.c:291
> __random random.c:291 __random random.c:291
> __random random.c:291 __random random.c:291
> __random random.c:288 __random random.c:288
> rand rand.c:27 rand rand.c:27
> rand rand.c:26 rand rand.c:26
> rand@plt rand@plt
> rand@plt rand@plt
> compute_flag div.c:25 compute_flag div.c:25
> compute_flag div.c:22 compute_flag div.c:22
> main div.c:40 main div.c:40
> main div.c:40 main div.c:40
> main div.c:39 main div.c:39
>
> hot chain pair 3:
> cycles: 9, hits: 4.48% cycles: 6, hits: 4.51%
> --------------------------- --------------------------
> __random_r random_r.c:360 __random_r random_r.c:360
> __random_r random_r.c:388 __random_r random_r.c:388
> __random_r random_r.c:388 __random_r random_r.c:388
> __random_r random_r.c:380 __random_r random_r.c:380
>
> [ Hot streams in old perf data only ]
>
> hot chain 1:
> cycles: 18, hits: 6.75%
> --------------------------
> __random_r random_r.c:360
> __random_r random_r.c:388
> __random_r random_r.c:388
> __random_r random_r.c:380
> __random_r random_r.c:357
> __random random.c:293
> __random random.c:293
> __random random.c:291
> __random random.c:291
> __random random.c:291
> __random random.c:288
> rand rand.c:27
> rand rand.c:26
> rand@plt
> rand@plt
> compute_flag div.c:25
> compute_flag div.c:22
> main div.c:40
>
> hot chain 2:
> cycles: 29, hits: 2.78%
> --------------------------
> compute_flag div.c:22
> main div.c:40
> main div.c:40
> main div.c:39
>
> [ Hot streams in new perf data only ]
>
> hot chain 1:
> cycles: 4, hits: 4.54%
> --------------------------
> main div.c:42
> compute_flag div.c:28
>
> hot chain 2:
> cycles: 5, hits: 3.51%
> --------------------------
> main div.c:39
> main div.c:44
> main div.c:42
> compute_flag div.c:28
>
> Signed-off-by: Jin Yao <yao.jin@xxxxxxxxxxxxxxx>
> ---
> v6:
> - Rebase to perf/core
>
> v5:
> - Remove enum stream_type
> - Rebase to perf/core
>
> v4:
> - Remove the "--before" and "--after" options since they are for
> source line based comparison. In this patchset, we will not
> support source line based comparison.
>
> tools/perf/Documentation/perf-diff.txt | 4 +
> tools/perf/builtin-diff.c | 133 ++++++++++++++++++++++---
> 2 files changed, 124 insertions(+), 13 deletions(-)
>
> diff --git a/tools/perf/Documentation/perf-diff.txt b/tools/perf/Documentation/perf-diff.txt
> index f50ca0fef0a4..be65bd55ab2a 100644
> --- a/tools/perf/Documentation/perf-diff.txt
> +++ b/tools/perf/Documentation/perf-diff.txt
> @@ -182,6 +182,10 @@ OPTIONS
> --tid=::
> Only diff samples for given thread ID (comma separated list).
>
> +--stream::
> + Enable hot streams comparison. Stream can be a callchain which is
> + aggregated by the branch records from samples.
> +
> COMPARISON
> ----------
> The comparison is governed by the baseline file. The baseline perf.data
> diff --git a/tools/perf/builtin-diff.c b/tools/perf/builtin-diff.c
> index f8c9bdd8269a..d6db473cd010 100644
> --- a/tools/perf/builtin-diff.c
> +++ b/tools/perf/builtin-diff.c
> @@ -25,6 +25,7 @@
> #include "util/map.h"
> #include "util/spark.h"
> #include "util/block-info.h"
> +#include "util/stream.h"
> #include <linux/err.h>
> #include <linux/zalloc.h>
> #include <subcmd/pager.h>
> @@ -42,6 +43,7 @@ struct perf_diff {
> int range_size;
> int range_num;
> bool has_br_stack;
> + bool stream;
> };
>
> /* Diff command specific HPP columns. */
> @@ -72,6 +74,8 @@ struct data__file {
> struct perf_data data;
> int idx;
> struct hists *hists;
> + struct evsel_streams *evsel_streams;
> + int nr_evsel_streams;
> struct diff_hpp_fmt fmt[PERF_HPP_DIFF__MAX_INDEX];
> };
>
> @@ -106,6 +110,7 @@ enum {
> COMPUTE_DELTA_ABS,
> COMPUTE_CYCLES,
> COMPUTE_MAX,
> + COMPUTE_STREAM, /* After COMPUTE_MAX to avoid use current compute arrays */
> };
>
> const char *compute_names[COMPUTE_MAX] = {
> @@ -393,6 +398,11 @@ static int diff__process_sample_event(struct perf_tool *tool,
> struct perf_diff *pdiff = container_of(tool, struct perf_diff, tool);
> struct addr_location al;
> struct hists *hists = evsel__hists(evsel);
> + struct hist_entry_iter iter = {
> + .evsel = evsel,
> + .sample = sample,
> + .ops = &hist_iter_normal,
> + };
> int ret = -1;
>
> if (perf_time__ranges_skip_sample(pdiff->ptime_range, pdiff->range_num,
> @@ -411,14 +421,8 @@ static int diff__process_sample_event(struct perf_tool *tool,
> goto out_put;
> }
>
> - if (compute != COMPUTE_CYCLES) {
> - if (!hists__add_entry(hists, &al, NULL, NULL, NULL, sample,
> - true)) {
> - pr_warning("problem incrementing symbol period, "
> - "skipping event\n");
> - goto out_put;
> - }
> - } else {
> + switch (compute) {
> + case COMPUTE_CYCLES:
> if (!hists__add_entry_ops(hists, &block_hist_ops, &al, NULL,
> NULL, NULL, sample, true)) {
> pr_warning("problem incrementing symbol period, "
> @@ -428,6 +432,23 @@ static int diff__process_sample_event(struct perf_tool *tool,
>
> hist__account_cycles(sample->branch_stack, &al, sample, false,
> NULL);
> + break;
> +
> + case COMPUTE_STREAM:
> + if (hist_entry_iter__add(&iter, &al, PERF_MAX_STACK_DEPTH,
> + NULL)) {
> + pr_debug("problem adding hist entry, skipping event\n");
> + goto out_put;
> + }
> + break;
> +
> + default:
> + if (!hists__add_entry(hists, &al, NULL, NULL, NULL, sample,
> + true)) {
> + pr_warning("problem incrementing symbol period, "
> + "skipping event\n");
> + goto out_put;
> + }
> }
>
> /*
> @@ -996,6 +1017,50 @@ static void data_process(void)
> }
> }
>
> +static int process_base_stream(struct data__file *data_base,
> + struct data__file *data_pair,
> + const char *title __maybe_unused)
> +{
> + struct evlist *evlist_base = data_base->session->evlist;
> + struct evlist *evlist_pair = data_pair->session->evlist;
> + struct evsel *evsel_base, *evsel_pair;
> + struct evsel_streams *es_base, *es_pair;
> +
> + evlist__for_each_entry(evlist_base, evsel_base) {
> + evsel_pair = evsel_match(evsel_base, evlist_pair);
> + if (!evsel_pair)
> + continue;
> +
> + es_base = evsel_streams_get(data_base->evsel_streams,
> + data_base->nr_evsel_streams,
> + evsel_base->idx);
> + if (!es_base)
> + return -1;
> +
> + es_pair = evsel_streams_get(data_pair->evsel_streams,
> + data_pair->nr_evsel_streams,
> + evsel_pair->idx);
> + if (!es_pair)
> + return -1;
> +
> + match_evsel_streams(es_base, es_pair);
> + evsel_streams_report(es_base, es_pair);
> + }
> +
> + return 0;
> +}
> +
> +static void stream_process(void)
> +{
> + /*
> + * Stream comparison only supports two data files.
> + * perf.data.old and perf.data. data__files[0] is perf.data.old,
> + * data__files[1] is perf.data.
> + */
> + process_base_stream(&data__files[0], &data__files[1],
> + "# Output based on old perf data:\n#\n");
> +}
> +
> static void data__free(struct data__file *d)
> {
> int col;
> @@ -1109,6 +1174,18 @@ static int check_file_brstack(void)
> return 0;
> }
>
> +static struct evsel_streams *create_evsel_streams(struct evlist *evlist,
> + int nr_streams_max,
> + int *nr_evsel_streams)
> +{
> + struct evsel_streams *es;
> +
> + es = perf_evlist__create_streams(evlist, nr_streams_max);
> + *nr_evsel_streams = evlist->core.nr_entries;
> +
> + return es;
> +}
> +
> static int __cmd_diff(void)
> {
> struct data__file *d;
> @@ -1153,9 +1230,21 @@ static int __cmd_diff(void)
>
> if (pdiff.ptime_range)
> zfree(&pdiff.ptime_range);
> +
> + if (compute == COMPUTE_STREAM) {
> + d->evsel_streams = create_evsel_streams(
> + d->session->evlist,
> + 5,
> + &d->nr_evsel_streams);
> + if (!d->evsel_streams)
> + goto out_delete;
> + }
> }
>
> - data_process();
> + if (compute == COMPUTE_STREAM)
> + stream_process();
> + else
> + data_process();
>
> out_delete:
> data__for_each_file(i, d) {
> @@ -1228,6 +1317,8 @@ static const struct option options[] = {
> "only consider symbols in these pids"),
> OPT_STRING(0, "tid", &symbol_conf.tid_list_str, "tid[,tid...]",
> "only consider symbols in these tids"),
> + OPT_BOOLEAN(0, "stream", &pdiff.stream,
> + "Enable hot streams comparison."),
> OPT_END()
> };
>
> @@ -1887,6 +1978,9 @@ int cmd_diff(int argc, const char **argv)
> if (cycles_hist && (compute != COMPUTE_CYCLES))
> usage_with_options(diff_usage, options);
>
> + if (pdiff.stream)
> + compute = COMPUTE_STREAM;
> +
> symbol__annotation_init();
>
> if (symbol__init(NULL) < 0)
> @@ -1898,13 +1992,26 @@ int cmd_diff(int argc, const char **argv)
> if (check_file_brstack() < 0)
> return -1;
>
> - if (compute == COMPUTE_CYCLES && !pdiff.has_br_stack)
> + if ((compute == COMPUTE_CYCLES || compute == COMPUTE_STREAM)
> + && !pdiff.has_br_stack) {
> return -1;
> + }
>
> - if (ui_init() < 0)
> - return -1;
> + if (compute == COMPUTE_STREAM) {
> + symbol_conf.show_branchflag_count = true;
> + symbol_conf.disable_add2line_warn = true;
> + callchain_param.mode = CHAIN_FLAT;
> + callchain_param.key = CCKEY_SRCLINE;
> + callchain_param.branch_callstack = 1;
> + symbol_conf.use_callchain = true;
> + callchain_register_param(&callchain_param);
> + sort_order = "srcline,symbol,dso";
> + } else {
> + if (ui_init() < 0)
> + return -1;
>
> - sort__mode = SORT_MODE__DIFF;
> + sort__mode = SORT_MODE__DIFF;
> + }
>
> if (setup_sorting(NULL) < 0)
> usage_with_options(diff_usage, options);
> --
> 2.17.1
>

--

- Arnaldo