www.infradead.org Git - users/hch/dma-mapping.git/commitdiff
perf stat: Display percore events properly
author: Namhyung Kim <namhyung@kernel.org>
Tue, 18 Oct 2022 02:02:26 +0000 (19:02 -0700)
committer: Arnaldo Carvalho de Melo <acme@redhat.com>
Thu, 27 Oct 2022 19:37:25 +0000 (16:37 -0300)
The recent change in perf stat broke the percore event display.
Note that the aggr counts are already processed, so every
sibling thread in the same core gets the per-core counter values.

Check percore evsels and skip the sibling threads in the display.

Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Acked-by: Ian Rogers <irogers@google.com>
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: Andi Kleen <ak@linux.intel.com>
Cc: Athira Jajeev <atrajeev@linux.vnet.ibm.com>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: James Clark <james.clark@arm.com>
Cc: Jiri Olsa <jolsa@kernel.org>
Cc: Kan Liang <kan.liang@linux.intel.com>
Cc: Leo Yan <leo.yan@linaro.org>
Cc: Michael Petlan <mpetlan@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Xing Zhengjun <zhengjun.xing@linux.intel.com>
Link: https://lore.kernel.org/r/20221018020227.85905-20-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
tools/perf/builtin-stat.c
tools/perf/util/stat-display.c

index d7c52cef70a3a020b66e9a797dab098f5196485b..9d35a33389766a99d8d22b0cde5fdc20b4253464 100644 (file)
@@ -1404,18 +1404,6 @@ static struct aggr_cpu_id perf_stat__get_cpu_cached(struct perf_stat_config *con
        return perf_stat__get_aggr(config, perf_stat__get_cpu, cpu);
 }
 
-static bool term_percore_set(void)
-{
-       struct evsel *counter;
-
-       evlist__for_each_entry(evsel_list, counter) {
-               if (counter->percore)
-                       return true;
-       }
-
-       return false;
-}
-
 static aggr_cpu_id_get_t aggr_mode__get_aggr(enum aggr_mode aggr_mode)
 {
        switch (aggr_mode) {
@@ -1428,8 +1416,6 @@ static aggr_cpu_id_get_t aggr_mode__get_aggr(enum aggr_mode aggr_mode)
        case AGGR_NODE:
                return aggr_cpu_id__node;
        case AGGR_NONE:
-               if (term_percore_set())
-                       return aggr_cpu_id__core;
                return aggr_cpu_id__cpu;
        case AGGR_GLOBAL:
                return aggr_cpu_id__global;
@@ -1453,8 +1439,6 @@ static aggr_get_id_t aggr_mode__get_id(enum aggr_mode aggr_mode)
        case AGGR_NODE:
                return perf_stat__get_node_cached;
        case AGGR_NONE:
-               if (term_percore_set())
-                       return perf_stat__get_core_cached;
                return perf_stat__get_cpu_cached;
        case AGGR_GLOBAL:
                return perf_stat__get_global_cached;
index bfae2784609c83041d5217c7e42a08cc5166cf84..657434cd29eea9f84b6bcae0a730e4eca66d7680 100644 (file)
@@ -1091,7 +1091,8 @@ static void print_percore(struct perf_stat_config *config,
 {
        bool metric_only = config->metric_only;
        FILE *output = config->output;
-       int s;
+       struct cpu_aggr_map *core_map;
+       int s, c, i;
        bool first = true;
 
        if (!config->aggr_map || !config->aggr_get_id)
@@ -1100,13 +1101,35 @@ static void print_percore(struct perf_stat_config *config,
        if (config->percore_show_thread)
                return print_counter(config, counter, prefix);
 
-       for (s = 0; s < config->aggr_map->nr; s++) {
+       core_map = cpu_aggr_map__empty_new(config->aggr_map->nr);
+       if (core_map == NULL) {
+               fprintf(output, "Cannot allocate per-core aggr map for display\n");
+               return;
+       }
+
+       for (s = 0, c = 0; s < config->aggr_map->nr; s++) {
+               struct perf_cpu curr_cpu = config->aggr_map->map[s].cpu;
+               struct aggr_cpu_id core_id = aggr_cpu_id__core(curr_cpu, NULL);
+               bool found = false;
+
+               for (i = 0; i < c; i++) {
+                       if (aggr_cpu_id__equal(&core_map->map[i], &core_id)) {
+                               found = true;
+                               break;
+                       }
+               }
+               if (found)
+                       continue;
+
                if (prefix && metric_only)
                        fprintf(output, "%s", prefix);
 
                print_counter_aggrdata(config, counter, s,
                                       prefix, metric_only, &first);
+
+               core_map->map[c++] = core_id;
        }
+       free(core_map);
 
        if (metric_only)
                fputc('\n', output);