On a hybrid platform, atom events can only be enabled on atom CPUs and
core events can only be enabled on core CPUs. In other words, a hybrid
event can only be enabled on its own CPUs.

But the problem with current perf is that the cpus for each evsel (read
from PMU sysfs) have been merged into evsel_list->core.all_cpus, which
may end up covering all CPUs.

So we need a way to let a hybrid event use only its own CPUs.
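
For context, the merge happens when libperf propagates each evsel's cpu
map into the evlist. Simplified from the map propagation in
tools/lib/perf/evlist.c, the relevant step looks roughly like:

static void __perf_evlist__propagate_maps(struct perf_evlist *evlist,
                                          struct perf_evsel *evsel)
{
        ...
        /* Fold the evsel's own cpu map into the evlist-wide map. */
        evlist->all_cpus = perf_cpu_map__merge(evlist->all_cpus, evsel->cpus);
}

So once a cpu_core event and a cpu_atom event sit in the same evlist,
all_cpus covers both CPU types.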

The idea is to create a new helper, evlist__invalidate_all_cpus(), to
invalidate evsel_list->core.all_cpus so that evlist__for_each_cpu()
returns cpu -1 for hybrid evsels. When cpu is -1, a hybrid evsel falls
back to its own cpus.
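
The helper, added below in util/evlist.c, boils down to swapping the
merged map for a single "any CPU" entry; perf_cpu_map__empty_new() fills
each entry with -1, so the outer per-cpu loop runs exactly once with
cpu == -1:

void evlist__invalidate_all_cpus(struct evlist *evlist)
{
        /* Drop the merged all-CPUs map... */
        perf_cpu_map__put(evlist->core.all_cpus);
        /* ...and replace it with a 1-entry map whose only value is -1. */
        evlist->core.all_cpus = perf_cpu_map__empty_new(1);
}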

We will see the following code piece in the patch:

if (cpu == -1 && !evlist->thread_mode)
        evsel__enable_cpus(pos);

It lets the event be enabled on the event's own cpus.
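
Here evsel__enable_cpus(), also added below, walks the evsel's own cpu
map and enables the event on each CPU in it:

static void evsel__enable_cpus(struct evsel *evsel)
{
        int cpu, nr_cpus;
        struct perf_cpu_map *cpus = evsel__cpus(evsel);

        /* Treat a missing cpu map as a single dummy entry. */
        nr_cpus = cpus ? cpus->nr : 1;
        for (cpu = 0; cpu < nr_cpus; cpu++)
                evsel__enable_cpu(evsel, cpu);
}

The disable, read and close paths grow matching per-evsel helpers.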

Signed-off-by: Jin Yao <yao....@linux.intel.com>
---
 tools/perf/builtin-stat.c          | 37 ++++++++++++++-
 tools/perf/util/evlist.c           | 72 ++++++++++++++++++++++++++++--
 tools/perf/util/evlist.h           |  4 ++
 tools/perf/util/evsel.h            |  8 ++++
 tools/perf/util/python-ext-sources |  2 +
 5 files changed, 117 insertions(+), 6 deletions(-)

diff --git a/tools/perf/builtin-stat.c b/tools/perf/builtin-stat.c
index 2e2e4a8345ea..68ecf68699a9 100644
--- a/tools/perf/builtin-stat.c
+++ b/tools/perf/builtin-stat.c
@@ -393,6 +393,18 @@ static int read_counter_cpu(struct evsel *counter, struct timespec *rs, int cpu)
        return 0;
 }
 
+static int read_counter_cpus(struct evsel *counter, struct timespec *rs)
+{
+       int cpu, nr_cpus, err = 0;
+       struct perf_cpu_map *cpus = evsel__cpus(counter);
+
+       nr_cpus = cpus ? cpus->nr : 1;
+       for (cpu = 0; cpu < nr_cpus; cpu++)
+               err = read_counter_cpu(counter, rs, cpu);
+
+       return err;
+}
+
 static int read_affinity_counters(struct timespec *rs)
 {
        struct evsel *counter;
@@ -414,8 +426,14 @@ static int read_affinity_counters(struct timespec *rs)
                        if (evsel__cpu_iter_skip(counter, cpu))
                                continue;
                        if (!counter->err) {
-                               counter->err = read_counter_cpu(counter, rs,
-                                                               counter->cpu_iter - 1);
+                               if (cpu == -1 && !evsel_list->thread_mode) {
+                                       counter->err = read_counter_cpus(counter, rs);
+                               } else if (evsel_list->thread_mode) {
+                                       counter->err = read_counter_cpu(counter, rs, 0);
+                               } else {
+                                       counter->err = read_counter_cpu(counter, rs,
+                                                                       counter->cpu_iter - 1);
+                               }
                        }
                }
        }
@@ -781,6 +799,21 @@ static int __run_perf_stat(int argc, const char **argv, int run_idx)
        if (group)
                evlist__set_leader(evsel_list);
 
+       /*
+        * On a hybrid platform, the cpus for each evsel (via PMU sysfs) have
+        * been merged into evsel_list->core.all_cpus. Use
+        * evlist__invalidate_all_cpus() to invalidate it, so that
+        * evlist__for_each_cpu() returns cpu -1 for hybrid evsels; when cpu
+        * is -1, a hybrid evsel falls back to its own cpus.
+        */
+       if (evlist__has_hybrid_events(evsel_list)) {
+               evlist__invalidate_all_cpus(evsel_list);
+               if (!target__has_cpu(&target) ||
+                   target__has_per_thread(&target)) {
+                       evsel_list->thread_mode = true;
+               }
+       }
+
        if (affinity__setup(&affinity) < 0)
                return -1;
 
diff --git a/tools/perf/util/evlist.c b/tools/perf/util/evlist.c
index 882cd1f721d9..3ee12fcd0c9f 100644
--- a/tools/perf/util/evlist.c
+++ b/tools/perf/util/evlist.c
@@ -381,7 +381,8 @@ bool evsel__cpu_iter_skip_no_inc(struct evsel *ev, int cpu)
 bool evsel__cpu_iter_skip(struct evsel *ev, int cpu)
 {
        if (!evsel__cpu_iter_skip_no_inc(ev, cpu)) {
-               ev->cpu_iter++;
+               if (cpu != -1)
+                       ev->cpu_iter++;
                return false;
        }
        return true;
@@ -410,6 +411,16 @@ static int evlist__is_enabled(struct evlist *evlist)
        return false;
 }
 
+static void evsel__disable_cpus(struct evsel *evsel)
+{
+       int cpu, nr_cpus;
+       struct perf_cpu_map *cpus = evsel__cpus(evsel);
+
+       nr_cpus = cpus ? cpus->nr : 1;
+       for (cpu = 0; cpu < nr_cpus; cpu++)
+               evsel__disable_cpu(evsel, cpu);
+}
+
 static void __evlist__disable(struct evlist *evlist, char *evsel_name)
 {
        struct evsel *pos;
@@ -436,7 +447,12 @@ static void __evlist__disable(struct evlist *evlist, char *evsel_name)
                                        has_imm = true;
                                if (pos->immediate != imm)
                                        continue;
-                               evsel__disable_cpu(pos, pos->cpu_iter - 1);
+                               if (cpu == -1 && !evlist->thread_mode)
+                                       evsel__disable_cpus(pos);
+                               else if (evlist->thread_mode)
+                                       evsel__disable_cpu(pos, 0);
+                               else
+                                       evsel__disable_cpu(pos, pos->cpu_iter - 1);
                        }
                }
                if (!has_imm)
@@ -472,6 +488,15 @@ void evlist__disable_evsel(struct evlist *evlist, char *evsel_name)
        __evlist__disable(evlist, evsel_name);
 }
 
+static void evsel__enable_cpus(struct evsel *evsel)
+{
+       int cpu, nr_cpus;
+       struct perf_cpu_map *cpus = evsel__cpus(evsel);
+
+       nr_cpus = cpus ? cpus->nr : 1;
+       for (cpu = 0; cpu < nr_cpus; cpu++)
+               evsel__enable_cpu(evsel, cpu);
+}
 static void __evlist__enable(struct evlist *evlist, char *evsel_name)
 {
        struct evsel *pos;
@@ -491,7 +516,12 @@ static void __evlist__enable(struct evlist *evlist, char *evsel_name)
                                continue;
                        if (!evsel__is_group_leader(pos) || !pos->core.fd)
                                continue;
-                       evsel__enable_cpu(pos, pos->cpu_iter - 1);
+                       if (cpu == -1 && !evlist->thread_mode)
+                               evsel__enable_cpus(pos);
+                       else if (evlist->thread_mode)
+                               evsel__enable_cpu(pos, 0);
+                       else
+                               evsel__enable_cpu(pos, pos->cpu_iter - 1);
                }
        }
        affinity__cleanup(&affinity);
@@ -1274,6 +1304,16 @@ void evlist__set_selected(struct evlist *evlist, struct evsel *evsel)
        evlist->selected = evsel;
 }
 
+static void evsel__close_cpus(struct evsel *evsel)
+{
+       int cpu, nr_cpus;
+       struct perf_cpu_map *cpus = evsel__cpus(evsel);
+
+       nr_cpus = cpus ? cpus->nr : 1;
+       for (cpu = 0; cpu < nr_cpus; cpu++)
+               perf_evsel__close_cpu(&evsel->core, cpu);
+}
+
 void evlist__close(struct evlist *evlist)
 {
        struct evsel *evsel;
@@ -1298,7 +1338,13 @@ void evlist__close(struct evlist *evlist)
                evlist__for_each_entry_reverse(evlist, evsel) {
                        if (evsel__cpu_iter_skip(evsel, cpu))
                            continue;
-                       perf_evsel__close_cpu(&evsel->core, evsel->cpu_iter - 1);
+
+                       if (cpu == -1 && !evlist->thread_mode)
+                               evsel__close_cpus(evsel);
+                       else if (evlist->thread_mode)
+                               perf_evsel__close_cpu(&evsel->core, 0);
+                       else
+                               perf_evsel__close_cpu(&evsel->core, evsel->cpu_iter - 1);
                }
        }
        affinity__cleanup(&affinity);
@@ -2130,3 +2176,21 @@ struct evsel *evlist__find_evsel(struct evlist *evlist, int idx)
        }
        return NULL;
 }
+
+bool evlist__has_hybrid_events(struct evlist *evlist)
+{
+       struct evsel *evsel;
+
+       evlist__for_each_entry(evlist, evsel) {
+               if (evsel__is_hybrid_event(evsel))
+                       return true;
+       }
+
+       return false;
+}
+
+void evlist__invalidate_all_cpus(struct evlist *evlist)
+{
+       perf_cpu_map__put(evlist->core.all_cpus);
+       evlist->core.all_cpus = perf_cpu_map__empty_new(1);
+}
diff --git a/tools/perf/util/evlist.h b/tools/perf/util/evlist.h
index b695ffaae519..0da683511d98 100644
--- a/tools/perf/util/evlist.h
+++ b/tools/perf/util/evlist.h
@@ -52,6 +52,7 @@ struct evlist {
        struct perf_evlist core;
        int              nr_groups;
        bool             enabled;
+       bool             thread_mode;
        int              id_pos;
        int              is_pos;
        u64              combined_sample_type;
@@ -365,4 +366,7 @@ int evlist__ctlfd_ack(struct evlist *evlist);
 #define EVLIST_DISABLED_MSG "Events disabled\n"
 
 struct evsel *evlist__find_evsel(struct evlist *evlist, int idx);
+void evlist__invalidate_all_cpus(struct evlist *evlist);
+
+bool evlist__has_hybrid_events(struct evlist *evlist);
 #endif /* __PERF_EVLIST_H */
diff --git a/tools/perf/util/evsel.h b/tools/perf/util/evsel.h
index 6026487353dd..69aadc52c1bd 100644
--- a/tools/perf/util/evsel.h
+++ b/tools/perf/util/evsel.h
@@ -7,9 +7,11 @@
 #include <sys/types.h>
 #include <linux/perf_event.h>
 #include <linux/types.h>
+#include <string.h>
 #include <internal/evsel.h>
 #include <perf/evsel.h>
 #include "symbol_conf.h"
+#include "pmu-hybrid.h"
 #include <internal/cpumap.h>
 
 struct bpf_object;
@@ -435,4 +437,10 @@ struct perf_env *evsel__env(struct evsel *evsel);
 int evsel__store_ids(struct evsel *evsel, struct evlist *evlist);
 
 void evsel__zero_per_pkg(struct evsel *evsel);
+
+static inline bool evsel__is_hybrid_event(struct evsel *evsel)
+{
+       return evsel->pmu_name && perf_pmu__is_hybrid(evsel->pmu_name);
+}
+
 #endif /* __PERF_EVSEL_H */
diff --git a/tools/perf/util/python-ext-sources b/tools/perf/util/python-ext-sources
index 845dd46e3c61..d7c976671e3a 100644
--- a/tools/perf/util/python-ext-sources
+++ b/tools/perf/util/python-ext-sources
@@ -37,3 +37,5 @@ util/units.c
 util/affinity.c
 util/rwsem.c
 util/hashmap.c
+util/pmu-hybrid.c
+util/fncache.c
-- 
2.17.1
