Both cpu__max_cpu and env.nr_cpus_online are dynamic alternatives for
MAX_NR_CPUS, a macro currently used throughout perf. The function cpu__max_cpu
returns the possible number of CPUS as defined in the sysfs, whereas
env.nr_cpus_online is the number of CPUs that were online during the recording
session. MAX_NR_CPUS is still used by DECLARE_BITMAP at compile time, however,
it's replaced elsewhere.

This patch was tested using "perf record -a -g" on both an eight socket 288 CPU
system and a single socket 36 CPU system. Each system was then rebooted single
socket and eight socket before "perf report" was used to read the perf.data out
file. "perf report --header" was used to confirm that each perf.data file had
information on the correct number of CPUs.

Cc: Peter Zijlstra <pet...@infradead.org>
Cc: Ingo Molnar <mi...@redhat.com>
Cc: Arnaldo Carvalho de Melo <a...@kernel.org>
Cc: Alexander Shishkin <alexander.shish...@linux.intel.com>
Cc: Jiri Olsa <jo...@redhat.com>
Cc: Namhyung Kim <namhy...@kernel.org>
Cc: linux-kernel@vger.kernel.org
Cc: Russ Anderson <russ.ander...@hpe.com>
Signed-off-by: Kyle Meyer <kyle.me...@hpe.com>
---
 tools/perf/util/header.c    |  6 +++---
 tools/perf/util/machine.c   | 11 ++++++-----
 tools/perf/util/session.c   |  6 +++---
 tools/perf/util/stat.c      |  4 ++--
 tools/perf/util/svghelper.c | 31 +++++++++++++++----------------
 5 files changed, 29 insertions(+), 29 deletions(-)

diff --git a/tools/perf/util/header.c b/tools/perf/util/header.c
index b04c2b6b28b3..cf8ce839cb47 100644
--- a/tools/perf/util/header.c
+++ b/tools/perf/util/header.c
@@ -1121,16 +1121,16 @@ static int build_caches(struct cpu_cache_level 
caches[], u32 size, u32 *cntp)
        return 0;
 }
 
-#define MAX_CACHES (MAX_NR_CPUS * 4)
+#define MAX_CACHE_LVL 4
 
 static int write_cache(struct feat_fd *ff,
                       struct evlist *evlist __maybe_unused)
 {
-       struct cpu_cache_level caches[MAX_CACHES];
+       struct cpu_cache_level caches[(cpu__max_cpu() * MAX_CACHE_LVL)];
        u32 cnt = 0, i, version = 1;
        int ret;
 
-       ret = build_caches(caches, MAX_CACHES, &cnt);
+       ret = build_caches(caches, (cpu__max_cpu() * MAX_CACHE_LVL), &cnt);
        if (ret)
                goto out;
 
diff --git a/tools/perf/util/machine.c b/tools/perf/util/machine.c
index 5734460fc89e..cf5f4b4eeea0 100644
--- a/tools/perf/util/machine.c
+++ b/tools/perf/util/machine.c
@@ -2616,7 +2616,8 @@ int __machine__synthesize_threads(struct machine 
*machine, struct perf_tool *too
 
 pid_t machine__get_current_tid(struct machine *machine, int cpu)
 {
-       if (cpu < 0 || cpu >= MAX_NR_CPUS || !machine->current_tid)
+       int nr_cpus_online = machine->env->nr_cpus_online;
+       if (cpu < 0 || cpu >= nr_cpus_online || !machine->current_tid)
                return -1;
 
        return machine->current_tid[cpu];
@@ -2626,6 +2627,7 @@ int machine__set_current_tid(struct machine *machine, int 
cpu, pid_t pid,
                             pid_t tid)
 {
        struct thread *thread;
+       int nr_cpus_online = machine->env->nr_cpus_online;
 
        if (cpu < 0)
                return -EINVAL;
@@ -2633,16 +2635,15 @@ int machine__set_current_tid(struct machine *machine, 
int cpu, pid_t pid,
        if (!machine->current_tid) {
                int i;
 
-               machine->current_tid = calloc(MAX_NR_CPUS, sizeof(pid_t));
+               machine->current_tid = calloc(nr_cpus_online, sizeof(pid_t));
                if (!machine->current_tid)
                        return -ENOMEM;
-               for (i = 0; i < MAX_NR_CPUS; i++)
+               for (i = 0; i < nr_cpus_online; i++)
                        machine->current_tid[i] = -1;
        }
 
-       if (cpu >= MAX_NR_CPUS) {
+       if (cpu >= nr_cpus_online) {
                pr_err("Requested CPU %d too large. ", cpu);
-               pr_err("Consider raising MAX_NR_CPUS\n");
                return -EINVAL;
        }
 
diff --git a/tools/perf/util/session.c b/tools/perf/util/session.c
index 11e6093c941b..a9d244a94e24 100644
--- a/tools/perf/util/session.c
+++ b/tools/perf/util/session.c
@@ -2275,6 +2275,7 @@ int perf_session__cpu_bitmap(struct perf_session *session,
 {
        int i, err = -1;
        struct perf_cpu_map *map;
+       int nr_cpus_online = session->header.env.nr_cpus_online;
 
        for (i = 0; i < PERF_TYPE_MAX; ++i) {
                struct evsel *evsel;
@@ -2299,9 +2300,8 @@ int perf_session__cpu_bitmap(struct perf_session *session,
        for (i = 0; i < map->nr; i++) {
                int cpu = map->map[i];
 
-               if (cpu >= MAX_NR_CPUS) {
-                       pr_err("Requested CPU %d too large. "
-                              "Consider raising MAX_NR_CPUS\n", cpu);
+               if (cpu >= nr_cpus_online) {
+                       pr_err("Requested CPU %d too large\n", cpu);
                        goto out_delete_map;
                }
 
diff --git a/tools/perf/util/stat.c b/tools/perf/util/stat.c
index e4e4e3bf8b2b..199008ce936d 100644
--- a/tools/perf/util/stat.c
+++ b/tools/perf/util/stat.c
@@ -208,7 +208,7 @@ void perf_evlist__reset_stats(struct evlist *evlist)
 static void zero_per_pkg(struct evsel *counter)
 {
        if (counter->per_pkg_mask)
-               memset(counter->per_pkg_mask, 0, MAX_NR_CPUS);
+               memset(counter->per_pkg_mask, 0, cpu__max_cpu());
 }
 
 static int check_per_pkg(struct evsel *counter,
@@ -227,7 +227,7 @@ static int check_per_pkg(struct evsel *counter,
                return 0;
 
        if (!mask) {
-               mask = zalloc(MAX_NR_CPUS);
+               mask = zalloc(cpu__max_cpu());
                if (!mask)
                        return -ENOMEM;
 
diff --git a/tools/perf/util/svghelper.c b/tools/perf/util/svghelper.c
index 1beeb7291361..6e8433e97f21 100644
--- a/tools/perf/util/svghelper.c
+++ b/tools/perf/util/svghelper.c
@@ -695,7 +695,8 @@ struct topology {
        int sib_thr_nr;
 };
 
-static void scan_thread_topology(int *map, struct topology *t, int cpu, int 
*pos)
+static void scan_thread_topology(int *map, struct topology *t, int cpu,
+int *pos, int max_cpus)
 {
        int i;
        int thr;
@@ -704,28 +705,24 @@ static void scan_thread_topology(int *map, struct 
topology *t, int cpu, int *pos
                if (!test_bit(cpu, cpumask_bits(&t->sib_thr[i])))
                        continue;
 
-               for_each_set_bit(thr,
-                                cpumask_bits(&t->sib_thr[i]),
-                                MAX_NR_CPUS)
+               for_each_set_bit(thr, cpumask_bits(&t->sib_thr[i]), max_cpus)
                        if (map[thr] == -1)
                                map[thr] = (*pos)++;
        }
 }
 
-static void scan_core_topology(int *map, struct topology *t)
+static void scan_core_topology(int *map, struct topology *t, int max_cpus)
 {
        int pos = 0;
        int i;
        int cpu;
 
        for (i = 0; i < t->sib_core_nr; i++)
-               for_each_set_bit(cpu,
-                                cpumask_bits(&t->sib_core[i]),
-                                MAX_NR_CPUS)
-                       scan_thread_topology(map, t, cpu, &pos);
+               for_each_set_bit(cpu, cpumask_bits(&t->sib_core[i]), max_cpus)
+                       scan_thread_topology(map, t, cpu, &pos, max_cpus);
 }
 
-static int str_to_bitmap(char *s, cpumask_t *b)
+static int str_to_bitmap(char *s, cpumask_t *b, int max_cpus)
 {
        int i;
        int ret = 0;
@@ -738,7 +735,7 @@ static int str_to_bitmap(char *s, cpumask_t *b)
 
        for (i = 0; i < m->nr; i++) {
                c = m->map[i];
-               if (c >= MAX_NR_CPUS) {
+               if (c >= max_cpus) {
                        ret = -1;
                        break;
                }
@@ -767,7 +764,8 @@ int svg_build_topology_map(struct perf_env *env)
        }
 
        for (i = 0; i < env->nr_sibling_cores; i++) {
-               if (str_to_bitmap(env->sibling_cores, &t.sib_core[i])) {
+               if (str_to_bitmap(env->sibling_cores, &t.sib_core[i],
+                       env->nr_cpus_online)) {
                        fprintf(stderr, "topology: can't parse siblings map\n");
                        goto exit;
                }
@@ -776,7 +774,8 @@ int svg_build_topology_map(struct perf_env *env)
        }
 
        for (i = 0; i < env->nr_sibling_threads; i++) {
-               if (str_to_bitmap(env->sibling_threads, &t.sib_thr[i])) {
+               if (str_to_bitmap(env->sibling_threads, &t.sib_thr[i],
+                       env->nr_cpus_online)) {
                        fprintf(stderr, "topology: can't parse siblings map\n");
                        goto exit;
                }
@@ -784,16 +783,16 @@ int svg_build_topology_map(struct perf_env *env)
                env->sibling_threads += strlen(env->sibling_threads) + 1;
        }
 
-       topology_map = malloc(sizeof(int) * MAX_NR_CPUS);
+       topology_map = malloc(sizeof(int) * env->nr_cpus_online);
        if (!topology_map) {
                fprintf(stderr, "topology: no memory\n");
                goto exit;
        }
 
-       for (i = 0; i < MAX_NR_CPUS; i++)
+       for (i = 0; i < env->nr_cpus_online; i++)
                topology_map[i] = -1;
 
-       scan_core_topology(topology_map, &t);
+       scan_core_topology(topology_map, &t, env->nr_cpus_online);
 
        return 0;
 
-- 
2.12.3

Reply via email to