Merge tag 'trace-printf-v6.13' of git://git.kernel.org/pub/scm/linux/kernel/git/trace...
[drm/drm-misc.git] / tools / perf / util / cputopo.c
blob8bbeb2dc76fda994b7f83abd227aceaed6e78c55
1 // SPDX-License-Identifier: GPL-2.0
2 #include <sys/param.h>
3 #include <sys/utsname.h>
4 #include <inttypes.h>
5 #include <stdlib.h>
6 #include <string.h>
7 #include <api/fs/fs.h>
8 #include <linux/zalloc.h>
9 #include <perf/cpumap.h>
11 #include "cputopo.h"
12 #include "cpumap.h"
13 #include "debug.h"
14 #include "env.h"
15 #include "pmu.h"
16 #include "pmus.h"
/*
 * sysfs path templates.  Every template takes the sysfs mount point (%s);
 * the per-CPU and per-node templates also take a CPU or node number (%d).
 */

/* Per-CPU topology files; the *_OLD names are tried when the newer file is absent. */
#define PACKAGE_CPUS_FMT	"%s/devices/system/cpu/cpu%d/topology/package_cpus_list"
#define PACKAGE_CPUS_FMT_OLD	"%s/devices/system/cpu/cpu%d/topology/core_siblings_list"
#define DIE_CPUS_FMT		"%s/devices/system/cpu/cpu%d/topology/die_cpus_list"
#define CORE_CPUS_FMT		"%s/devices/system/cpu/cpu%d/topology/core_cpus_list"
#define CORE_CPUS_FMT_OLD	"%s/devices/system/cpu/cpu%d/topology/thread_siblings_list"

/* NUMA node files. */
#define NODE_ONLINE_FMT		"%s/devices/system/node/online"
#define NODE_MEMINFO_FMT	"%s/devices/system/node/node%d/meminfo"
#define NODE_CPULIST_FMT	"%s/devices/system/node/node%d/cpulist"
35 static int build_cpu_topology(struct cpu_topology *tp, int cpu)
37 FILE *fp;
38 char filename[MAXPATHLEN];
39 char *buf = NULL, *p;
40 size_t len = 0;
41 ssize_t sret;
42 u32 i = 0;
43 int ret = -1;
45 scnprintf(filename, MAXPATHLEN, PACKAGE_CPUS_FMT,
46 sysfs__mountpoint(), cpu);
47 if (access(filename, F_OK) == -1) {
48 scnprintf(filename, MAXPATHLEN, PACKAGE_CPUS_FMT_OLD,
49 sysfs__mountpoint(), cpu);
51 fp = fopen(filename, "r");
52 if (!fp)
53 goto try_dies;
55 sret = getline(&buf, &len, fp);
56 fclose(fp);
57 if (sret <= 0)
58 goto try_dies;
60 p = strchr(buf, '\n');
61 if (p)
62 *p = '\0';
64 for (i = 0; i < tp->package_cpus_lists; i++) {
65 if (!strcmp(buf, tp->package_cpus_list[i]))
66 break;
68 if (i == tp->package_cpus_lists) {
69 tp->package_cpus_list[i] = buf;
70 tp->package_cpus_lists++;
71 buf = NULL;
72 len = 0;
74 ret = 0;
76 try_dies:
77 if (!tp->die_cpus_list)
78 goto try_threads;
80 scnprintf(filename, MAXPATHLEN, DIE_CPUS_FMT,
81 sysfs__mountpoint(), cpu);
82 fp = fopen(filename, "r");
83 if (!fp)
84 goto try_threads;
86 sret = getline(&buf, &len, fp);
87 fclose(fp);
88 if (sret <= 0)
89 goto try_threads;
91 p = strchr(buf, '\n');
92 if (p)
93 *p = '\0';
95 for (i = 0; i < tp->die_cpus_lists; i++) {
96 if (!strcmp(buf, tp->die_cpus_list[i]))
97 break;
99 if (i == tp->die_cpus_lists) {
100 tp->die_cpus_list[i] = buf;
101 tp->die_cpus_lists++;
102 buf = NULL;
103 len = 0;
105 ret = 0;
107 try_threads:
108 scnprintf(filename, MAXPATHLEN, CORE_CPUS_FMT,
109 sysfs__mountpoint(), cpu);
110 if (access(filename, F_OK) == -1) {
111 scnprintf(filename, MAXPATHLEN, CORE_CPUS_FMT_OLD,
112 sysfs__mountpoint(), cpu);
114 fp = fopen(filename, "r");
115 if (!fp)
116 goto done;
118 if (getline(&buf, &len, fp) <= 0)
119 goto done;
121 p = strchr(buf, '\n');
122 if (p)
123 *p = '\0';
125 for (i = 0; i < tp->core_cpus_lists; i++) {
126 if (!strcmp(buf, tp->core_cpus_list[i]))
127 break;
129 if (i == tp->core_cpus_lists) {
130 tp->core_cpus_list[i] = buf;
131 tp->core_cpus_lists++;
132 buf = NULL;
134 ret = 0;
135 done:
136 if (fp)
137 fclose(fp);
138 free(buf);
139 return ret;
142 void cpu_topology__delete(struct cpu_topology *tp)
144 u32 i;
146 if (!tp)
147 return;
149 for (i = 0 ; i < tp->package_cpus_lists; i++)
150 zfree(&tp->package_cpus_list[i]);
152 for (i = 0 ; i < tp->die_cpus_lists; i++)
153 zfree(&tp->die_cpus_list[i]);
155 for (i = 0 ; i < tp->core_cpus_lists; i++)
156 zfree(&tp->core_cpus_list[i]);
158 free(tp);
161 bool cpu_topology__smt_on(const struct cpu_topology *topology)
163 for (u32 i = 0; i < topology->core_cpus_lists; i++) {
164 const char *cpu_list = topology->core_cpus_list[i];
167 * If there is a need to separate siblings in a core then SMT is
168 * enabled.
170 if (strchr(cpu_list, ',') || strchr(cpu_list, '-'))
171 return true;
173 return false;
176 bool cpu_topology__core_wide(const struct cpu_topology *topology,
177 const char *user_requested_cpu_list)
179 struct perf_cpu_map *user_requested_cpus;
182 * If user_requested_cpu_list is empty then all CPUs are recorded and so
183 * core_wide is true.
185 if (!user_requested_cpu_list)
186 return true;
188 user_requested_cpus = perf_cpu_map__new(user_requested_cpu_list);
189 /* Check that every user requested CPU is the complete set of SMT threads on a core. */
190 for (u32 i = 0; i < topology->core_cpus_lists; i++) {
191 const char *core_cpu_list = topology->core_cpus_list[i];
192 struct perf_cpu_map *core_cpus = perf_cpu_map__new(core_cpu_list);
193 struct perf_cpu cpu;
194 int idx;
195 bool has_first, first = true;
197 perf_cpu_map__for_each_cpu(cpu, idx, core_cpus) {
198 if (first) {
199 has_first = perf_cpu_map__has(user_requested_cpus, cpu);
200 first = false;
201 } else {
203 * If the first core CPU is user requested then
204 * all subsequent CPUs in the core must be user
205 * requested too. If the first CPU isn't user
206 * requested then none of the others must be
207 * too.
209 if (perf_cpu_map__has(user_requested_cpus, cpu) != has_first) {
210 perf_cpu_map__put(core_cpus);
211 perf_cpu_map__put(user_requested_cpus);
212 return false;
216 perf_cpu_map__put(core_cpus);
218 perf_cpu_map__put(user_requested_cpus);
219 return true;
222 static bool has_die_topology(void)
224 char filename[MAXPATHLEN];
225 struct utsname uts;
227 if (uname(&uts) < 0)
228 return false;
230 if (strncmp(uts.machine, "x86_64", 6) &&
231 strncmp(uts.machine, "s390x", 5))
232 return false;
234 scnprintf(filename, MAXPATHLEN, DIE_CPUS_FMT,
235 sysfs__mountpoint(), 0);
236 if (access(filename, F_OK) == -1)
237 return false;
239 return true;
/*
 * Return the CPU topology, creating it on first use and caching it in a
 * function-local static for later calls.
 *
 * Never returns NULL: if the topology cannot be created an error is logged
 * and the process is aborted.
 */
const struct cpu_topology *online_topology(void)
{
	static const struct cpu_topology *topology;

	if (!topology) {
		topology = cpu_topology__new();
		if (!topology) {
			/* Terminate the line, as the file's other log calls do. */
			pr_err("Error creating CPU topology\n");
			abort();
		}
	}
	return topology;
}
256 struct cpu_topology *cpu_topology__new(void)
258 struct cpu_topology *tp = NULL;
259 void *addr;
260 u32 nr, i, nr_addr;
261 size_t sz;
262 long ncpus;
263 int ret = -1;
264 struct perf_cpu_map *map;
265 bool has_die = has_die_topology();
267 ncpus = cpu__max_present_cpu().cpu;
269 /* build online CPU map */
270 map = perf_cpu_map__new_online_cpus();
271 if (map == NULL) {
272 pr_debug("failed to get system cpumap\n");
273 return NULL;
276 nr = (u32)(ncpus & UINT_MAX);
278 sz = nr * sizeof(char *);
279 if (has_die)
280 nr_addr = 3;
281 else
282 nr_addr = 2;
283 addr = calloc(1, sizeof(*tp) + nr_addr * sz);
284 if (!addr)
285 goto out_free;
287 tp = addr;
288 addr += sizeof(*tp);
289 tp->package_cpus_list = addr;
290 addr += sz;
291 if (has_die) {
292 tp->die_cpus_list = addr;
293 addr += sz;
295 tp->core_cpus_list = addr;
297 for (i = 0; i < nr; i++) {
298 if (!perf_cpu_map__has(map, (struct perf_cpu){ .cpu = i }))
299 continue;
301 ret = build_cpu_topology(tp, i);
302 if (ret < 0)
303 break;
306 out_free:
307 perf_cpu_map__put(map);
308 if (ret) {
309 cpu_topology__delete(tp);
310 tp = NULL;
312 return tp;
315 static int load_numa_node(struct numa_topology_node *node, int nr)
317 char str[MAXPATHLEN];
318 char field[32];
319 char *buf = NULL, *p;
320 size_t len = 0;
321 int ret = -1;
322 FILE *fp;
323 u64 mem;
325 node->node = (u32) nr;
327 scnprintf(str, MAXPATHLEN, NODE_MEMINFO_FMT,
328 sysfs__mountpoint(), nr);
329 fp = fopen(str, "r");
330 if (!fp)
331 return -1;
333 while (getline(&buf, &len, fp) > 0) {
334 /* skip over invalid lines */
335 if (!strchr(buf, ':'))
336 continue;
337 if (sscanf(buf, "%*s %*d %31s %"PRIu64, field, &mem) != 2)
338 goto err;
339 if (!strcmp(field, "MemTotal:"))
340 node->mem_total = mem;
341 if (!strcmp(field, "MemFree:"))
342 node->mem_free = mem;
343 if (node->mem_total && node->mem_free)
344 break;
347 fclose(fp);
348 fp = NULL;
350 scnprintf(str, MAXPATHLEN, NODE_CPULIST_FMT,
351 sysfs__mountpoint(), nr);
353 fp = fopen(str, "r");
354 if (!fp)
355 return -1;
357 if (getline(&buf, &len, fp) <= 0)
358 goto err;
360 p = strchr(buf, '\n');
361 if (p)
362 *p = '\0';
364 node->cpus = buf;
365 fclose(fp);
366 return 0;
368 err:
369 free(buf);
370 if (fp)
371 fclose(fp);
372 return ret;
375 struct numa_topology *numa_topology__new(void)
377 struct perf_cpu_map *node_map = NULL;
378 struct numa_topology *tp = NULL;
379 char path[MAXPATHLEN];
380 char *buf = NULL;
381 size_t len = 0;
382 u32 nr, i;
383 FILE *fp;
384 char *c;
386 scnprintf(path, MAXPATHLEN, NODE_ONLINE_FMT,
387 sysfs__mountpoint());
389 fp = fopen(path, "r");
390 if (!fp)
391 return NULL;
393 if (getline(&buf, &len, fp) <= 0)
394 goto out;
396 c = strchr(buf, '\n');
397 if (c)
398 *c = '\0';
400 node_map = perf_cpu_map__new(buf);
401 if (!node_map)
402 goto out;
404 nr = (u32) perf_cpu_map__nr(node_map);
406 tp = zalloc(sizeof(*tp) + sizeof(tp->nodes[0])*nr);
407 if (!tp)
408 goto out;
410 tp->nr = nr;
412 for (i = 0; i < nr; i++) {
413 if (load_numa_node(&tp->nodes[i], perf_cpu_map__cpu(node_map, i).cpu)) {
414 numa_topology__delete(tp);
415 tp = NULL;
416 break;
420 out:
421 free(buf);
422 fclose(fp);
423 perf_cpu_map__put(node_map);
424 return tp;
427 void numa_topology__delete(struct numa_topology *tp)
429 u32 i;
431 for (i = 0; i < tp->nr; i++)
432 zfree(&tp->nodes[i].cpus);
434 free(tp);
437 static int load_hybrid_node(struct hybrid_topology_node *node,
438 struct perf_pmu *pmu)
440 char *buf = NULL, *p;
441 FILE *fp;
442 size_t len = 0;
444 node->pmu_name = strdup(pmu->name);
445 if (!node->pmu_name)
446 return -1;
448 fp = perf_pmu__open_file(pmu, "cpus");
449 if (!fp)
450 goto err;
452 if (getline(&buf, &len, fp) <= 0) {
453 fclose(fp);
454 goto err;
457 p = strchr(buf, '\n');
458 if (p)
459 *p = '\0';
461 fclose(fp);
462 node->cpus = buf;
463 return 0;
465 err:
466 zfree(&node->pmu_name);
467 free(buf);
468 return -1;
471 struct hybrid_topology *hybrid_topology__new(void)
473 struct perf_pmu *pmu = NULL;
474 struct hybrid_topology *tp = NULL;
475 int nr = perf_pmus__num_core_pmus(), i = 0;
477 if (nr <= 1)
478 return NULL;
480 tp = zalloc(sizeof(*tp) + sizeof(tp->nodes[0]) * nr);
481 if (!tp)
482 return NULL;
484 tp->nr = nr;
485 while ((pmu = perf_pmus__scan_core(pmu)) != NULL) {
486 if (load_hybrid_node(&tp->nodes[i], pmu)) {
487 hybrid_topology__delete(tp);
488 return NULL;
490 i++;
493 return tp;
496 void hybrid_topology__delete(struct hybrid_topology *tp)
498 u32 i;
500 for (i = 0; i < tp->nr; i++) {
501 zfree(&tp->nodes[i].pmu_name);
502 zfree(&tp->nodes[i].cpus);
505 free(tp);