1 // SPDX-License-Identifier: GPL-2.0
2 #include <linux/list.h>
3 #include <linux/list_sort.h>
4 #include <linux/string.h>
5 #include <linux/zalloc.h>
6 #include <subcmd/pager.h>
18 #include "print-events.h"
21 * core_pmus: A PMU belongs to core_pmus if its name is "cpu" or its sysfs
22 * directory contains a "cpus" file. All PMUs belonging to core_pmus
23 * must have pmu->is_core=1. If there is more than one PMU in
24 * this list, perf interprets it as a heterogeneous platform.
25 * (FWIW, certain ARM platforms having heterogeneous cores use a
26 * homogeneous PMU, and thus they are treated as a homogeneous
27 * platform by perf because core_pmus will have only one entry)
28 * other_pmus: All other PMUs which are not part of the core_pmus list. It doesn't
29 * matter whether a PMU is present per SMT-thread or outside of the
30 * core in the hw. For example, an instance of the AMD ibs_fetch// and
31 * ibs_op// PMUs is present in each hw SMT thread; however, they
32 * are captured under other_pmus. PMUs belonging to other_pmus
33 * must have pmu->is_core=0 but pmu->is_uncore could be 0 or 1.
/* Every PMU loaded so far is linked on exactly one of these two lists. */
35 static LIST_HEAD(core_pmus);
36 static LIST_HEAD(other_pmus);
/*
 * Set by pmu_read_sysfs() and cleared by perf_pmus__destroy(). They are
 * tested before sysfs is consulted again for a PMU that was not found.
 */
37 static bool read_sysfs_core_pmus;
38 static bool read_sysfs_all_pmus;
/* Forward declaration: perf_pmus__find() calls this ahead of its definition. */
40 static void pmu_read_sysfs(bool core_only);
/*
 * pmu_name_len_no_suffix() - length of a PMU name without a "_<digits>" suffix.
 * @str: NUL-terminated PMU name.
 * @num: where the suffix value, parsed as base 10 by strtoul(), is stored.
 *       NOTE(review): callers in this file pass NULL - confirm the store
 *       is guarded.
 *
 * Only names starting with "uncore_" are inspected for a suffix. A suffix is
 * recognised when at least one trailing digit is preceded by '_'.
 */
42 int pmu_name_len_no_suffix(const char *str, unsigned long *num)
46 orig_len = len = strlen(str);
48 /* Non-uncore PMUs have their full length, for example, i915. */
49 if (!strstarts(str, "uncore_"))
53 * Count trailing digits and '_', if '_{num}' suffix isn't present use
56 while (len > 0 && isdigit(str[len - 1]))
/* len != orig_len means the digit scan above consumed at least one digit. */
59 if (len > 0 && len != orig_len && str[len - 1] == '_') {
/* &str[len] is the first character after the '_'. */
61 *num = strtoul(&str[len], NULL, 10);
/*
 * perf_pmus__destroy() - delete every PMU on core_pmus and other_pmus.
 *
 * Both lists are walked with list_for_each_entry_safe() because
 * perf_pmu__delete() is called on the entry being visited. The read_sysfs_*
 * flags are cleared afterwards, so pmu_read_sysfs() no longer treats sysfs
 * as already read.
 */
67 void perf_pmus__destroy(void)
69 struct perf_pmu *pmu, *tmp;
71 list_for_each_entry_safe(pmu, tmp, &core_pmus, list) {
74 perf_pmu__delete(pmu);
76 list_for_each_entry_safe(pmu, tmp, &other_pmus, list) {
79 perf_pmu__delete(pmu);
81 read_sysfs_core_pmus = false;
82 read_sysfs_all_pmus = false;
/*
 * pmu_find() - search the already-loaded PMUs by name.
 * @name: string compared with strcmp() against each PMU.
 *
 * core_pmus is searched before other_pmus. An entry matches on pmu->name or,
 * when it is set, on pmu->alias_name.
 * NOTE(review): pmu->name is passed to strcmp() unguarded here, whereas
 * pmus_cmp() substitutes "" for a NULL name - confirm name cannot be NULL.
 */
85 static struct perf_pmu *pmu_find(const char *name)
89 list_for_each_entry(pmu, &core_pmus, list) {
90 if (!strcmp(pmu->name, name) ||
91 (pmu->alias_name && !strcmp(pmu->alias_name, name)))
94 list_for_each_entry(pmu, &other_pmus, list) {
95 if (!strcmp(pmu->name, name) ||
96 (pmu->alias_name && !strcmp(pmu->alias_name, name)))
/*
 * perf_pmus__find() - find a PMU by name, loading it from sysfs on demand.
 * @name: PMU name or alias name.
 *
 * Attempts, in order: the loaded lists via pmu_find(); a direct
 * perf_pmu__lookup() of @name under the event source devices directory; and
 * finally a pmu_read_sysfs() scan followed by a second pmu_find(), which
 * covers the case where @name is an alias.
 */
103 struct perf_pmu *perf_pmus__find(const char *name)
105 struct perf_pmu *pmu;
110 * Once PMU is loaded it stays in the list,
111 * so we keep us from multiple reading/parsing
112 * the pmu format definitions.
114 pmu = pmu_find(name);
/* The flags record that sysfs was already scanned for this class of PMU. */
118 if (read_sysfs_all_pmus)
121 core_pmu = is_pmu_core(name);
122 if (core_pmu && read_sysfs_core_pmus)
125 dirfd = perf_pmu__event_source_devices_fd();
/* Core PMUs are added to core_pmus, everything else to other_pmus. */
126 pmu = perf_pmu__lookup(core_pmu ? &core_pmus : &other_pmus, dirfd, name);
131 * Looking up an inidividual PMU failed. This may mean name is
132 * an alias, so read the PMUs from sysfs and try to find again.
134 pmu_read_sysfs(core_pmu);
135 pmu = pmu_find(name);
/*
 * perf_pmu__find2() - variant of perf_pmus__find() that takes the directory
 * fd from the caller and ends with a single perf_pmu__lookup(), without the
 * alias fallback scan.
 * @dirfd: fd handed through to perf_pmu__lookup().
 * @name: PMU name.
 *
 * pmu_read_sysfs() calls this once per directory entry; there the useful
 * effect is the PMU being added to core_pmus or other_pmus.
 */
140 static struct perf_pmu *perf_pmu__find2(int dirfd, const char *name)
142 struct perf_pmu *pmu;
146 * Once PMU is loaded it stays in the list,
147 * so we keep us from multiple reading/parsing
148 * the pmu format definitions.
150 pmu = pmu_find(name);
154 if (read_sysfs_all_pmus)
157 core_pmu = is_pmu_core(name);
158 if (core_pmu && read_sysfs_core_pmus)
161 return perf_pmu__lookup(core_pmu ? &core_pmus : &other_pmus, dirfd, name);
/*
 * pmus_cmp() - list_sort() comparator for the PMU lists.
 * @priv: unused.
 * @lhs: list node embedded in the left-hand struct perf_pmu.
 * @rhs: list node embedded in the right-hand struct perf_pmu.
 *
 * A NULL name is treated as "". Names are compared with strncmp() over the
 * shorter of the two suffix-less lengths from pmu_name_len_no_suffix(). The
 * final numeric comparison orders by suffix value, so a suffix of 2 sorts
 * before a suffix of 10.
 * NOTE(review): when the two lengths differ and one prefix is a prefix of the
 * other, strncmp() over the shorter length yields 0 - confirm the comparator
 * does not then report such distinct names as equal.
 */
164 static int pmus_cmp(void *priv __maybe_unused,
165 const struct list_head *lhs, const struct list_head *rhs)
167 unsigned long lhs_num = 0, rhs_num = 0;
168 struct perf_pmu *lhs_pmu = container_of(lhs, struct perf_pmu, list);
169 struct perf_pmu *rhs_pmu = container_of(rhs, struct perf_pmu, list);
170 const char *lhs_pmu_name = lhs_pmu->name ?: "";
171 const char *rhs_pmu_name = rhs_pmu->name ?: "";
172 int lhs_pmu_name_len = pmu_name_len_no_suffix(lhs_pmu_name, &lhs_num);
173 int rhs_pmu_name_len = pmu_name_len_no_suffix(rhs_pmu_name, &rhs_num);
174 int ret = strncmp(lhs_pmu_name, rhs_pmu_name,
175 lhs_pmu_name_len < rhs_pmu_name_len ? lhs_pmu_name_len : rhs_pmu_name_len);
/* Suffix numbers only matter for equal, non-empty base names. */
177 if (lhs_pmu_name_len != rhs_pmu_name_len || ret != 0 || lhs_pmu_name_len == 0)
180 return lhs_num < rhs_num ? -1 : (lhs_num > rhs_num ? 1 : 0);
183 /* Add all pmus in sysfs to pmu list: */
/*
 * @core_only: when true, directory entries for which is_pmu_core() is false
 *             are not loaded.
 *
 * The scan is guarded by the read_sysfs_* flags. Each remaining entry of the
 * event source devices directory (other than "." and "..") is handed to
 * perf_pmu__find2(). If core_pmus is still empty afterwards, a placeholder
 * core PMU is requested. Both lists are then sorted with pmus_cmp() and the
 * flags are updated.
 */
184 static void pmu_read_sysfs(bool core_only)
/* Nothing to do when an equivalent or wider scan has already been recorded. */
190 if (read_sysfs_all_pmus || (core_only && read_sysfs_core_pmus))
193 fd = perf_pmu__event_source_devices_fd();
203 while ((dent = readdir(dir))) {
204 if (!strcmp(dent->d_name, ".") || !strcmp(dent->d_name, ".."))
206 if (core_only && !is_pmu_core(dent->d_name))
208 /* add to static LIST_HEAD(core_pmus) or LIST_HEAD(other_pmus): */
209 perf_pmu__find2(fd, dent->d_name);
/* No core PMU was found in sysfs: fall back to a placeholder entry. */
213 if (list_empty(&core_pmus)) {
214 if (!perf_pmu__create_placeholder_core_pmu(&core_pmus))
215 pr_err("Failure to set up any core PMUs\n");
217 list_sort(NULL, &core_pmus, pmus_cmp);
218 list_sort(NULL, &other_pmus, pmus_cmp);
/* The core flag is only set when there is at least one core PMU to show for it. */
219 if (!list_empty(&core_pmus)) {
220 read_sysfs_core_pmus = true;
222 read_sysfs_all_pmus = true;
/*
 * __perf_pmus__find_by_type() - search the loaded PMUs for a matching
 * pmu->type, core_pmus first and then other_pmus.
 * @type: value compared against pmu->type.
 */
226 static struct perf_pmu *__perf_pmus__find_by_type(unsigned int type)
228 struct perf_pmu *pmu;
230 list_for_each_entry(pmu, &core_pmus, list) {
231 if (pmu->type == type)
235 list_for_each_entry(pmu, &other_pmus, list) {
236 if (pmu->type == type)
/*
 * perf_pmus__find_by_type() - find a PMU by type, scanning sysfs if needed.
 * @type: value compared against pmu->type.
 *
 * The loaded lists are searched first. When that misses and sysfs has not
 * been fully read yet, all PMUs are read and the search is repeated.
 */
242 struct perf_pmu *perf_pmus__find_by_type(unsigned int type)
244 struct perf_pmu *pmu = __perf_pmus__find_by_type(type);
/* A hit, or a miss after a complete scan, is final. */
246 if (pmu || read_sysfs_all_pmus)
249 pmu_read_sysfs(/*core_only=*/false);
250 pmu = __perf_pmus__find_by_type(type);
255 * pmu iterator: If pmu is NULL, we start at the beginning, otherwise return the
256 * next pmu. Returns NULL at the end.
258 struct perf_pmu *perf_pmus__scan(struct perf_pmu *pmu)
/* A NULL cursor or a core PMU cursor means iteration is still on core_pmus. */
260 bool use_core_pmus = !pmu || pmu->is_core;
/* Make sure both lists are fully populated (a full, not core-only, scan). */
263 pmu_read_sysfs(/*core_only=*/false);
/* list_prepare_entry() lets the _continue iterator below start from the list head. */
264 pmu = list_prepare_entry(pmu, &core_pmus, list);
267 list_for_each_entry_continue(pmu, &core_pmus, list)
/* Same start-from-head preparation for other_pmus. */
271 pmu = list_prepare_entry(pmu, &other_pmus, list);
273 list_for_each_entry_continue(pmu, &other_pmus, list)
/*
 * perf_pmus__scan_core() - iterator restricted to core_pmus.
 * @pmu: cursor; the entry after it on core_pmus is visited next.
 *
 * Starting an iteration triggers a core-only sysfs read and yields the first
 * entry of core_pmus, or NULL when that list is empty.
 */
278 struct perf_pmu *perf_pmus__scan_core(struct perf_pmu *pmu)
281 pmu_read_sysfs(/*core_only=*/true);
282 return list_first_entry_or_null(&core_pmus, typeof(*pmu), list);
284 list_for_each_entry_continue(pmu, &core_pmus, list)
/*
 * perf_pmus__scan_skip_duplicates() - iterator like perf_pmus__scan() that
 * compares each candidate with the PMU passed in.
 * @pmu: previously returned PMU, or NULL to start.
 *
 * A candidate has the same base name as @pmu when both suffix-less lengths
 * (pmu_name_len_no_suffix()) are equal and the names agree over that length.
 * NOTE(review): presumably such candidates are skipped, so only one PMU per
 * base name is returned - confirm.
 */
290 static struct perf_pmu *perf_pmus__scan_skip_duplicates(struct perf_pmu *pmu)
292 bool use_core_pmus = !pmu || pmu->is_core;
293 int last_pmu_name_len = 0;
/* A NULL cursor or a NULL name is represented by the empty string. */
294 const char *last_pmu_name = (pmu && pmu->name) ? pmu->name : "";
297 pmu_read_sysfs(/*core_only=*/false);
298 pmu = list_prepare_entry(pmu, &core_pmus, list);
300 last_pmu_name_len = pmu_name_len_no_suffix(pmu->name ?: "", NULL);
303 list_for_each_entry_continue(pmu, &core_pmus, list) {
304 int pmu_name_len = pmu_name_len_no_suffix(pmu->name ?: "", /*num=*/NULL);
/* Same base-name length and same base-name bytes as the previous PMU. */
306 if (last_pmu_name_len == pmu_name_len &&
307 !strncmp(last_pmu_name, pmu->name ?: "", pmu_name_len))
313 pmu = list_prepare_entry(pmu, &other_pmus, list);
315 list_for_each_entry_continue(pmu, &other_pmus, list) {
316 int pmu_name_len = pmu_name_len_no_suffix(pmu->name ?: "", /*num=*/NULL);
318 if (last_pmu_name_len == pmu_name_len &&
319 !strncmp(last_pmu_name, pmu->name ?: "", pmu_name_len))
/*
 * perf_pmus__pmu_for_pmu_filter() - find the PMU that a filter string names.
 * @str: filter string.
 *
 * Every PMU from perf_pmus__scan() is tested for an exact name match, then
 * for a match with a leading "uncore_" removed, then with a leading "cpu_"
 * removed. The literals 7 and 4 are the lengths of those prefixes.
 * NOTE(review): pmu->name is used unguarded here, while other code in this
 * file substitutes "" for a NULL name - confirm name cannot be NULL.
 */
327 const struct perf_pmu *perf_pmus__pmu_for_pmu_filter(const char *str)
329 struct perf_pmu *pmu = NULL;
331 while ((pmu = perf_pmus__scan(pmu)) != NULL) {
332 if (!strcmp(pmu->name, str))
334 /* Ignore "uncore_" prefix. */
335 if (!strncmp(pmu->name, "uncore_", 7)) {
336 if (!strcmp(pmu->name + 7, str))
339 /* Ignore "cpu_" prefix on Intel hybrid PMUs. */
340 if (!strncmp(pmu->name, "cpu_", 4)) {
341 if (!strcmp(pmu->name + 4, str))
348 /** Struct for ordering events as output in perf list. */
350 /** PMU for event. */
351 const struct perf_pmu *pmu;
/* The strings below are strdup() copies made by the print callback and released with zfree(). */
354 const char *scale_unit;
356 const char *long_desc;
357 const char *encoding_desc;
/* Used for ordering in cmp_sevent() and for duplicate detection. */
359 const char *pmu_name;
/*
 * cmp_sevent() - qsort() comparator for struct sevent.
 * @a: left-hand struct sevent.
 * @b: right-hand struct sevent.
 *
 * Sort keys, in order: presence of a description, topic, core-PMU events
 * first, PMU name (only when the PMU pointers differ), event name.
 * NOTE(review): as->name and bs->name reach strcmp() unguarded, whereas
 * pmu_alias_is_duplicate() allows a NULL name - confirm name cannot be NULL.
 */
363 static int cmp_sevent(const void *a, const void *b)
365 const struct sevent *as = a;
366 const struct sevent *bs = b;
367 bool a_iscpu, b_iscpu;
370 /* Put extra events last. */
371 if (!!as->desc != !!bs->desc)
372 return !!as->desc - !!bs->desc;
374 /* Order by topics. */
375 ret = strcmp(as->topic ?: "", bs->topic ?: "");
379 /* Order CPU core events to be first */
/* An event without a PMU pointer is treated as a core event. */
380 a_iscpu = as->pmu ? as->pmu->is_core : true;
381 b_iscpu = bs->pmu ? bs->pmu->is_core : true;
382 if (a_iscpu != b_iscpu)
383 return a_iscpu ? -1 : 1;
385 /* Order by PMU name. */
386 if (as->pmu != bs->pmu) {
387 ret = strcmp(as->pmu_name ?: "", bs->pmu_name ?: "");
392 /* Order by event name. */
393 return strcmp(as->name, bs->name);
/*
 * pmu_alias_is_duplicate() - true when two events have the same name and the
 * same PMU name.
 * @a: first event.
 * @b: second event.
 *
 * A NULL event name is compared as "//".
 * NOTE(review): pmu_name is passed to strcmp() unguarded, whereas cmp_sevent()
 * substitutes "" for a NULL pmu_name - confirm pmu_name cannot be NULL here.
 */
396 static bool pmu_alias_is_duplicate(struct sevent *a, struct sevent *b)
398 /* Different names -> never duplicates */
399 if (strcmp(a->name ?: "//", b->name ?: "//"))
402 /* Don't remove duplicates for different PMUs */
403 return strcmp(a->pmu_name, b->pmu_name) == 0;
/* State handed to perf_pmus__print_pmu_events__callback() through its void pointer. */
406 struct events_callback_state {
/* Array of events being filled in by the callback. */
407 struct sevent *aliases;
/*
 * perf_pmus__print_pmu_events__callback() - store one event in the array.
 * @vstate: struct events_callback_state holding the array and the cursor.
 * @info: description of the event to copy.
 *
 * The slot at state->index is filled from @info. An index at or beyond
 * state->aliases_len is reported with pr_err().
 */
412 static int perf_pmus__print_pmu_events__callback(void *vstate,
413 struct pmu_event_info *info)
415 struct events_callback_state *state = vstate;
/* More events arrived than were counted when the array was sized. */
418 if (state->index >= state->aliases_len) {
419 pr_err("Unexpected event %s/%s/\n", info->pmu->name, info->name);
422 s = &state->aliases[state->index];
/*
 * Copy a same-named string field from info into s; NULL stays NULL.
 * NOTE(review): a failed strdup() also leaves NULL and is not reported.
 */
424 #define COPY_STR(str) s->str = info->str ? strdup(info->str) : NULL
427 COPY_STR(scale_unit);
430 COPY_STR(encoding_desc);
434 s->deprecated = info->deprecated;
/*
 * perf_pmus__print_pmu_events() - print the events of all PMUs in sorted order.
 * @print_cb: callbacks used to query options and to print each event.
 * @print_state: opaque state passed back to every @print_cb callback.
 *
 * Works in two passes over the PMUs: the first sums perf_pmu__num_events() to
 * size the array, the second fills it through
 * perf_pmus__print_pmu_events__callback(). The array is then sorted with
 * cmp_sevent(), printed, and the copied strings are released.
 */
439 void perf_pmus__print_pmu_events(const struct print_callbacks *print_cb, void *print_state)
441 struct perf_pmu *pmu;
444 struct sevent *aliases;
445 struct events_callback_state state;
446 bool skip_duplicate_pmus = print_cb->skip_duplicate_pmus(print_state);
447 struct perf_pmu *(*scan_fn)(struct perf_pmu *);
/* Use the same iterator for counting and for filling so both passes see the same PMUs. */
449 if (skip_duplicate_pmus)
450 scan_fn = perf_pmus__scan_skip_duplicates;
452 scan_fn = perf_pmus__scan;
456 while ((pmu = scan_fn(pmu)) != NULL)
457 len += perf_pmu__num_events(pmu);
459 aliases = zalloc(sizeof(struct sevent) * len);
461 pr_err("FATAL: not enough memory to print PMU events\n");
465 state = (struct events_callback_state) {
470 while ((pmu = scan_fn(pmu)) != NULL) {
471 perf_pmu__for_each_event(pmu, skip_duplicate_pmus, &state,
472 perf_pmus__print_pmu_events__callback);
474 qsort(aliases, len, sizeof(struct sevent), cmp_sevent);
475 for (int j = 0; j < len; j++) {
476 /* Skip duplicates */
/*
 * NOTE(review): aliases[j - 1] had its strings released by the zfree() calls
 * of the previous iteration if it was printed, so this check compares against
 * cleared fields - confirm duplicates are still detected. Also confirm that
 * the strings of a skipped entry are freed.
 */
477 if (j > 0 && pmu_alias_is_duplicate(&aliases[j], &aliases[j - 1]))
480 print_cb->print_event(print_state,
485 aliases[j].scale_unit,
486 aliases[j].deprecated,
489 aliases[j].long_desc,
490 aliases[j].encoding_desc);
/* Release the strdup() copies made by the fill callback. */
491 zfree(&aliases[j].name);
492 zfree(&aliases[j].alias);
493 zfree(&aliases[j].scale_unit);
494 zfree(&aliases[j].desc);
495 zfree(&aliases[j].long_desc);
496 zfree(&aliases[j].encoding_desc);
497 zfree(&aliases[j].topic);
498 zfree(&aliases[j].pmu_name);
500 if (printed && pager_in_use())
/*
 * perf_pmus__have_event() - does PMU @pname exist and have event @name?
 * @pname: PMU name, resolved with perf_pmus__find().
 * @name: event name passed to perf_pmu__have_event().
 *
 * Returns false when the PMU cannot be found.
 */
506 bool perf_pmus__have_event(const char *pname, const char *name)
508 struct perf_pmu *pmu = perf_pmus__find(pname);
510 return pmu && perf_pmu__have_event(pmu, name);
/*
 * perf_pmus__num_core_pmus() - number of core PMUs.
 *
 * The core PMUs are enumerated with perf_pmus__scan_core(), which reads them
 * from sysfs on first use.
 */
513 int perf_pmus__num_core_pmus(void)
518 struct perf_pmu *pmu = NULL;
520 while ((pmu = perf_pmus__scan_core(pmu)) != NULL)
/*
 * __perf_pmus__supports_extended_type() - probe whether a PMU type can be
 * encoded in the config of a PERF_TYPE_HARDWARE event.
 *
 * With at most one core PMU the answer is decided without probing. Otherwise
 * each core PMU is probed with a cpu-cycles hardware event whose config has
 * pmu->type shifted up by PERF_PMU_TYPE_SHIFT.
 */
526 static bool __perf_pmus__supports_extended_type(void)
528 struct perf_pmu *pmu = NULL;
530 if (perf_pmus__num_core_pmus() <= 1)
533 while ((pmu = perf_pmus__scan_core(pmu)) != NULL) {
/* The 64-bit cast keeps the shifted type from being truncated. */
534 if (!is_event_supported(PERF_TYPE_HARDWARE, PERF_COUNT_HW_CPU_CYCLES | ((__u64)pmu->type << PERF_PMU_TYPE_SHIFT)))
/* Cached result of __perf_pmus__supports_extended_type(). */
541 static bool perf_pmus__do_support_extended_type;
/* pthread_once() routine that runs the probe and stores its result. */
543 static void perf_pmus__init_supports_extended_type(void)
545 perf_pmus__do_support_extended_type = __perf_pmus__supports_extended_type();
/*
 * perf_pmus__supports_extended_type() - cached extended-type support query.
 *
 * The probe is run through pthread_once(), so it executes at most once per
 * process and later calls return the stored result.
 */
548 bool perf_pmus__supports_extended_type(void)
550 static pthread_once_t extended_type_once = PTHREAD_ONCE_INIT;
552 pthread_once(&extended_type_once, perf_pmus__init_supports_extended_type);
554 return perf_pmus__do_support_extended_type;
/*
 * perf_pmus__default_pmu_name() - name of a core PMU to use by default.
 *
 * Every return value comes from strdup(), so the result is heap-allocated
 * and may be NULL if the allocation fails. If core_pmus already has entries,
 * the first one's name is used. Otherwise the event source devices directory
 * is read directly and the first entry accepted by is_pmu_core() is used.
 * "cpu" is the fallback.
 * NOTE(review): presumably the caller frees the result - confirm.
 */
557 char *perf_pmus__default_pmu_name(void)
564 if (!list_empty(&core_pmus))
565 return strdup(list_first_entry(&core_pmus, struct perf_pmu, list)->name);
567 fd = perf_pmu__event_source_devices_fd();
569 return strdup("cpu");
574 return strdup("cpu");
577 while ((dent = readdir(dir))) {
578 if (!strcmp(dent->d_name, ".") || !strcmp(dent->d_name, ".."))
580 if (is_pmu_core(dent->d_name)) {
581 result = strdup(dent->d_name);
/* No core PMU directory was found (or the copy failed): use "cpu". */
587 return result ?: strdup("cpu");
/*
 * evsel__find_pmu() - PMU for an evsel, looked up by attr.type when needed.
 * @evsel: event selector; its pmu field is used as a cache.
 *
 * The result of perf_pmus__find_by_type() is written back into evsel->pmu,
 * which requires casting away the const qualifier of @evsel.
 */
590 struct perf_pmu *evsel__find_pmu(const struct evsel *evsel)
592 struct perf_pmu *pmu = evsel->pmu;
595 pmu = perf_pmus__find_by_type(evsel->core.attr.type);
596 ((struct evsel *)evsel)->pmu = pmu;
/*
 * perf_pmus__find_core_pmu() - first core PMU, as returned by starting a
 * perf_pmus__scan_core() iteration with a NULL cursor.
 */
601 struct perf_pmu *perf_pmus__find_core_pmu(void)
603 return perf_pmus__scan_core(NULL);