perf evlist: Fix max mmap_pages
[linux-block.git] / tools / perf / util / evlist.c
CommitLineData
f8a95309
ACM
1/*
2 * Copyright (C) 2011, Red Hat Inc, Arnaldo Carvalho de Melo <acme@redhat.com>
3 *
4 * Parts came from builtin-{top,stat,record}.c, see those files for further
5 * copyright notes.
6 *
7 * Released under the GPL v2. (and only v2, not any later version)
8 */
a8c9ae18 9#include "util.h"
85c66be1 10#include <lk/debugfs.h>
5c581041 11#include <poll.h>
f8a95309
ACM
12#include "cpumap.h"
13#include "thread_map.h"
12864b31 14#include "target.h"
361c99a6
ACM
15#include "evlist.h"
16#include "evsel.h"
e3e1a54f 17#include "debug.h"
35b9d88e 18#include <unistd.h>
361c99a6 19
50d08e47 20#include "parse-events.h"
994a1f78 21#include "parse-options.h"
50d08e47 22
f8a95309
ACM
23#include <sys/mman.h>
24
70db7533
ACM
25#include <linux/bitops.h>
26#include <linux/hash.h>
27
/*
 * Accessors for the per-(cpu, thread) tables hanging off an evsel.
 * FD() yields the int stored in the evsel's fd table (usable as an lvalue),
 * SID() yields the matching entry of the sample_id table.
 * Arguments are parenthesized so that arbitrary expressions can be passed.
 */
#define FD(e, x, y) (*(int *)xyarray__entry((e)->fd, (x), (y)))
#define SID(e, x, y) xyarray__entry((e)->sample_id, (x), (y))
f8a95309 30
7e2ed097
ACM
31void perf_evlist__init(struct perf_evlist *evlist, struct cpu_map *cpus,
32 struct thread_map *threads)
ef1d1af2
ACM
33{
34 int i;
35
36 for (i = 0; i < PERF_EVLIST__HLIST_SIZE; ++i)
37 INIT_HLIST_HEAD(&evlist->heads[i]);
38 INIT_LIST_HEAD(&evlist->entries);
7e2ed097 39 perf_evlist__set_maps(evlist, cpus, threads);
35b9d88e 40 evlist->workload.pid = -1;
ef1d1af2
ACM
41}
42
334fe7a3 43struct perf_evlist *perf_evlist__new(void)
361c99a6
ACM
44{
45 struct perf_evlist *evlist = zalloc(sizeof(*evlist));
46
ef1d1af2 47 if (evlist != NULL)
334fe7a3 48 perf_evlist__init(evlist, NULL, NULL);
361c99a6
ACM
49
50 return evlist;
51}
52
b22d54b0
JO
/*
 * Create an evlist that already contains the default event added by
 * perf_evlist__add_default(). Returns NULL if either the allocation or
 * adding the default event fails; a partially built list is deleted.
 */
struct perf_evlist *perf_evlist__new_default(void)
{
	struct perf_evlist *fresh = perf_evlist__new();

	if (fresh == NULL)
		return NULL;

	if (perf_evlist__add_default(fresh) != 0) {
		perf_evlist__delete(fresh);
		return NULL;
	}

	return fresh;
}
64
75562573
AH
65/**
66 * perf_evlist__set_id_pos - set the positions of event ids.
67 * @evlist: selected event list
68 *
69 * Events with compatible sample types all have the same id_pos
70 * and is_pos. For convenience, put a copy on evlist.
71 */
72void perf_evlist__set_id_pos(struct perf_evlist *evlist)
73{
74 struct perf_evsel *first = perf_evlist__first(evlist);
75
76 evlist->id_pos = first->id_pos;
77 evlist->is_pos = first->is_pos;
78}
79
733cd2fe
AH
80static void perf_evlist__update_id_pos(struct perf_evlist *evlist)
81{
82 struct perf_evsel *evsel;
83
84 list_for_each_entry(evsel, &evlist->entries, node)
85 perf_evsel__calc_id_pos(evsel);
86
87 perf_evlist__set_id_pos(evlist);
88}
89
361c99a6
ACM
90static void perf_evlist__purge(struct perf_evlist *evlist)
91{
92 struct perf_evsel *pos, *n;
93
94 list_for_each_entry_safe(pos, n, &evlist->entries, node) {
95 list_del_init(&pos->node);
96 perf_evsel__delete(pos);
97 }
98
99 evlist->nr_entries = 0;
100}
101
ef1d1af2 102void perf_evlist__exit(struct perf_evlist *evlist)
361c99a6 103{
70db7533 104 free(evlist->mmap);
5c581041 105 free(evlist->pollfd);
ef1d1af2
ACM
106 evlist->mmap = NULL;
107 evlist->pollfd = NULL;
108}
109
/*
 * Destroy an evlist: delete all of its events, release its arrays and
 * finally free the evlist structure itself.
 */
void perf_evlist__delete(struct perf_evlist *evlist)
{
	/* events first, then the arrays, then the container */
	perf_evlist__purge(evlist);
	perf_evlist__exit(evlist);

	free(evlist);
}
116
117void perf_evlist__add(struct perf_evlist *evlist, struct perf_evsel *entry)
118{
119 list_add_tail(&entry->node, &evlist->entries);
ef503831
ACM
120 entry->idx = evlist->nr_entries;
121
75562573
AH
122 if (!evlist->nr_entries++)
123 perf_evlist__set_id_pos(evlist);
361c99a6
ACM
124}
125
0529bc1f
JO
126void perf_evlist__splice_list_tail(struct perf_evlist *evlist,
127 struct list_head *list,
128 int nr_entries)
50d08e47 129{
75562573
AH
130 bool set_id_pos = !evlist->nr_entries;
131
50d08e47
ACM
132 list_splice_tail(list, &evlist->entries);
133 evlist->nr_entries += nr_entries;
75562573
AH
134 if (set_id_pos)
135 perf_evlist__set_id_pos(evlist);
50d08e47
ACM
136}
137
63dab225
ACM
138void __perf_evlist__set_leader(struct list_head *list)
139{
140 struct perf_evsel *evsel, *leader;
141
142 leader = list_entry(list->next, struct perf_evsel, node);
97f63e4a
NK
143 evsel = list_entry(list->prev, struct perf_evsel, node);
144
145 leader->nr_members = evsel->idx - leader->idx + 1;
63dab225
ACM
146
147 list_for_each_entry(evsel, list, node) {
74b2133d 148 evsel->leader = leader;
63dab225
ACM
149 }
150}
151
152void perf_evlist__set_leader(struct perf_evlist *evlist)
6a4bb04c 153{
97f63e4a
NK
154 if (evlist->nr_entries) {
155 evlist->nr_groups = evlist->nr_entries > 1 ? 1 : 0;
63dab225 156 __perf_evlist__set_leader(&evlist->entries);
97f63e4a 157 }
6a4bb04c
JO
158}
159
361c99a6
ACM
160int perf_evlist__add_default(struct perf_evlist *evlist)
161{
162 struct perf_event_attr attr = {
163 .type = PERF_TYPE_HARDWARE,
164 .config = PERF_COUNT_HW_CPU_CYCLES,
165 };
1aed2671
JR
166 struct perf_evsel *evsel;
167
168 event_attr_init(&attr);
361c99a6 169
ef503831 170 evsel = perf_evsel__new(&attr);
361c99a6 171 if (evsel == NULL)
cc2d86b0
SE
172 goto error;
173
174 /* use strdup() because free(evsel) assumes name is allocated */
175 evsel->name = strdup("cycles");
176 if (!evsel->name)
177 goto error_free;
361c99a6
ACM
178
179 perf_evlist__add(evlist, evsel);
180 return 0;
cc2d86b0
SE
181error_free:
182 perf_evsel__delete(evsel);
183error:
184 return -ENOMEM;
361c99a6 185}
5c581041 186
e60fc847
ACM
187static int perf_evlist__add_attrs(struct perf_evlist *evlist,
188 struct perf_event_attr *attrs, size_t nr_attrs)
50d08e47
ACM
189{
190 struct perf_evsel *evsel, *n;
191 LIST_HEAD(head);
192 size_t i;
193
194 for (i = 0; i < nr_attrs; i++) {
ef503831 195 evsel = perf_evsel__new_idx(attrs + i, evlist->nr_entries + i);
50d08e47
ACM
196 if (evsel == NULL)
197 goto out_delete_partial_list;
198 list_add_tail(&evsel->node, &head);
199 }
200
201 perf_evlist__splice_list_tail(evlist, &head, nr_attrs);
202
203 return 0;
204
205out_delete_partial_list:
206 list_for_each_entry_safe(evsel, n, &head, node)
207 perf_evsel__delete(evsel);
208 return -1;
209}
210
79695e1b
ACM
211int __perf_evlist__add_default_attrs(struct perf_evlist *evlist,
212 struct perf_event_attr *attrs, size_t nr_attrs)
213{
214 size_t i;
215
216 for (i = 0; i < nr_attrs; i++)
217 event_attr_init(attrs + i);
218
219 return perf_evlist__add_attrs(evlist, attrs, nr_attrs);
220}
221
da378962
ACM
222struct perf_evsel *
223perf_evlist__find_tracepoint_by_id(struct perf_evlist *evlist, int id)
ee29be62
ACM
224{
225 struct perf_evsel *evsel;
226
227 list_for_each_entry(evsel, &evlist->entries, node) {
228 if (evsel->attr.type == PERF_TYPE_TRACEPOINT &&
229 (int)evsel->attr.config == id)
230 return evsel;
231 }
232
233 return NULL;
234}
235
a2f2804a
DA
236struct perf_evsel *
237perf_evlist__find_tracepoint_by_name(struct perf_evlist *evlist,
238 const char *name)
239{
240 struct perf_evsel *evsel;
241
242 list_for_each_entry(evsel, &evlist->entries, node) {
243 if ((evsel->attr.type == PERF_TYPE_TRACEPOINT) &&
244 (strcmp(evsel->name, name) == 0))
245 return evsel;
246 }
247
248 return NULL;
249}
250
39876e7d
ACM
251int perf_evlist__add_newtp(struct perf_evlist *evlist,
252 const char *sys, const char *name, void *handler)
253{
ef503831 254 struct perf_evsel *evsel = perf_evsel__newtp(sys, name);
39876e7d 255
39876e7d
ACM
256 if (evsel == NULL)
257 return -1;
258
744a9719 259 evsel->handler = handler;
39876e7d
ACM
260 perf_evlist__add(evlist, evsel);
261 return 0;
262}
263
4152ab37
ACM
264void perf_evlist__disable(struct perf_evlist *evlist)
265{
266 int cpu, thread;
267 struct perf_evsel *pos;
b3a319d5
NK
268 int nr_cpus = cpu_map__nr(evlist->cpus);
269 int nr_threads = thread_map__nr(evlist->threads);
4152ab37 270
b3a319d5 271 for (cpu = 0; cpu < nr_cpus; cpu++) {
4152ab37 272 list_for_each_entry(pos, &evlist->entries, node) {
395c3070 273 if (!perf_evsel__is_group_leader(pos) || !pos->fd)
3fe4430d 274 continue;
b3a319d5 275 for (thread = 0; thread < nr_threads; thread++)
55da8005
NK
276 ioctl(FD(pos, cpu, thread),
277 PERF_EVENT_IOC_DISABLE, 0);
4152ab37
ACM
278 }
279 }
280}
281
764e16a3
DA
282void perf_evlist__enable(struct perf_evlist *evlist)
283{
284 int cpu, thread;
285 struct perf_evsel *pos;
b3a319d5
NK
286 int nr_cpus = cpu_map__nr(evlist->cpus);
287 int nr_threads = thread_map__nr(evlist->threads);
764e16a3 288
b3a319d5 289 for (cpu = 0; cpu < nr_cpus; cpu++) {
764e16a3 290 list_for_each_entry(pos, &evlist->entries, node) {
395c3070 291 if (!perf_evsel__is_group_leader(pos) || !pos->fd)
3fe4430d 292 continue;
b3a319d5 293 for (thread = 0; thread < nr_threads; thread++)
55da8005
NK
294 ioctl(FD(pos, cpu, thread),
295 PERF_EVENT_IOC_ENABLE, 0);
764e16a3
DA
296 }
297 }
298}
299
395c3070
AH
300int perf_evlist__disable_event(struct perf_evlist *evlist,
301 struct perf_evsel *evsel)
302{
303 int cpu, thread, err;
304
305 if (!evsel->fd)
306 return 0;
307
308 for (cpu = 0; cpu < evlist->cpus->nr; cpu++) {
309 for (thread = 0; thread < evlist->threads->nr; thread++) {
310 err = ioctl(FD(evsel, cpu, thread),
311 PERF_EVENT_IOC_DISABLE, 0);
312 if (err)
313 return err;
314 }
315 }
316 return 0;
317}
318
319int perf_evlist__enable_event(struct perf_evlist *evlist,
320 struct perf_evsel *evsel)
321{
322 int cpu, thread, err;
323
324 if (!evsel->fd)
325 return -EINVAL;
326
327 for (cpu = 0; cpu < evlist->cpus->nr; cpu++) {
328 for (thread = 0; thread < evlist->threads->nr; thread++) {
329 err = ioctl(FD(evsel, cpu, thread),
330 PERF_EVENT_IOC_ENABLE, 0);
331 if (err)
332 return err;
333 }
334 }
335 return 0;
336}
337
806fb630 338static int perf_evlist__alloc_pollfd(struct perf_evlist *evlist)
5c581041 339{
b3a319d5
NK
340 int nr_cpus = cpu_map__nr(evlist->cpus);
341 int nr_threads = thread_map__nr(evlist->threads);
342 int nfds = nr_cpus * nr_threads * evlist->nr_entries;
5c581041
ACM
343 evlist->pollfd = malloc(sizeof(struct pollfd) * nfds);
344 return evlist->pollfd != NULL ? 0 : -ENOMEM;
345}
70082dd9
ACM
346
347void perf_evlist__add_pollfd(struct perf_evlist *evlist, int fd)
348{
349 fcntl(fd, F_SETFL, O_NONBLOCK);
350 evlist->pollfd[evlist->nr_fds].fd = fd;
351 evlist->pollfd[evlist->nr_fds].events = POLLIN;
352 evlist->nr_fds++;
353}
70db7533 354
a91e5431
ACM
355static void perf_evlist__id_hash(struct perf_evlist *evlist,
356 struct perf_evsel *evsel,
357 int cpu, int thread, u64 id)
3d3b5e95
ACM
358{
359 int hash;
360 struct perf_sample_id *sid = SID(evsel, cpu, thread);
361
362 sid->id = id;
363 sid->evsel = evsel;
364 hash = hash_64(sid->id, PERF_EVLIST__HLIST_BITS);
365 hlist_add_head(&sid->node, &evlist->heads[hash]);
366}
367
a91e5431
ACM
368void perf_evlist__id_add(struct perf_evlist *evlist, struct perf_evsel *evsel,
369 int cpu, int thread, u64 id)
370{
371 perf_evlist__id_hash(evlist, evsel, cpu, thread, id);
372 evsel->id[evsel->ids++] = id;
373}
374
375static int perf_evlist__id_add_fd(struct perf_evlist *evlist,
376 struct perf_evsel *evsel,
377 int cpu, int thread, int fd)
f8a95309 378{
f8a95309 379 u64 read_data[4] = { 0, };
3d3b5e95 380 int id_idx = 1; /* The first entry is the counter value */
e2b5abe0
JO
381 u64 id;
382 int ret;
383
384 ret = ioctl(fd, PERF_EVENT_IOC_ID, &id);
385 if (!ret)
386 goto add;
387
388 if (errno != ENOTTY)
389 return -1;
390
391 /* Legacy way to get event id.. All hail to old kernels! */
f8a95309 392
c4861afe
JO
393 /*
394 * This way does not work with group format read, so bail
395 * out in that case.
396 */
397 if (perf_evlist__read_format(evlist) & PERF_FORMAT_GROUP)
398 return -1;
399
f8a95309
ACM
400 if (!(evsel->attr.read_format & PERF_FORMAT_ID) ||
401 read(fd, &read_data, sizeof(read_data)) == -1)
402 return -1;
403
404 if (evsel->attr.read_format & PERF_FORMAT_TOTAL_TIME_ENABLED)
405 ++id_idx;
406 if (evsel->attr.read_format & PERF_FORMAT_TOTAL_TIME_RUNNING)
407 ++id_idx;
408
e2b5abe0
JO
409 id = read_data[id_idx];
410
411 add:
412 perf_evlist__id_add(evlist, evsel, cpu, thread, id);
f8a95309
ACM
413 return 0;
414}
415
932a3594 416struct perf_sample_id *perf_evlist__id2sid(struct perf_evlist *evlist, u64 id)
70db7533
ACM
417{
418 struct hlist_head *head;
70db7533
ACM
419 struct perf_sample_id *sid;
420 int hash;
421
70db7533
ACM
422 hash = hash_64(id, PERF_EVLIST__HLIST_BITS);
423 head = &evlist->heads[hash];
424
b67bfe0d 425 hlist_for_each_entry(sid, head, node)
70db7533 426 if (sid->id == id)
932a3594
JO
427 return sid;
428
429 return NULL;
430}
431
432struct perf_evsel *perf_evlist__id2evsel(struct perf_evlist *evlist, u64 id)
433{
434 struct perf_sample_id *sid;
435
436 if (evlist->nr_entries == 1)
437 return perf_evlist__first(evlist);
438
439 sid = perf_evlist__id2sid(evlist, id);
440 if (sid)
441 return sid->evsel;
30e68bcc
NK
442
443 if (!perf_evlist__sample_id_all(evlist))
0c21f736 444 return perf_evlist__first(evlist);
30e68bcc 445
70db7533
ACM
446 return NULL;
447}
04391deb 448
75562573
AH
449static int perf_evlist__event2id(struct perf_evlist *evlist,
450 union perf_event *event, u64 *id)
451{
452 const u64 *array = event->sample.array;
453 ssize_t n;
454
455 n = (event->header.size - sizeof(event->header)) >> 3;
456
457 if (event->header.type == PERF_RECORD_SAMPLE) {
458 if (evlist->id_pos >= n)
459 return -1;
460 *id = array[evlist->id_pos];
461 } else {
462 if (evlist->is_pos > n)
463 return -1;
464 n -= evlist->is_pos;
465 *id = array[n];
466 }
467 return 0;
468}
469
470static struct perf_evsel *perf_evlist__event2evsel(struct perf_evlist *evlist,
471 union perf_event *event)
472{
98be6966 473 struct perf_evsel *first = perf_evlist__first(evlist);
75562573
AH
474 struct hlist_head *head;
475 struct perf_sample_id *sid;
476 int hash;
477 u64 id;
478
479 if (evlist->nr_entries == 1)
98be6966
AH
480 return first;
481
482 if (!first->attr.sample_id_all &&
483 event->header.type != PERF_RECORD_SAMPLE)
484 return first;
75562573
AH
485
486 if (perf_evlist__event2id(evlist, event, &id))
487 return NULL;
488
489 /* Synthesized events have an id of zero */
490 if (!id)
98be6966 491 return first;
75562573
AH
492
493 hash = hash_64(id, PERF_EVLIST__HLIST_BITS);
494 head = &evlist->heads[hash];
495
496 hlist_for_each_entry(sid, head, node) {
497 if (sid->id == id)
498 return sid->evsel;
499 }
500 return NULL;
501}
502
aece948f 503union perf_event *perf_evlist__mmap_read(struct perf_evlist *evlist, int idx)
04391deb 504{
aece948f 505 struct perf_mmap *md = &evlist->mmap[idx];
04391deb
ACM
506 unsigned int head = perf_mmap__read_head(md);
507 unsigned int old = md->prev;
508 unsigned char *data = md->base + page_size;
8115d60c 509 union perf_event *event = NULL;
04391deb 510
7bb41152 511 if (evlist->overwrite) {
04391deb 512 /*
7bb41152
ACM
513 * If we're further behind than half the buffer, there's a chance
514 * the writer will bite our tail and mess up the samples under us.
515 *
516 * If we somehow ended up ahead of the head, we got messed up.
517 *
518 * In either case, truncate and restart at head.
04391deb 519 */
7bb41152
ACM
520 int diff = head - old;
521 if (diff > md->mask / 2 || diff < 0) {
522 fprintf(stderr, "WARNING: failed to keep up with mmap data.\n");
523
524 /*
525 * head points to a known good entry, start there.
526 */
527 old = head;
528 }
04391deb
ACM
529 }
530
531 if (old != head) {
532 size_t size;
533
8115d60c 534 event = (union perf_event *)&data[old & md->mask];
04391deb
ACM
535 size = event->header.size;
536
537 /*
538 * Event straddles the mmap boundary -- header should always
539 * be inside due to u64 alignment of output.
540 */
541 if ((old & md->mask) + size != ((old + size) & md->mask)) {
542 unsigned int offset = old;
543 unsigned int len = min(sizeof(*event), size), cpy;
a65cb4b9 544 void *dst = md->event_copy;
04391deb
ACM
545
546 do {
547 cpy = min(md->mask + 1 - (offset & md->mask), len);
548 memcpy(dst, &data[offset & md->mask], cpy);
549 offset += cpy;
550 dst += cpy;
551 len -= cpy;
552 } while (len);
553
a65cb4b9 554 event = (union perf_event *) md->event_copy;
04391deb
ACM
555 }
556
557 old += size;
558 }
559
560 md->prev = old;
7bb41152 561
04391deb
ACM
562 return event;
563}
f8a95309 564
8e50d384
ZZ
565void perf_evlist__mmap_consume(struct perf_evlist *evlist, int idx)
566{
567 if (!evlist->overwrite) {
568 struct perf_mmap *md = &evlist->mmap[idx];
569 unsigned int old = md->prev;
570
571 perf_mmap__write_tail(md, old);
572 }
573}
574
93edcbd9
AH
575static void __perf_evlist__munmap(struct perf_evlist *evlist, int idx)
576{
577 if (evlist->mmap[idx].base != NULL) {
578 munmap(evlist->mmap[idx].base, evlist->mmap_len);
579 evlist->mmap[idx].base = NULL;
580 }
581}
582
7e2ed097 583void perf_evlist__munmap(struct perf_evlist *evlist)
f8a95309 584{
aece948f 585 int i;
f8a95309 586
93edcbd9
AH
587 for (i = 0; i < evlist->nr_mmaps; i++)
588 __perf_evlist__munmap(evlist, i);
aece948f
ACM
589
590 free(evlist->mmap);
591 evlist->mmap = NULL;
f8a95309
ACM
592}
593
806fb630 594static int perf_evlist__alloc_mmap(struct perf_evlist *evlist)
f8a95309 595{
a14bb7a6 596 evlist->nr_mmaps = cpu_map__nr(evlist->cpus);
ec1e7e43 597 if (cpu_map__empty(evlist->cpus))
b3a319d5 598 evlist->nr_mmaps = thread_map__nr(evlist->threads);
aece948f 599 evlist->mmap = zalloc(evlist->nr_mmaps * sizeof(struct perf_mmap));
f8a95309
ACM
600 return evlist->mmap != NULL ? 0 : -ENOMEM;
601}
602
bccdaba0 603static int __perf_evlist__mmap(struct perf_evlist *evlist,
aece948f 604 int idx, int prot, int mask, int fd)
f8a95309 605{
aece948f
ACM
606 evlist->mmap[idx].prev = 0;
607 evlist->mmap[idx].mask = mask;
608 evlist->mmap[idx].base = mmap(NULL, evlist->mmap_len, prot,
f8a95309 609 MAP_SHARED, fd, 0);
301b195d 610 if (evlist->mmap[idx].base == MAP_FAILED) {
02635965
AH
611 pr_debug2("failed to mmap perf event ring buffer, error %d\n",
612 errno);
301b195d 613 evlist->mmap[idx].base = NULL;
f8a95309 614 return -1;
301b195d 615 }
f8a95309
ACM
616
617 perf_evlist__add_pollfd(evlist, fd);
618 return 0;
619}
620
04e21314
AH
621static int perf_evlist__mmap_per_evsel(struct perf_evlist *evlist, int idx,
622 int prot, int mask, int cpu, int thread,
623 int *output)
aece948f
ACM
624{
625 struct perf_evsel *evsel;
04e21314
AH
626
627 list_for_each_entry(evsel, &evlist->entries, node) {
628 int fd = FD(evsel, cpu, thread);
629
630 if (*output == -1) {
631 *output = fd;
632 if (__perf_evlist__mmap(evlist, idx, prot, mask,
633 *output) < 0)
634 return -1;
635 } else {
636 if (ioctl(fd, PERF_EVENT_IOC_SET_OUTPUT, *output) != 0)
637 return -1;
638 }
639
640 if ((evsel->attr.read_format & PERF_FORMAT_ID) &&
641 perf_evlist__id_add_fd(evlist, evsel, cpu, thread, fd) < 0)
642 return -1;
643 }
644
645 return 0;
646}
647
648static int perf_evlist__mmap_per_cpu(struct perf_evlist *evlist, int prot,
649 int mask)
650{
aece948f 651 int cpu, thread;
b3a319d5
NK
652 int nr_cpus = cpu_map__nr(evlist->cpus);
653 int nr_threads = thread_map__nr(evlist->threads);
aece948f 654
e3e1a54f 655 pr_debug2("perf event ring buffer mmapped per cpu\n");
b3a319d5 656 for (cpu = 0; cpu < nr_cpus; cpu++) {
aece948f
ACM
657 int output = -1;
658
b3a319d5 659 for (thread = 0; thread < nr_threads; thread++) {
04e21314
AH
660 if (perf_evlist__mmap_per_evsel(evlist, cpu, prot, mask,
661 cpu, thread, &output))
662 goto out_unmap;
aece948f
ACM
663 }
664 }
665
666 return 0;
667
668out_unmap:
93edcbd9
AH
669 for (cpu = 0; cpu < nr_cpus; cpu++)
670 __perf_evlist__munmap(evlist, cpu);
aece948f
ACM
671 return -1;
672}
673
04e21314
AH
674static int perf_evlist__mmap_per_thread(struct perf_evlist *evlist, int prot,
675 int mask)
aece948f 676{
aece948f 677 int thread;
b3a319d5 678 int nr_threads = thread_map__nr(evlist->threads);
aece948f 679
e3e1a54f 680 pr_debug2("perf event ring buffer mmapped per thread\n");
b3a319d5 681 for (thread = 0; thread < nr_threads; thread++) {
aece948f
ACM
682 int output = -1;
683
04e21314
AH
684 if (perf_evlist__mmap_per_evsel(evlist, thread, prot, mask, 0,
685 thread, &output))
686 goto out_unmap;
aece948f
ACM
687 }
688
689 return 0;
690
691out_unmap:
93edcbd9
AH
692 for (thread = 0; thread < nr_threads; thread++)
693 __perf_evlist__munmap(evlist, thread);
aece948f
ACM
694 return -1;
695}
696
994a1f78
JO
697static size_t perf_evlist__mmap_size(unsigned long pages)
698{
699 /* 512 kiB: default amount of unprivileged mlocked memory */
700 if (pages == UINT_MAX)
701 pages = (512 * 1024) / page_size;
702 else if (!is_power_of_2(pages))
703 return 0;
704
705 return (pages + 1) * page_size;
706}
707
33c2dcfd
DA
708static long parse_pages_arg(const char *str, unsigned long min,
709 unsigned long max)
994a1f78 710{
2fbe4abe 711 unsigned long pages, val;
27050f53
JO
712 static struct parse_tag tags[] = {
713 { .tag = 'B', .mult = 1 },
714 { .tag = 'K', .mult = 1 << 10 },
715 { .tag = 'M', .mult = 1 << 20 },
716 { .tag = 'G', .mult = 1 << 30 },
717 { .tag = 0 },
718 };
994a1f78 719
8973504b 720 if (str == NULL)
33c2dcfd 721 return -EINVAL;
8973504b 722
27050f53 723 val = parse_tag_value(str, tags);
2fbe4abe 724 if (val != (unsigned long) -1) {
27050f53
JO
725 /* we got file size value */
726 pages = PERF_ALIGN(val, page_size) / page_size;
27050f53
JO
727 } else {
728 /* we got pages count value */
729 char *eptr;
730 pages = strtoul(str, &eptr, 10);
33c2dcfd
DA
731 if (*eptr != '\0')
732 return -EINVAL;
994a1f78
JO
733 }
734
2bcab6c1 735 if (pages == 0 && min == 0) {
33c2dcfd
DA
736 /* leave number of pages at 0 */
737 } else if (pages < (1UL << 31) && !is_power_of_2(pages)) {
738 /* round pages up to next power of 2 */
9639837e
DA
739 pages = next_pow2(pages);
740 pr_info("rounding mmap pages size to %lu bytes (%lu pages)\n",
741 pages * page_size, pages);
2fbe4abe
AH
742 }
743
33c2dcfd
DA
744 if (pages > max)
745 return -EINVAL;
746
747 return pages;
748}
749
750int perf_evlist__parse_mmap_pages(const struct option *opt, const char *str,
751 int unset __maybe_unused)
752{
753 unsigned int *mmap_pages = opt->value;
754 unsigned long max = UINT_MAX;
755 long pages;
756
f5ae9c42 757 if (max > SIZE_MAX / page_size)
33c2dcfd
DA
758 max = SIZE_MAX / page_size;
759
760 pages = parse_pages_arg(str, 1, max);
761 if (pages < 0) {
762 pr_err("Invalid argument for --mmap_pages/-m\n");
994a1f78
JO
763 return -1;
764 }
765
766 *mmap_pages = pages;
767 return 0;
768}
769
c83fa7f2
AH
770/**
771 * perf_evlist__mmap - Create mmaps to receive events.
772 * @evlist: list of events
773 * @pages: map length in pages
774 * @overwrite: overwrite older events?
f8a95309 775 *
c83fa7f2
AH
776 * If @overwrite is %false the user needs to signal event consumption using
777 * perf_mmap__write_tail(). Using perf_evlist__mmap_read() does this
778 * automatically.
7e2ed097 779 *
c83fa7f2 780 * Return: %0 on success, negative error code otherwise.
f8a95309 781 */
50a682ce
ACM
782int perf_evlist__mmap(struct perf_evlist *evlist, unsigned int pages,
783 bool overwrite)
f8a95309 784{
aece948f 785 struct perf_evsel *evsel;
7e2ed097
ACM
786 const struct cpu_map *cpus = evlist->cpus;
787 const struct thread_map *threads = evlist->threads;
50a682ce
ACM
788 int prot = PROT_READ | (overwrite ? 0 : PROT_WRITE), mask;
789
7e2ed097 790 if (evlist->mmap == NULL && perf_evlist__alloc_mmap(evlist) < 0)
f8a95309
ACM
791 return -ENOMEM;
792
7e2ed097 793 if (evlist->pollfd == NULL && perf_evlist__alloc_pollfd(evlist) < 0)
f8a95309
ACM
794 return -ENOMEM;
795
796 evlist->overwrite = overwrite;
994a1f78 797 evlist->mmap_len = perf_evlist__mmap_size(pages);
2af68ef5 798 pr_debug("mmap size %zuB\n", evlist->mmap_len);
994a1f78 799 mask = evlist->mmap_len - page_size - 1;
f8a95309
ACM
800
801 list_for_each_entry(evsel, &evlist->entries, node) {
802 if ((evsel->attr.read_format & PERF_FORMAT_ID) &&
a91e5431 803 evsel->sample_id == NULL &&
a14bb7a6 804 perf_evsel__alloc_id(evsel, cpu_map__nr(cpus), threads->nr) < 0)
f8a95309 805 return -ENOMEM;
f8a95309
ACM
806 }
807
ec1e7e43 808 if (cpu_map__empty(cpus))
aece948f 809 return perf_evlist__mmap_per_thread(evlist, prot, mask);
f8a95309 810
aece948f 811 return perf_evlist__mmap_per_cpu(evlist, prot, mask);
f8a95309 812}
7e2ed097 813
602ad878 814int perf_evlist__create_maps(struct perf_evlist *evlist, struct target *target)
7e2ed097 815{
b809ac10
NK
816 evlist->threads = thread_map__new_str(target->pid, target->tid,
817 target->uid);
7e2ed097
ACM
818
819 if (evlist->threads == NULL)
820 return -1;
821
9c105fbc 822 if (target__uses_dummy_map(target))
d1cb9fce 823 evlist->cpus = cpu_map__dummy_new();
879d77d0
NK
824 else
825 evlist->cpus = cpu_map__new(target->cpu_list);
7e2ed097
ACM
826
827 if (evlist->cpus == NULL)
828 goto out_delete_threads;
829
830 return 0;
831
832out_delete_threads:
833 thread_map__delete(evlist->threads);
834 return -1;
835}
836
837void perf_evlist__delete_maps(struct perf_evlist *evlist)
838{
839 cpu_map__delete(evlist->cpus);
840 thread_map__delete(evlist->threads);
841 evlist->cpus = NULL;
842 evlist->threads = NULL;
843}
0a102479 844
1491a632 845int perf_evlist__apply_filters(struct perf_evlist *evlist)
0a102479 846{
0a102479 847 struct perf_evsel *evsel;
745cefc5
ACM
848 int err = 0;
849 const int ncpus = cpu_map__nr(evlist->cpus),
b3a319d5 850 nthreads = thread_map__nr(evlist->threads);
0a102479
FW
851
852 list_for_each_entry(evsel, &evlist->entries, node) {
745cefc5 853 if (evsel->filter == NULL)
0a102479 854 continue;
745cefc5
ACM
855
856 err = perf_evsel__set_filter(evsel, ncpus, nthreads, evsel->filter);
857 if (err)
858 break;
0a102479
FW
859 }
860
745cefc5
ACM
861 return err;
862}
863
864int perf_evlist__set_filter(struct perf_evlist *evlist, const char *filter)
865{
866 struct perf_evsel *evsel;
867 int err = 0;
868 const int ncpus = cpu_map__nr(evlist->cpus),
b3a319d5 869 nthreads = thread_map__nr(evlist->threads);
745cefc5
ACM
870
871 list_for_each_entry(evsel, &evlist->entries, node) {
872 err = perf_evsel__set_filter(evsel, ncpus, nthreads, filter);
873 if (err)
874 break;
875 }
876
877 return err;
0a102479 878}
74429964 879
0c21f736 880bool perf_evlist__valid_sample_type(struct perf_evlist *evlist)
74429964 881{
75562573 882 struct perf_evsel *pos;
c2a70653 883
75562573
AH
884 if (evlist->nr_entries == 1)
885 return true;
886
887 if (evlist->id_pos < 0 || evlist->is_pos < 0)
888 return false;
889
890 list_for_each_entry(pos, &evlist->entries, node) {
891 if (pos->id_pos != evlist->id_pos ||
892 pos->is_pos != evlist->is_pos)
c2a70653 893 return false;
74429964
FW
894 }
895
c2a70653 896 return true;
74429964
FW
897}
898
75562573 899u64 __perf_evlist__combined_sample_type(struct perf_evlist *evlist)
c2a70653 900{
75562573
AH
901 struct perf_evsel *evsel;
902
903 if (evlist->combined_sample_type)
904 return evlist->combined_sample_type;
905
906 list_for_each_entry(evsel, &evlist->entries, node)
907 evlist->combined_sample_type |= evsel->attr.sample_type;
908
909 return evlist->combined_sample_type;
910}
911
912u64 perf_evlist__combined_sample_type(struct perf_evlist *evlist)
913{
914 evlist->combined_sample_type = 0;
915 return __perf_evlist__combined_sample_type(evlist);
c2a70653
ACM
916}
917
9ede473c
JO
918bool perf_evlist__valid_read_format(struct perf_evlist *evlist)
919{
920 struct perf_evsel *first = perf_evlist__first(evlist), *pos = first;
921 u64 read_format = first->attr.read_format;
922 u64 sample_type = first->attr.sample_type;
923
924 list_for_each_entry_continue(pos, &evlist->entries, node) {
925 if (read_format != pos->attr.read_format)
926 return false;
927 }
928
929 /* PERF_SAMPLE_READ imples PERF_FORMAT_ID. */
930 if ((sample_type & PERF_SAMPLE_READ) &&
931 !(read_format & PERF_FORMAT_ID)) {
932 return false;
933 }
934
935 return true;
936}
937
938u64 perf_evlist__read_format(struct perf_evlist *evlist)
939{
940 struct perf_evsel *first = perf_evlist__first(evlist);
941 return first->attr.read_format;
942}
943
0c21f736 944u16 perf_evlist__id_hdr_size(struct perf_evlist *evlist)
81e36bff 945{
0c21f736 946 struct perf_evsel *first = perf_evlist__first(evlist);
81e36bff
ACM
947 struct perf_sample *data;
948 u64 sample_type;
949 u16 size = 0;
950
81e36bff
ACM
951 if (!first->attr.sample_id_all)
952 goto out;
953
954 sample_type = first->attr.sample_type;
955
956 if (sample_type & PERF_SAMPLE_TID)
957 size += sizeof(data->tid) * 2;
958
959 if (sample_type & PERF_SAMPLE_TIME)
960 size += sizeof(data->time);
961
962 if (sample_type & PERF_SAMPLE_ID)
963 size += sizeof(data->id);
964
965 if (sample_type & PERF_SAMPLE_STREAM_ID)
966 size += sizeof(data->stream_id);
967
968 if (sample_type & PERF_SAMPLE_CPU)
969 size += sizeof(data->cpu) * 2;
75562573
AH
970
971 if (sample_type & PERF_SAMPLE_IDENTIFIER)
972 size += sizeof(data->id);
81e36bff
ACM
973out:
974 return size;
975}
976
0c21f736 977bool perf_evlist__valid_sample_id_all(struct perf_evlist *evlist)
74429964 978{
0c21f736 979 struct perf_evsel *first = perf_evlist__first(evlist), *pos = first;
c2a70653
ACM
980
981 list_for_each_entry_continue(pos, &evlist->entries, node) {
982 if (first->attr.sample_id_all != pos->attr.sample_id_all)
983 return false;
74429964
FW
984 }
985
c2a70653
ACM
986 return true;
987}
988
0c21f736 989bool perf_evlist__sample_id_all(struct perf_evlist *evlist)
c2a70653 990{
0c21f736 991 struct perf_evsel *first = perf_evlist__first(evlist);
c2a70653 992 return first->attr.sample_id_all;
74429964 993}
81cce8de
ACM
994
995void perf_evlist__set_selected(struct perf_evlist *evlist,
996 struct perf_evsel *evsel)
997{
998 evlist->selected = evsel;
999}
727ab04e 1000
a74b4b66
NK
1001void perf_evlist__close(struct perf_evlist *evlist)
1002{
1003 struct perf_evsel *evsel;
1004 int ncpus = cpu_map__nr(evlist->cpus);
1005 int nthreads = thread_map__nr(evlist->threads);
1006
1007 list_for_each_entry_reverse(evsel, &evlist->entries, node)
1008 perf_evsel__close(evsel, ncpus, nthreads);
1009}
1010
6a4bb04c 1011int perf_evlist__open(struct perf_evlist *evlist)
727ab04e 1012{
6a4bb04c 1013 struct perf_evsel *evsel;
a74b4b66 1014 int err;
727ab04e 1015
733cd2fe
AH
1016 perf_evlist__update_id_pos(evlist);
1017
727ab04e 1018 list_for_each_entry(evsel, &evlist->entries, node) {
6a4bb04c 1019 err = perf_evsel__open(evsel, evlist->cpus, evlist->threads);
727ab04e
ACM
1020 if (err < 0)
1021 goto out_err;
1022 }
1023
1024 return 0;
1025out_err:
a74b4b66 1026 perf_evlist__close(evlist);
41c21a68 1027 errno = -err;
727ab04e
ACM
1028 return err;
1029}
35b9d88e 1030
602ad878 1031int perf_evlist__prepare_workload(struct perf_evlist *evlist, struct target *target,
55e162ea
NK
1032 const char *argv[], bool pipe_output,
1033 bool want_signal)
35b9d88e
ACM
1034{
1035 int child_ready_pipe[2], go_pipe[2];
1036 char bf;
1037
1038 if (pipe(child_ready_pipe) < 0) {
1039 perror("failed to create 'ready' pipe");
1040 return -1;
1041 }
1042
1043 if (pipe(go_pipe) < 0) {
1044 perror("failed to create 'go' pipe");
1045 goto out_close_ready_pipe;
1046 }
1047
1048 evlist->workload.pid = fork();
1049 if (evlist->workload.pid < 0) {
1050 perror("failed to fork");
1051 goto out_close_pipes;
1052 }
1053
1054 if (!evlist->workload.pid) {
119fa3c9 1055 if (pipe_output)
35b9d88e
ACM
1056 dup2(2, 1);
1057
0817df08
DA
1058 signal(SIGTERM, SIG_DFL);
1059
35b9d88e
ACM
1060 close(child_ready_pipe[0]);
1061 close(go_pipe[1]);
1062 fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC);
1063
35b9d88e
ACM
1064 /*
1065 * Tell the parent we're ready to go
1066 */
1067 close(child_ready_pipe[1]);
1068
1069 /*
1070 * Wait until the parent tells us to go.
1071 */
1072 if (read(go_pipe[0], &bf, 1) == -1)
1073 perror("unable to read pipe");
1074
1075 execvp(argv[0], (char **)argv);
1076
1077 perror(argv[0]);
55e162ea
NK
1078 if (want_signal)
1079 kill(getppid(), SIGUSR1);
35b9d88e
ACM
1080 exit(-1);
1081 }
1082
602ad878 1083 if (target__none(target))
35b9d88e
ACM
1084 evlist->threads->map[0] = evlist->workload.pid;
1085
1086 close(child_ready_pipe[1]);
1087 close(go_pipe[0]);
1088 /*
1089 * wait for child to settle
1090 */
1091 if (read(child_ready_pipe[0], &bf, 1) == -1) {
1092 perror("unable to read pipe");
1093 goto out_close_pipes;
1094 }
1095
bcf3145f 1096 fcntl(go_pipe[1], F_SETFD, FD_CLOEXEC);
35b9d88e
ACM
1097 evlist->workload.cork_fd = go_pipe[1];
1098 close(child_ready_pipe[0]);
1099 return 0;
1100
1101out_close_pipes:
1102 close(go_pipe[0]);
1103 close(go_pipe[1]);
1104out_close_ready_pipe:
1105 close(child_ready_pipe[0]);
1106 close(child_ready_pipe[1]);
1107 return -1;
1108}
1109
1110int perf_evlist__start_workload(struct perf_evlist *evlist)
1111{
1112 if (evlist->workload.cork_fd > 0) {
b3824404 1113 char bf = 0;
bcf3145f 1114 int ret;
35b9d88e
ACM
1115 /*
1116 * Remove the cork, let it rip!
1117 */
bcf3145f
NK
1118 ret = write(evlist->workload.cork_fd, &bf, 1);
1119 if (ret < 0)
1120 perror("enable to write to pipe");
1121
1122 close(evlist->workload.cork_fd);
1123 return ret;
35b9d88e
ACM
1124 }
1125
1126 return 0;
1127}
cb0b29e0 1128
/*
 * Parse @event into @sample using the event of the evlist it belongs
 * to. Returns -EFAULT when no matching event is found, otherwise the
 * result of perf_evsel__parse_sample().
 */
int perf_evlist__parse_sample(struct perf_evlist *evlist, union perf_event *event,
			      struct perf_sample *sample)
{
	struct perf_evsel *owner = perf_evlist__event2evsel(evlist, event);

	if (owner == NULL)
		return -EFAULT;

	return perf_evsel__parse_sample(owner, event, sample);
}
78f067b3
ACM
1138
1139size_t perf_evlist__fprintf(struct perf_evlist *evlist, FILE *fp)
1140{
1141 struct perf_evsel *evsel;
1142 size_t printed = 0;
1143
1144 list_for_each_entry(evsel, &evlist->entries, node) {
1145 printed += fprintf(fp, "%s%s", evsel->idx ? ", " : "",
1146 perf_evsel__name(evsel));
1147 }
1148
b2222139 1149 return printed + fprintf(fp, "\n");
78f067b3 1150}
6ef068cb
ACM
1151
1152int perf_evlist__strerror_tp(struct perf_evlist *evlist __maybe_unused,
1153 int err, char *buf, size_t size)
1154{
1155 char sbuf[128];
1156
1157 switch (err) {
1158 case ENOENT:
1159 scnprintf(buf, size, "%s",
1160 "Error:\tUnable to find debugfs\n"
1161 "Hint:\tWas your kernel was compiled with debugfs support?\n"
1162 "Hint:\tIs the debugfs filesystem mounted?\n"
1163 "Hint:\tTry 'sudo mount -t debugfs nodev /sys/kernel/debug'");
1164 break;
1165 case EACCES:
1166 scnprintf(buf, size,
1167 "Error:\tNo permissions to read %s/tracing/events/raw_syscalls\n"
1168 "Hint:\tTry 'sudo mount -o remount,mode=755 %s'\n",
1169 debugfs_mountpoint, debugfs_mountpoint);
1170 break;
1171 default:
1172 scnprintf(buf, size, "%s", strerror_r(err, sbuf, sizeof(sbuf)));
1173 break;
1174 }
1175
1176 return 0;
1177}
a8f23d8f
ACM
1178
1179int perf_evlist__strerror_open(struct perf_evlist *evlist __maybe_unused,
1180 int err, char *buf, size_t size)
1181{
1182 int printed, value;
1183 char sbuf[128], *emsg = strerror_r(err, sbuf, sizeof(sbuf));
1184
1185 switch (err) {
1186 case EACCES:
1187 case EPERM:
1188 printed = scnprintf(buf, size,
1189 "Error:\t%s.\n"
1190 "Hint:\tCheck /proc/sys/kernel/perf_event_paranoid setting.", emsg);
1191
1192 if (filename__read_int("/proc/sys/kernel/perf_event_paranoid", &value))
1193 break;
1194
1195 printed += scnprintf(buf + printed, size - printed, "\nHint:\t");
1196
1197 if (value >= 2) {
1198 printed += scnprintf(buf + printed, size - printed,
1199 "For your workloads it needs to be <= 1\nHint:\t");
1200 }
1201 printed += scnprintf(buf + printed, size - printed,
1202 "For system wide tracing it needs to be set to -1");
1203
1204 printed += scnprintf(buf + printed, size - printed,
1205 ".\nHint:\tThe current value is %d.", value);
1206 break;
1207 default:
1208 scnprintf(buf, size, "%s", emsg);
1209 break;
1210 }
1211
1212 return 0;
1213}