/*
 * Copyright (C) 2011, Red Hat Inc, Arnaldo Carvalho de Melo <acme@redhat.com>
 *
 * Parts came from builtin-{top,stat,record}.c, see those files for further
 * copyright notes.
 *
 * Released under the GPL v2. (and only v2, not any later version)
 */
#include "util.h"
#include <api/fs/fs.h>
#include <poll.h>
#include "cpumap.h"
#include "thread_map.h"
#include "target.h"
#include "evlist.h"
#include "evsel.h"
#include "debug.h"
#include <unistd.h>

#include "parse-events.h"
#include "parse-options.h"

#include <sys/mman.h>

#include <linux/bitops.h>
#include <linux/hash.h>
#include <linux/log2.h>
#include <linux/err.h>

static void perf_evlist__mmap_put(struct perf_evlist *evlist, int idx);
static void __perf_evlist__munmap(struct perf_evlist *evlist, int idx);

#define FD(e, x, y) (*(int *)xyarray__entry(e->fd, x, y))
#define SID(e, x, y) xyarray__entry(e->sample_id, x, y)

void perf_evlist__init(struct perf_evlist *evlist, struct cpu_map *cpus,
		       struct thread_map *threads)
{
	int i;

	for (i = 0; i < PERF_EVLIST__HLIST_SIZE; ++i)
		INIT_HLIST_HEAD(&evlist->heads[i]);
	INIT_LIST_HEAD(&evlist->entries);
	perf_evlist__set_maps(evlist, cpus, threads);
	fdarray__init(&evlist->pollfd, 64);
	evlist->workload.pid = -1;
}

struct perf_evlist *perf_evlist__new(void)
{
	struct perf_evlist *evlist = zalloc(sizeof(*evlist));

	if (evlist != NULL)
		perf_evlist__init(evlist, NULL, NULL);

	return evlist;
}

struct perf_evlist *perf_evlist__new_default(void)
{
	struct perf_evlist *evlist = perf_evlist__new();

	if (evlist && perf_evlist__add_default(evlist)) {
		perf_evlist__delete(evlist);
		evlist = NULL;
	}

	return evlist;
}

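/*
 * Usage sketch (illustrative, not upstream code): the typical lifecycle of
 * a default "cycles" evlist:
 *
 *	struct perf_evlist *evlist = perf_evlist__new_default();
 *
 *	if (evlist == NULL)
 *		return -ENOMEM;
 *	(open, mmap and consume events, then:)
 *	perf_evlist__delete(evlist);
 */
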
/**
 * perf_evlist__set_id_pos - set the positions of event ids.
 * @evlist: selected event list
 *
 * Events with compatible sample types all have the same id_pos
 * and is_pos.  For convenience, put a copy on evlist.
 */
void perf_evlist__set_id_pos(struct perf_evlist *evlist)
{
	struct perf_evsel *first = perf_evlist__first(evlist);

	evlist->id_pos = first->id_pos;
	evlist->is_pos = first->is_pos;
}

static void perf_evlist__update_id_pos(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel;

	evlist__for_each(evlist, evsel)
		perf_evsel__calc_id_pos(evsel);

	perf_evlist__set_id_pos(evlist);
}

static void perf_evlist__purge(struct perf_evlist *evlist)
{
	struct perf_evsel *pos, *n;

	evlist__for_each_safe(evlist, n, pos) {
		list_del_init(&pos->node);
		pos->evlist = NULL;
		perf_evsel__delete(pos);
	}

	evlist->nr_entries = 0;
}

void perf_evlist__exit(struct perf_evlist *evlist)
{
	zfree(&evlist->mmap);
	fdarray__exit(&evlist->pollfd);
}

void perf_evlist__delete(struct perf_evlist *evlist)
{
	perf_evlist__munmap(evlist);
	perf_evlist__close(evlist);
	cpu_map__put(evlist->cpus);
	thread_map__put(evlist->threads);
	evlist->cpus = NULL;
	evlist->threads = NULL;
	perf_evlist__purge(evlist);
	perf_evlist__exit(evlist);
	free(evlist);
}

static void __perf_evlist__propagate_maps(struct perf_evlist *evlist,
					  struct perf_evsel *evsel)
{
	/*
	 * We already have cpus for evsel (via PMU sysfs) so
	 * keep it, if there's no target cpu list defined.
	 */
	if (!evsel->own_cpus || evlist->has_user_cpus) {
		cpu_map__put(evsel->cpus);
		evsel->cpus = cpu_map__get(evlist->cpus);
	} else if (evsel->cpus != evsel->own_cpus) {
		cpu_map__put(evsel->cpus);
		evsel->cpus = cpu_map__get(evsel->own_cpus);
	}

	thread_map__put(evsel->threads);
	evsel->threads = thread_map__get(evlist->threads);
}

static void perf_evlist__propagate_maps(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel;

	evlist__for_each(evlist, evsel)
		__perf_evlist__propagate_maps(evlist, evsel);
}

void perf_evlist__add(struct perf_evlist *evlist, struct perf_evsel *entry)
{
	entry->evlist = evlist;
	list_add_tail(&entry->node, &evlist->entries);
	entry->idx = evlist->nr_entries;
	entry->tracking = !entry->idx;

	if (!evlist->nr_entries++)
		perf_evlist__set_id_pos(evlist);

	__perf_evlist__propagate_maps(evlist, entry);
}

void perf_evlist__remove(struct perf_evlist *evlist, struct perf_evsel *evsel)
{
	evsel->evlist = NULL;
	list_del_init(&evsel->node);
	evlist->nr_entries -= 1;
}

void perf_evlist__splice_list_tail(struct perf_evlist *evlist,
				   struct list_head *list)
{
	struct perf_evsel *evsel, *temp;

	__evlist__for_each_safe(list, temp, evsel) {
		list_del_init(&evsel->node);
		perf_evlist__add(evlist, evsel);
	}
}

void __perf_evlist__set_leader(struct list_head *list)
{
	struct perf_evsel *evsel, *leader;

	leader = list_entry(list->next, struct perf_evsel, node);
	evsel = list_entry(list->prev, struct perf_evsel, node);

	leader->nr_members = evsel->idx - leader->idx + 1;

	__evlist__for_each(list, evsel) {
		evsel->leader = leader;
	}
}

void perf_evlist__set_leader(struct perf_evlist *evlist)
{
	if (evlist->nr_entries) {
		evlist->nr_groups = evlist->nr_entries > 1 ? 1 : 0;
		__perf_evlist__set_leader(&evlist->entries);
	}
}

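/*
 * Probe for the deepest precise_ip the running kernel and hardware will
 * accept: start at 3 (the ":ppp" modifier) and back off until
 * sys_perf_event_open() stops failing.
 */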
void perf_event_attr__set_max_precise_ip(struct perf_event_attr *attr)
{
	attr->precise_ip = 3;

	while (attr->precise_ip != 0) {
		int fd = sys_perf_event_open(attr, 0, -1, -1, 0);
		if (fd != -1) {
			close(fd);
			break;
		}
		--attr->precise_ip;
	}
}

int perf_evlist__add_default(struct perf_evlist *evlist)
{
	struct perf_event_attr attr = {
		.type	= PERF_TYPE_HARDWARE,
		.config = PERF_COUNT_HW_CPU_CYCLES,
	};
	struct perf_evsel *evsel;

	event_attr_init(&attr);

	perf_event_attr__set_max_precise_ip(&attr);

	evsel = perf_evsel__new(&attr);
	if (evsel == NULL)
		goto error;

	/* use asprintf() because free(evsel) assumes name is allocated */
	if (asprintf(&evsel->name, "cycles%.*s",
		     attr.precise_ip ? attr.precise_ip + 1 : 0, ":ppp") < 0)
		goto error_free;

	perf_evlist__add(evlist, evsel);
	return 0;
error_free:
	perf_evsel__delete(evsel);
error:
	return -ENOMEM;
}

static int perf_evlist__add_attrs(struct perf_evlist *evlist,
				  struct perf_event_attr *attrs, size_t nr_attrs)
{
	struct perf_evsel *evsel, *n;
	LIST_HEAD(head);
	size_t i;

	for (i = 0; i < nr_attrs; i++) {
		evsel = perf_evsel__new_idx(attrs + i, evlist->nr_entries + i);
		if (evsel == NULL)
			goto out_delete_partial_list;
		list_add_tail(&evsel->node, &head);
	}

	perf_evlist__splice_list_tail(evlist, &head);

	return 0;

out_delete_partial_list:
	__evlist__for_each_safe(&head, n, evsel)
		perf_evsel__delete(evsel);
	return -1;
}

int __perf_evlist__add_default_attrs(struct perf_evlist *evlist,
				     struct perf_event_attr *attrs, size_t nr_attrs)
{
	size_t i;

	for (i = 0; i < nr_attrs; i++)
		event_attr_init(attrs + i);

	return perf_evlist__add_attrs(evlist, attrs, nr_attrs);
}

struct perf_evsel *
perf_evlist__find_tracepoint_by_id(struct perf_evlist *evlist, int id)
{
	struct perf_evsel *evsel;

	evlist__for_each(evlist, evsel) {
		if (evsel->attr.type == PERF_TYPE_TRACEPOINT &&
		    (int)evsel->attr.config == id)
			return evsel;
	}

	return NULL;
}

struct perf_evsel *
perf_evlist__find_tracepoint_by_name(struct perf_evlist *evlist,
				     const char *name)
{
	struct perf_evsel *evsel;

	evlist__for_each(evlist, evsel) {
		if ((evsel->attr.type == PERF_TYPE_TRACEPOINT) &&
		    (strcmp(evsel->name, name) == 0))
			return evsel;
	}

	return NULL;
}

int perf_evlist__add_newtp(struct perf_evlist *evlist,
			   const char *sys, const char *name, void *handler)
{
	struct perf_evsel *evsel = perf_evsel__newtp(sys, name);

	if (IS_ERR(evsel))
		return -1;

	evsel->handler = handler;
	perf_evlist__add(evlist, evsel);
	return 0;
}

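/*
 * Usage sketch (illustrative; "process_sched_switch" is a made-up handler
 * name):
 *
 *	if (perf_evlist__add_newtp(evlist, "sched", "sched_switch",
 *				   process_sched_switch) < 0)
 *		return -1;
 */
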
static int perf_evlist__nr_threads(struct perf_evlist *evlist,
				   struct perf_evsel *evsel)
{
	if (evsel->system_wide)
		return 1;
	else
		return thread_map__nr(evlist->threads);
}

void perf_evlist__disable(struct perf_evlist *evlist)
{
	struct perf_evsel *pos;

	evlist__for_each(evlist, pos) {
		if (!perf_evsel__is_group_leader(pos) || !pos->fd)
			continue;
		perf_evsel__disable(pos);
	}

	evlist->enabled = false;
}

void perf_evlist__enable(struct perf_evlist *evlist)
{
	struct perf_evsel *pos;

	evlist__for_each(evlist, pos) {
		if (!perf_evsel__is_group_leader(pos) || !pos->fd)
			continue;
		perf_evsel__enable(pos);
	}

	evlist->enabled = true;
}

void perf_evlist__toggle_enable(struct perf_evlist *evlist)
{
	(evlist->enabled ? perf_evlist__disable : perf_evlist__enable)(evlist);
}

int perf_evlist__disable_event(struct perf_evlist *evlist,
			       struct perf_evsel *evsel)
{
	int cpu, thread, err;
	int nr_cpus = cpu_map__nr(evlist->cpus);
	int nr_threads = perf_evlist__nr_threads(evlist, evsel);

	if (!evsel->fd)
		return 0;

	for (cpu = 0; cpu < nr_cpus; cpu++) {
		for (thread = 0; thread < nr_threads; thread++) {
			err = ioctl(FD(evsel, cpu, thread),
				    PERF_EVENT_IOC_DISABLE, 0);
			if (err)
				return err;
		}
	}
	return 0;
}

int perf_evlist__enable_event(struct perf_evlist *evlist,
			      struct perf_evsel *evsel)
{
	int cpu, thread, err;
	int nr_cpus = cpu_map__nr(evlist->cpus);
	int nr_threads = perf_evlist__nr_threads(evlist, evsel);

	if (!evsel->fd)
		return -EINVAL;

	for (cpu = 0; cpu < nr_cpus; cpu++) {
		for (thread = 0; thread < nr_threads; thread++) {
			err = ioctl(FD(evsel, cpu, thread),
				    PERF_EVENT_IOC_ENABLE, 0);
			if (err)
				return err;
		}
	}
	return 0;
}

static int perf_evlist__enable_event_cpu(struct perf_evlist *evlist,
					 struct perf_evsel *evsel, int cpu)
{
	int thread, err;
	int nr_threads = perf_evlist__nr_threads(evlist, evsel);

	if (!evsel->fd)
		return -EINVAL;

	for (thread = 0; thread < nr_threads; thread++) {
		err = ioctl(FD(evsel, cpu, thread),
			    PERF_EVENT_IOC_ENABLE, 0);
		if (err)
			return err;
	}
	return 0;
}

static int perf_evlist__enable_event_thread(struct perf_evlist *evlist,
					    struct perf_evsel *evsel,
					    int thread)
{
	int cpu, err;
	int nr_cpus = cpu_map__nr(evlist->cpus);

	if (!evsel->fd)
		return -EINVAL;

	for (cpu = 0; cpu < nr_cpus; cpu++) {
		err = ioctl(FD(evsel, cpu, thread), PERF_EVENT_IOC_ENABLE, 0);
		if (err)
			return err;
	}
	return 0;
}

int perf_evlist__enable_event_idx(struct perf_evlist *evlist,
				  struct perf_evsel *evsel, int idx)
{
	bool per_cpu_mmaps = !cpu_map__empty(evlist->cpus);

	if (per_cpu_mmaps)
		return perf_evlist__enable_event_cpu(evlist, evsel, idx);
	else
		return perf_evlist__enable_event_thread(evlist, evsel, idx);
}

int perf_evlist__alloc_pollfd(struct perf_evlist *evlist)
{
	int nr_cpus = cpu_map__nr(evlist->cpus);
	int nr_threads = thread_map__nr(evlist->threads);
	int nfds = 0;
	struct perf_evsel *evsel;

	evlist__for_each(evlist, evsel) {
		if (evsel->system_wide)
			nfds += nr_cpus;
		else
			nfds += nr_cpus * nr_threads;
	}

	if (fdarray__available_entries(&evlist->pollfd) < nfds &&
	    fdarray__grow(&evlist->pollfd, nfds) < 0)
		return -ENOMEM;

	return 0;
}

static int __perf_evlist__add_pollfd(struct perf_evlist *evlist, int fd, int idx)
{
	int pos = fdarray__add(&evlist->pollfd, fd, POLLIN | POLLERR | POLLHUP);
	/*
	 * Save the idx so that when we filter out fds POLLHUP'ed we can
	 * close the associated evlist->mmap[] entry.
	 */
	if (pos >= 0) {
		evlist->pollfd.priv[pos].idx = idx;

		fcntl(fd, F_SETFL, O_NONBLOCK);
	}

	return pos;
}

int perf_evlist__add_pollfd(struct perf_evlist *evlist, int fd)
{
	return __perf_evlist__add_pollfd(evlist, fd, -1);
}

static void perf_evlist__munmap_filtered(struct fdarray *fda, int fd)
{
	struct perf_evlist *evlist = container_of(fda, struct perf_evlist, pollfd);

	perf_evlist__mmap_put(evlist, fda->priv[fd].idx);
}

int perf_evlist__filter_pollfd(struct perf_evlist *evlist, short revents_and_mask)
{
	return fdarray__filter(&evlist->pollfd, revents_and_mask,
			       perf_evlist__munmap_filtered);
}

int perf_evlist__poll(struct perf_evlist *evlist, int timeout)
{
	return fdarray__poll(&evlist->pollfd, timeout);
}

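/*
 * Usage sketch (illustrative): a tool's event loop typically blocks in
 * perf_evlist__poll() and, when woken, prunes fds whose maps went away:
 *
 *	if (perf_evlist__poll(evlist, timeout) <= 0)
 *		continue;
 *
 * and stops once perf_evlist__filter_pollfd(evlist, POLLERR | POLLHUP)
 * returns 0, i.e. when every mmap'ed fd has hung up.
 */
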
static void perf_evlist__id_hash(struct perf_evlist *evlist,
				 struct perf_evsel *evsel,
				 int cpu, int thread, u64 id)
{
	int hash;
	struct perf_sample_id *sid = SID(evsel, cpu, thread);

	sid->id = id;
	sid->evsel = evsel;
	hash = hash_64(sid->id, PERF_EVLIST__HLIST_BITS);
	hlist_add_head(&sid->node, &evlist->heads[hash]);
}

void perf_evlist__id_add(struct perf_evlist *evlist, struct perf_evsel *evsel,
			 int cpu, int thread, u64 id)
{
	perf_evlist__id_hash(evlist, evsel, cpu, thread, id);
	evsel->id[evsel->ids++] = id;
}

static int perf_evlist__id_add_fd(struct perf_evlist *evlist,
				  struct perf_evsel *evsel,
				  int cpu, int thread, int fd)
{
	u64 read_data[4] = { 0, };
	int id_idx = 1; /* The first entry is the counter value */
	u64 id;
	int ret;

	ret = ioctl(fd, PERF_EVENT_IOC_ID, &id);
	if (!ret)
		goto add;

	if (errno != ENOTTY)
		return -1;

	/* Legacy way to get the event id... All hail to old kernels! */

	/*
	 * This way does not work with group format read, so bail
	 * out in that case.
	 */
	if (perf_evlist__read_format(evlist) & PERF_FORMAT_GROUP)
		return -1;

	if (!(evsel->attr.read_format & PERF_FORMAT_ID) ||
	    read(fd, &read_data, sizeof(read_data)) == -1)
		return -1;

	if (evsel->attr.read_format & PERF_FORMAT_TOTAL_TIME_ENABLED)
		++id_idx;
	if (evsel->attr.read_format & PERF_FORMAT_TOTAL_TIME_RUNNING)
		++id_idx;

	id = read_data[id_idx];

add:
	perf_evlist__id_add(evlist, evsel, cpu, thread, id);
	return 0;
}

static void perf_evlist__set_sid_idx(struct perf_evlist *evlist,
				     struct perf_evsel *evsel, int idx, int cpu,
				     int thread)
{
	struct perf_sample_id *sid = SID(evsel, cpu, thread);
	sid->idx = idx;
	if (evlist->cpus && cpu >= 0)
		sid->cpu = evlist->cpus->map[cpu];
	else
		sid->cpu = -1;
	if (!evsel->system_wide && evlist->threads && thread >= 0)
		sid->tid = thread_map__pid(evlist->threads, thread);
	else
		sid->tid = -1;
}

struct perf_sample_id *perf_evlist__id2sid(struct perf_evlist *evlist, u64 id)
{
	struct hlist_head *head;
	struct perf_sample_id *sid;
	int hash;

	hash = hash_64(id, PERF_EVLIST__HLIST_BITS);
	head = &evlist->heads[hash];

	hlist_for_each_entry(sid, head, node)
		if (sid->id == id)
			return sid;

	return NULL;
}

struct perf_evsel *perf_evlist__id2evsel(struct perf_evlist *evlist, u64 id)
{
	struct perf_sample_id *sid;

	if (evlist->nr_entries == 1 || !id)
		return perf_evlist__first(evlist);

	sid = perf_evlist__id2sid(evlist, id);
	if (sid)
		return sid->evsel;

	if (!perf_evlist__sample_id_all(evlist))
		return perf_evlist__first(evlist);

	return NULL;
}

struct perf_evsel *perf_evlist__id2evsel_strict(struct perf_evlist *evlist,
						u64 id)
{
	struct perf_sample_id *sid;

	if (!id)
		return NULL;

	sid = perf_evlist__id2sid(evlist, id);
	if (sid)
		return sid->evsel;

	return NULL;
}

static int perf_evlist__event2id(struct perf_evlist *evlist,
				 union perf_event *event, u64 *id)
{
	const u64 *array = event->sample.array;
	ssize_t n;

	n = (event->header.size - sizeof(event->header)) >> 3;

	if (event->header.type == PERF_RECORD_SAMPLE) {
		if (evlist->id_pos >= n)
			return -1;
		*id = array[evlist->id_pos];
	} else {
		if (evlist->is_pos > n)
			return -1;
		n -= evlist->is_pos;
		*id = array[n];
	}
	return 0;
}

static struct perf_evsel *perf_evlist__event2evsel(struct perf_evlist *evlist,
						   union perf_event *event)
{
	struct perf_evsel *first = perf_evlist__first(evlist);
	struct hlist_head *head;
	struct perf_sample_id *sid;
	int hash;
	u64 id;

	if (evlist->nr_entries == 1)
		return first;

	if (!first->attr.sample_id_all &&
	    event->header.type != PERF_RECORD_SAMPLE)
		return first;

	if (perf_evlist__event2id(evlist, event, &id))
		return NULL;

	/* Synthesized events have an id of zero */
	if (!id)
		return first;

	hash = hash_64(id, PERF_EVLIST__HLIST_BITS);
	head = &evlist->heads[hash];

	hlist_for_each_entry(sid, head, node) {
		if (sid->id == id)
			return sid->evsel;
	}
	return NULL;
}

union perf_event *perf_evlist__mmap_read(struct perf_evlist *evlist, int idx)
{
	struct perf_mmap *md = &evlist->mmap[idx];
	u64 head;
	u64 old = md->prev;
	unsigned char *data = md->base + page_size;
	union perf_event *event = NULL;

	/*
	 * Check if event was unmapped due to a POLLHUP/POLLERR.
	 */
	if (!atomic_read(&md->refcnt))
		return NULL;

	head = perf_mmap__read_head(md);
	if (evlist->overwrite) {
		/*
		 * If we're further behind than half the buffer, there's a chance
		 * the writer will bite our tail and mess up the samples under us.
		 *
		 * If we somehow ended up ahead of the head, we got messed up.
		 *
		 * In either case, truncate and restart at head.
		 */
		int diff = head - old;
		if (diff > md->mask / 2 || diff < 0) {
			fprintf(stderr, "WARNING: failed to keep up with mmap data.\n");

			/*
			 * head points to a known good entry, start there.
			 */
			old = head;
		}
	}

	if (old != head) {
		size_t size;

		event = (union perf_event *)&data[old & md->mask];
		size = event->header.size;

		/*
		 * Event straddles the mmap boundary -- header should always
		 * be inside due to u64 alignment of output.
		 */
		if ((old & md->mask) + size != ((old + size) & md->mask)) {
			unsigned int offset = old;
			unsigned int len = min(sizeof(*event), size), cpy;
			void *dst = md->event_copy;

			do {
				cpy = min(md->mask + 1 - (offset & md->mask), len);
				memcpy(dst, &data[offset & md->mask], cpy);
				offset += cpy;
				dst += cpy;
				len -= cpy;
			} while (len);

			event = (union perf_event *) md->event_copy;
		}

		old += size;
	}

	md->prev = old;

	return event;
}

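/*
 * Usage sketch (illustrative): draining one ring buffer.
 * perf_evlist__mmap_consume() advances the tail pointer in non-overwrite
 * mode and drops the reference that keeps a POLLHUP'ed map alive:
 *
 *	union perf_event *event;
 *
 *	while ((event = perf_evlist__mmap_read(evlist, idx)) != NULL) {
 *		(process the event, then:)
 *		perf_evlist__mmap_consume(evlist, idx);
 *	}
 */
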
static bool perf_mmap__empty(struct perf_mmap *md)
{
	return perf_mmap__read_head(md) == md->prev && !md->auxtrace_mmap.base;
}

static void perf_evlist__mmap_get(struct perf_evlist *evlist, int idx)
{
	atomic_inc(&evlist->mmap[idx].refcnt);
}

static void perf_evlist__mmap_put(struct perf_evlist *evlist, int idx)
{
	BUG_ON(atomic_read(&evlist->mmap[idx].refcnt) == 0);

	if (atomic_dec_and_test(&evlist->mmap[idx].refcnt))
		__perf_evlist__munmap(evlist, idx);
}

void perf_evlist__mmap_consume(struct perf_evlist *evlist, int idx)
{
	struct perf_mmap *md = &evlist->mmap[idx];

	if (!evlist->overwrite) {
		u64 old = md->prev;

		perf_mmap__write_tail(md, old);
	}

	if (atomic_read(&md->refcnt) == 1 && perf_mmap__empty(md))
		perf_evlist__mmap_put(evlist, idx);
}

int __weak auxtrace_mmap__mmap(struct auxtrace_mmap *mm __maybe_unused,
			       struct auxtrace_mmap_params *mp __maybe_unused,
			       void *userpg __maybe_unused,
			       int fd __maybe_unused)
{
	return 0;
}

void __weak auxtrace_mmap__munmap(struct auxtrace_mmap *mm __maybe_unused)
{
}

void __weak auxtrace_mmap_params__init(
			struct auxtrace_mmap_params *mp __maybe_unused,
			off_t auxtrace_offset __maybe_unused,
			unsigned int auxtrace_pages __maybe_unused,
			bool auxtrace_overwrite __maybe_unused)
{
}

void __weak auxtrace_mmap_params__set_idx(
			struct auxtrace_mmap_params *mp __maybe_unused,
			struct perf_evlist *evlist __maybe_unused,
			int idx __maybe_unused,
			bool per_cpu __maybe_unused)
{
}

static void __perf_evlist__munmap(struct perf_evlist *evlist, int idx)
{
	if (evlist->mmap[idx].base != NULL) {
		munmap(evlist->mmap[idx].base, evlist->mmap_len);
		evlist->mmap[idx].base = NULL;
		atomic_set(&evlist->mmap[idx].refcnt, 0);
	}
	auxtrace_mmap__munmap(&evlist->mmap[idx].auxtrace_mmap);
}

void perf_evlist__munmap(struct perf_evlist *evlist)
{
	int i;

	if (evlist->mmap == NULL)
		return;

	for (i = 0; i < evlist->nr_mmaps; i++)
		__perf_evlist__munmap(evlist, i);

	zfree(&evlist->mmap);
}

static int perf_evlist__alloc_mmap(struct perf_evlist *evlist)
{
	evlist->nr_mmaps = cpu_map__nr(evlist->cpus);
	if (cpu_map__empty(evlist->cpus))
		evlist->nr_mmaps = thread_map__nr(evlist->threads);
	evlist->mmap = zalloc(evlist->nr_mmaps * sizeof(struct perf_mmap));
	return evlist->mmap != NULL ? 0 : -ENOMEM;
}

struct mmap_params {
	int prot;
	int mask;
	struct auxtrace_mmap_params auxtrace_mp;
};

static int __perf_evlist__mmap(struct perf_evlist *evlist, int idx,
			       struct mmap_params *mp, int fd)
{
	/*
	 * The last one will be done at perf_evlist__mmap_consume(), so that we
	 * make sure we don't prevent tools from consuming every last event in
	 * the ring buffer.
	 *
	 * I.e. we can get the POLLHUP meaning that the fd doesn't exist
	 * anymore, but the last events for it are still in the ring buffer,
	 * waiting to be consumed.
	 *
	 * Tools can choose to ignore this at their own discretion, but the
	 * evlist layer can't just drop it when filtering events in
	 * perf_evlist__filter_pollfd().
	 */
	atomic_set(&evlist->mmap[idx].refcnt, 2);
	evlist->mmap[idx].prev = 0;
	evlist->mmap[idx].mask = mp->mask;
	evlist->mmap[idx].base = mmap(NULL, evlist->mmap_len, mp->prot,
				      MAP_SHARED, fd, 0);
	if (evlist->mmap[idx].base == MAP_FAILED) {
		pr_debug2("failed to mmap perf event ring buffer, error %d\n",
			  errno);
		evlist->mmap[idx].base = NULL;
		return -1;
	}

	if (auxtrace_mmap__mmap(&evlist->mmap[idx].auxtrace_mmap,
				&mp->auxtrace_mp, evlist->mmap[idx].base, fd))
		return -1;

	return 0;
}

static int perf_evlist__mmap_per_evsel(struct perf_evlist *evlist, int idx,
				       struct mmap_params *mp, int cpu,
				       int thread, int *output)
{
	struct perf_evsel *evsel;

	evlist__for_each(evlist, evsel) {
		int fd;

		if (evsel->system_wide && thread)
			continue;

		fd = FD(evsel, cpu, thread);

		if (*output == -1) {
			*output = fd;
			if (__perf_evlist__mmap(evlist, idx, mp, *output) < 0)
				return -1;
		} else {
			if (ioctl(fd, PERF_EVENT_IOC_SET_OUTPUT, *output) != 0)
				return -1;

			perf_evlist__mmap_get(evlist, idx);
		}

		/*
		 * The system_wide flag causes a selected event to be opened
		 * always without a pid.  Consequently it will never get a
		 * POLLHUP, but it is used for tracking in combination with
		 * other events, so it should not need to be polled anyway.
		 * Therefore don't add it for polling.
		 */
		if (!evsel->system_wide &&
		    __perf_evlist__add_pollfd(evlist, fd, idx) < 0) {
			perf_evlist__mmap_put(evlist, idx);
			return -1;
		}

		if (evsel->attr.read_format & PERF_FORMAT_ID) {
			if (perf_evlist__id_add_fd(evlist, evsel, cpu, thread,
						   fd) < 0)
				return -1;
			perf_evlist__set_sid_idx(evlist, evsel, idx, cpu,
						 thread);
		}
	}

	return 0;
}

static int perf_evlist__mmap_per_cpu(struct perf_evlist *evlist,
				     struct mmap_params *mp)
{
	int cpu, thread;
	int nr_cpus = cpu_map__nr(evlist->cpus);
	int nr_threads = thread_map__nr(evlist->threads);

	pr_debug2("perf event ring buffer mmapped per cpu\n");
	for (cpu = 0; cpu < nr_cpus; cpu++) {
		int output = -1;

		auxtrace_mmap_params__set_idx(&mp->auxtrace_mp, evlist, cpu,
					      true);

		for (thread = 0; thread < nr_threads; thread++) {
			if (perf_evlist__mmap_per_evsel(evlist, cpu, mp, cpu,
							thread, &output))
				goto out_unmap;
		}
	}

	return 0;

out_unmap:
	for (cpu = 0; cpu < nr_cpus; cpu++)
		__perf_evlist__munmap(evlist, cpu);
	return -1;
}

static int perf_evlist__mmap_per_thread(struct perf_evlist *evlist,
					struct mmap_params *mp)
{
	int thread;
	int nr_threads = thread_map__nr(evlist->threads);

	pr_debug2("perf event ring buffer mmapped per thread\n");
	for (thread = 0; thread < nr_threads; thread++) {
		int output = -1;

		auxtrace_mmap_params__set_idx(&mp->auxtrace_mp, evlist, thread,
					      false);

		if (perf_evlist__mmap_per_evsel(evlist, thread, mp, 0, thread,
						&output))
			goto out_unmap;
	}

	return 0;

out_unmap:
	for (thread = 0; thread < nr_threads; thread++)
		__perf_evlist__munmap(evlist, thread);
	return -1;
}

static size_t perf_evlist__mmap_size(unsigned long pages)
{
	if (pages == UINT_MAX) {
		int max;

		if (sysctl__read_int("kernel/perf_event_mlock_kb", &max) < 0) {
			/*
			 * Pick a once upon a time good value, i.e. things look
			 * strange since we can't read a sysctl value, but let's not
			 * die yet...
			 */
			max = 512;
		} else {
			max -= (page_size / 1024);
		}

		pages = (max * 1024) / page_size;
		if (!is_power_of_2(pages))
			pages = rounddown_pow_of_two(pages);
	} else if (!is_power_of_2(pages))
		return 0;

	return (pages + 1) * page_size;
}

static long parse_pages_arg(const char *str, unsigned long min,
			    unsigned long max)
{
	unsigned long pages, val;
	static struct parse_tag tags[] = {
		{ .tag  = 'B', .mult = 1       },
		{ .tag  = 'K', .mult = 1 << 10 },
		{ .tag  = 'M', .mult = 1 << 20 },
		{ .tag  = 'G', .mult = 1 << 30 },
		{ .tag  = 0 },
	};

	if (str == NULL)
		return -EINVAL;

	val = parse_tag_value(str, tags);
	if (val != (unsigned long) -1) {
		/* we got file size value */
		pages = PERF_ALIGN(val, page_size) / page_size;
	} else {
		/* we got pages count value */
		char *eptr;
		pages = strtoul(str, &eptr, 10);
		if (*eptr != '\0')
			return -EINVAL;
	}

	if (pages == 0 && min == 0) {
		/* leave number of pages at 0 */
	} else if (!is_power_of_2(pages)) {
		/* round pages up to next power of 2 */
		pages = roundup_pow_of_two(pages);
		if (!pages)
			return -EINVAL;
		pr_info("rounding mmap pages size to %lu bytes (%lu pages)\n",
			pages * page_size, pages);
	}

	if (pages > max)
		return -EINVAL;

	return pages;
}

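/*
 * For example: "16" is taken as a page count and kept as is (already a
 * power of 2), "100" is rounded up to 128 pages, and "512K" is taken as a
 * size in bytes and converted to pages (128 pages with 4KiB pages).
 */
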
int __perf_evlist__parse_mmap_pages(unsigned int *mmap_pages, const char *str)
{
	unsigned long max = UINT_MAX;
	long pages;

	if (max > SIZE_MAX / page_size)
		max = SIZE_MAX / page_size;

	pages = parse_pages_arg(str, 1, max);
	if (pages < 0) {
		pr_err("Invalid argument for --mmap_pages/-m\n");
		return -1;
	}

	*mmap_pages = pages;
	return 0;
}

int perf_evlist__parse_mmap_pages(const struct option *opt, const char *str,
				  int unset __maybe_unused)
{
	return __perf_evlist__parse_mmap_pages(opt->value, str);
}

/**
 * perf_evlist__mmap_ex - Create mmaps to receive events.
 * @evlist: list of events
 * @pages: map length in pages
 * @overwrite: overwrite older events?
 * @auxtrace_pages: auxtrace map length in pages
 * @auxtrace_overwrite: overwrite older auxtrace data?
 *
 * If @overwrite is %false the user needs to signal event consumption using
 * perf_mmap__write_tail().  Using perf_evlist__mmap_read() does this
 * automatically.
 *
 * Similarly, if @auxtrace_overwrite is %false the user needs to signal data
 * consumption using auxtrace_mmap__write_tail().
 *
 * Return: %0 on success, negative error code otherwise.
 */
int perf_evlist__mmap_ex(struct perf_evlist *evlist, unsigned int pages,
			 bool overwrite, unsigned int auxtrace_pages,
			 bool auxtrace_overwrite)
{
	struct perf_evsel *evsel;
	const struct cpu_map *cpus = evlist->cpus;
	const struct thread_map *threads = evlist->threads;
	struct mmap_params mp = {
		.prot = PROT_READ | (overwrite ? 0 : PROT_WRITE),
	};

	if (evlist->mmap == NULL && perf_evlist__alloc_mmap(evlist) < 0)
		return -ENOMEM;

	if (evlist->pollfd.entries == NULL && perf_evlist__alloc_pollfd(evlist) < 0)
		return -ENOMEM;

	evlist->overwrite = overwrite;
	evlist->mmap_len = perf_evlist__mmap_size(pages);
	pr_debug("mmap size %zuB\n", evlist->mmap_len);
	mp.mask = evlist->mmap_len - page_size - 1;

	auxtrace_mmap_params__init(&mp.auxtrace_mp, evlist->mmap_len,
				   auxtrace_pages, auxtrace_overwrite);

	evlist__for_each(evlist, evsel) {
		if ((evsel->attr.read_format & PERF_FORMAT_ID) &&
		    evsel->sample_id == NULL &&
		    perf_evsel__alloc_id(evsel, cpu_map__nr(cpus), threads->nr) < 0)
			return -ENOMEM;
	}

	if (cpu_map__empty(cpus))
		return perf_evlist__mmap_per_thread(evlist, &mp);

	return perf_evlist__mmap_per_cpu(evlist, &mp);
}

int perf_evlist__mmap(struct perf_evlist *evlist, unsigned int pages,
		      bool overwrite)
{
	return perf_evlist__mmap_ex(evlist, pages, overwrite, 0, false);
}

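/*
 * Usage sketch (illustrative; "opts" stands in for a tool's options
 * structure): the typical setup sequence in a tool is
 *
 *	perf_evlist__create_maps(evlist, &opts->target);
 *	perf_evlist__open(evlist);
 *	perf_evlist__mmap(evlist, opts->mmap_pages, false);
 *
 * with the error handling after each step elided here.
 */
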
int perf_evlist__create_maps(struct perf_evlist *evlist, struct target *target)
{
	struct cpu_map *cpus;
	struct thread_map *threads;

	threads = thread_map__new_str(target->pid, target->tid, target->uid);

	if (!threads)
		return -1;

	if (target__uses_dummy_map(target))
		cpus = cpu_map__dummy_new();
	else
		cpus = cpu_map__new(target->cpu_list);

	if (!cpus)
		goto out_delete_threads;

	evlist->has_user_cpus = !!target->cpu_list;

	perf_evlist__set_maps(evlist, cpus, threads);

	return 0;

out_delete_threads:
	thread_map__put(threads);
	return -1;
}

void perf_evlist__set_maps(struct perf_evlist *evlist, struct cpu_map *cpus,
			   struct thread_map *threads)
{
	/*
	 * Allow for the possibility that one or another of the maps isn't being
	 * changed i.e. don't put it.  Note we are assuming the maps that are
	 * being applied are brand new and evlist is taking ownership of the
	 * original reference count of 1.  If that is not the case it is up to
	 * the caller to increase the reference count.
	 */
	if (cpus != evlist->cpus) {
		cpu_map__put(evlist->cpus);
		evlist->cpus = cpus;
	}

	if (threads != evlist->threads) {
		thread_map__put(evlist->threads);
		evlist->threads = threads;
	}

	perf_evlist__propagate_maps(evlist);
}

int perf_evlist__apply_filters(struct perf_evlist *evlist, struct perf_evsel **err_evsel)
{
	struct perf_evsel *evsel;
	int err = 0;
	const int ncpus = cpu_map__nr(evlist->cpus),
		  nthreads = thread_map__nr(evlist->threads);

	evlist__for_each(evlist, evsel) {
		if (evsel->filter == NULL)
			continue;

		/*
		 * Filters only work for tracepoint events, which don't have
		 * a cpu limit, so the evlist and evsel dimensions should
		 * always be the same.
		 */
		err = perf_evsel__apply_filter(evsel, ncpus, nthreads, evsel->filter);
		if (err) {
			*err_evsel = evsel;
			break;
		}
	}

	return err;
}

1235{
1236 struct perf_evsel *evsel;
1237 int err = 0;
745cefc5 1238
0050f7aa 1239 evlist__for_each(evlist, evsel) {
94ad89bc 1240 err = perf_evsel__set_filter(evsel, filter);
745cefc5
ACM
1241 if (err)
1242 break;
1243 }
1244
1245 return err;
0a102479 1246}
74429964 1247
be199ada 1248int perf_evlist__set_filter_pids(struct perf_evlist *evlist, size_t npids, pid_t *pids)
cfd70a26
ACM
1249{
1250 char *filter;
be199ada
ACM
1251 int ret = -1;
1252 size_t i;
cfd70a26 1253
be199ada
ACM
1254 for (i = 0; i < npids; ++i) {
1255 if (i == 0) {
1256 if (asprintf(&filter, "common_pid != %d", pids[i]) < 0)
1257 return -1;
1258 } else {
1259 char *tmp;
1260
1261 if (asprintf(&tmp, "%s && common_pid != %d", filter, pids[i]) < 0)
1262 goto out_free;
1263
1264 free(filter);
1265 filter = tmp;
1266 }
1267 }
cfd70a26
ACM
1268
1269 ret = perf_evlist__set_filter(evlist, filter);
be199ada 1270out_free:
cfd70a26
ACM
1271 free(filter);
1272 return ret;
1273}
1274
be199ada
ACM
1275int perf_evlist__set_filter_pid(struct perf_evlist *evlist, pid_t pid)
1276{
1277 return perf_evlist__set_filter_pids(evlist, 1, &pid);
1278}
1279
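/*
 * E.g. perf_evlist__set_filter_pids(evlist, 2, (pid_t []){ 1, 2 }) builds
 * and applies the tracepoint filter "common_pid != 1 && common_pid != 2",
 * which is handy for keeping a tool from tracing its own threads.
 */
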
bool perf_evlist__valid_sample_type(struct perf_evlist *evlist)
{
	struct perf_evsel *pos;

	if (evlist->nr_entries == 1)
		return true;

	if (evlist->id_pos < 0 || evlist->is_pos < 0)
		return false;

	evlist__for_each(evlist, pos) {
		if (pos->id_pos != evlist->id_pos ||
		    pos->is_pos != evlist->is_pos)
			return false;
	}

	return true;
}

u64 __perf_evlist__combined_sample_type(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel;

	if (evlist->combined_sample_type)
		return evlist->combined_sample_type;

	evlist__for_each(evlist, evsel)
		evlist->combined_sample_type |= evsel->attr.sample_type;

	return evlist->combined_sample_type;
}

u64 perf_evlist__combined_sample_type(struct perf_evlist *evlist)
{
	evlist->combined_sample_type = 0;
	return __perf_evlist__combined_sample_type(evlist);
}

u64 perf_evlist__combined_branch_type(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel;
	u64 branch_type = 0;

	evlist__for_each(evlist, evsel)
		branch_type |= evsel->attr.branch_sample_type;
	return branch_type;
}

bool perf_evlist__valid_read_format(struct perf_evlist *evlist)
{
	struct perf_evsel *first = perf_evlist__first(evlist), *pos = first;
	u64 read_format = first->attr.read_format;
	u64 sample_type = first->attr.sample_type;

	evlist__for_each(evlist, pos) {
		if (read_format != pos->attr.read_format)
			return false;
	}

	/* PERF_SAMPLE_READ implies PERF_FORMAT_ID. */
	if ((sample_type & PERF_SAMPLE_READ) &&
	    !(read_format & PERF_FORMAT_ID)) {
		return false;
	}

	return true;
}

u64 perf_evlist__read_format(struct perf_evlist *evlist)
{
	struct perf_evsel *first = perf_evlist__first(evlist);
	return first->attr.read_format;
}

u16 perf_evlist__id_hdr_size(struct perf_evlist *evlist)
{
	struct perf_evsel *first = perf_evlist__first(evlist);
	struct perf_sample *data;
	u64 sample_type;
	u16 size = 0;

	if (!first->attr.sample_id_all)
		goto out;

	sample_type = first->attr.sample_type;

	if (sample_type & PERF_SAMPLE_TID)
		size += sizeof(data->tid) * 2;

	if (sample_type & PERF_SAMPLE_TIME)
		size += sizeof(data->time);

	if (sample_type & PERF_SAMPLE_ID)
		size += sizeof(data->id);

	if (sample_type & PERF_SAMPLE_STREAM_ID)
		size += sizeof(data->stream_id);

	if (sample_type & PERF_SAMPLE_CPU)
		size += sizeof(data->cpu) * 2;

	if (sample_type & PERF_SAMPLE_IDENTIFIER)
		size += sizeof(data->id);
out:
	return size;
}

bool perf_evlist__valid_sample_id_all(struct perf_evlist *evlist)
{
	struct perf_evsel *first = perf_evlist__first(evlist), *pos = first;

	evlist__for_each_continue(evlist, pos) {
		if (first->attr.sample_id_all != pos->attr.sample_id_all)
			return false;
	}

	return true;
}

bool perf_evlist__sample_id_all(struct perf_evlist *evlist)
{
	struct perf_evsel *first = perf_evlist__first(evlist);
	return first->attr.sample_id_all;
}

void perf_evlist__set_selected(struct perf_evlist *evlist,
			       struct perf_evsel *evsel)
{
	evlist->selected = evsel;
}

void perf_evlist__close(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel;
	int ncpus = cpu_map__nr(evlist->cpus);
	int nthreads = thread_map__nr(evlist->threads);
	int n;

	evlist__for_each_reverse(evlist, evsel) {
		n = evsel->cpus ? evsel->cpus->nr : ncpus;
		perf_evsel__close(evsel, n, nthreads);
	}
}

static int perf_evlist__create_syswide_maps(struct perf_evlist *evlist)
{
	struct cpu_map *cpus;
	struct thread_map *threads;
	int err = -ENOMEM;

	/*
	 * Try reading /sys/devices/system/cpu/online to get
	 * an all cpus map.
	 *
	 * FIXME: -ENOMEM is the best we can do here, the cpu_map
	 * code needs an overhaul to properly forward the
	 * error, and we may not want to do that fallback to a
	 * default cpu identity map :-\
	 */
	cpus = cpu_map__new(NULL);
	if (!cpus)
		goto out;

	threads = thread_map__new_dummy();
	if (!threads)
		goto out_put;

	perf_evlist__set_maps(evlist, cpus, threads);
	err = 0;
out:
	return err;
out_put:
	cpu_map__put(cpus);
	goto out;
}

int perf_evlist__open(struct perf_evlist *evlist)
{
	struct perf_evsel *evsel;
	int err;

	/*
	 * Default: one fd per CPU, all threads, aka systemwide
	 * as sys_perf_event_open(cpu = -1, thread = -1) is EINVAL
	 */
	if (evlist->threads == NULL && evlist->cpus == NULL) {
		err = perf_evlist__create_syswide_maps(evlist);
		if (err < 0)
			goto out_err;
	}

	perf_evlist__update_id_pos(evlist);

	evlist__for_each(evlist, evsel) {
		err = perf_evsel__open(evsel, evlist->cpus, evlist->threads);
		if (err < 0)
			goto out_err;
	}

	return 0;
out_err:
	perf_evlist__close(evlist);
	errno = -err;
	return err;
}

int perf_evlist__prepare_workload(struct perf_evlist *evlist, struct target *target,
				  const char *argv[], bool pipe_output,
				  void (*exec_error)(int signo, siginfo_t *info, void *ucontext))
{
	int child_ready_pipe[2], go_pipe[2];
	char bf;

	if (pipe(child_ready_pipe) < 0) {
		perror("failed to create 'ready' pipe");
		return -1;
	}

	if (pipe(go_pipe) < 0) {
		perror("failed to create 'go' pipe");
		goto out_close_ready_pipe;
	}

	evlist->workload.pid = fork();
	if (evlist->workload.pid < 0) {
		perror("failed to fork");
		goto out_close_pipes;
	}

	if (!evlist->workload.pid) {
		int ret;

		if (pipe_output)
			dup2(2, 1);

		signal(SIGTERM, SIG_DFL);

		close(child_ready_pipe[0]);
		close(go_pipe[1]);
		fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC);

		/*
		 * Tell the parent we're ready to go
		 */
		close(child_ready_pipe[1]);

		/*
		 * Wait until the parent tells us to go.
		 */
		ret = read(go_pipe[0], &bf, 1);
		/*
		 * The parent will ask for the execvp() to be performed by
		 * writing exactly one byte, in workload.cork_fd, usually via
		 * perf_evlist__start_workload().
		 *
		 * For cancelling the workload without actually running it,
		 * the parent will just close workload.cork_fd, without writing
		 * anything, i.e. read will return zero and we just exit()
		 * here.
		 */
		if (ret != 1) {
			if (ret == -1)
				perror("unable to read pipe");
			exit(ret);
		}

		execvp(argv[0], (char **)argv);

		if (exec_error) {
			union sigval val;

			val.sival_int = errno;
			if (sigqueue(getppid(), SIGUSR1, val))
				perror(argv[0]);
		} else
			perror(argv[0]);
		exit(-1);
	}

	if (exec_error) {
		struct sigaction act = {
			.sa_flags     = SA_SIGINFO,
			.sa_sigaction = exec_error,
		};
		sigaction(SIGUSR1, &act, NULL);
	}

	if (target__none(target)) {
		if (evlist->threads == NULL) {
			fprintf(stderr, "FATAL: evlist->threads needs to be set at this point (%s:%d).\n",
				__func__, __LINE__);
			goto out_close_pipes;
		}
		thread_map__set_pid(evlist->threads, 0, evlist->workload.pid);
	}

	close(child_ready_pipe[1]);
	close(go_pipe[0]);
	/*
	 * wait for child to settle
	 */
	if (read(child_ready_pipe[0], &bf, 1) == -1) {
		perror("unable to read pipe");
		goto out_close_pipes;
	}

	fcntl(go_pipe[1], F_SETFD, FD_CLOEXEC);
	evlist->workload.cork_fd = go_pipe[1];
	close(child_ready_pipe[0]);
	return 0;

out_close_pipes:
	close(go_pipe[0]);
	close(go_pipe[1]);
out_close_ready_pipe:
	close(child_ready_pipe[0]);
	close(child_ready_pipe[1]);
	return -1;
}

int perf_evlist__start_workload(struct perf_evlist *evlist)
{
	if (evlist->workload.cork_fd > 0) {
		char bf = 0;
		int ret;
		/*
		 * Remove the cork, let it rip!
		 */
		ret = write(evlist->workload.cork_fd, &bf, 1);
		if (ret < 0)
			perror("unable to write to pipe");

		close(evlist->workload.cork_fd);
		return ret;
	}

	return 0;
}

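/*
 * Usage sketch (illustrative; "opts" stands in for a tool's options
 * structure): the two halves of the workload "cork" protocol:
 *
 *	perf_evlist__prepare_workload(evlist, &opts->target, argv, false, NULL);
 *	(open, mmap and enable the events, then:)
 *	perf_evlist__start_workload(evlist);
 *
 * prepare_workload() forks and parks the child on the cork pipe;
 * start_workload() writes the single byte that lets it exec the workload.
 */
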
int perf_evlist__parse_sample(struct perf_evlist *evlist, union perf_event *event,
			      struct perf_sample *sample)
{
	struct perf_evsel *evsel = perf_evlist__event2evsel(evlist, event);

	if (!evsel)
		return -EFAULT;
	return perf_evsel__parse_sample(evsel, event, sample);
}

size_t perf_evlist__fprintf(struct perf_evlist *evlist, FILE *fp)
{
	struct perf_evsel *evsel;
	size_t printed = 0;

	evlist__for_each(evlist, evsel) {
		printed += fprintf(fp, "%s%s", evsel->idx ? ", " : "",
				   perf_evsel__name(evsel));
	}

	return printed + fprintf(fp, "\n");
}

int perf_evlist__strerror_open(struct perf_evlist *evlist __maybe_unused,
			       int err, char *buf, size_t size)
{
	int printed, value;
	char sbuf[STRERR_BUFSIZE], *emsg = strerror_r(err, sbuf, sizeof(sbuf));

	switch (err) {
	case EACCES:
	case EPERM:
		printed = scnprintf(buf, size,
				    "Error:\t%s.\n"
				    "Hint:\tCheck /proc/sys/kernel/perf_event_paranoid setting.", emsg);

		value = perf_event_paranoid();

		printed += scnprintf(buf + printed, size - printed, "\nHint:\t");

		if (value >= 2) {
			printed += scnprintf(buf + printed, size - printed,
					     "For your workloads it needs to be <= 1\nHint:\t");
		}
		printed += scnprintf(buf + printed, size - printed,
				     "For system wide tracing it needs to be set to -1.\n");

		printed += scnprintf(buf + printed, size - printed,
				     "Hint:\tTry: 'sudo sh -c \"echo -1 > /proc/sys/kernel/perf_event_paranoid\"'\n"
				     "Hint:\tThe current value is %d.", value);
		break;
	default:
		scnprintf(buf, size, "%s", emsg);
		break;
	}

	return 0;
}

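/*
 * Usage sketch (illustrative): turning a failed open into a user-facing
 * message; perf_evlist__open() stores the error in errno on failure:
 *
 *	if (perf_evlist__open(evlist) < 0) {
 *		char msg[512];
 *
 *		perf_evlist__strerror_open(evlist, errno, msg, sizeof(msg));
 *		pr_err("%s\n", msg);
 *		return -1;
 *	}
 */
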
int perf_evlist__strerror_mmap(struct perf_evlist *evlist, int err, char *buf, size_t size)
{
	char sbuf[STRERR_BUFSIZE], *emsg = strerror_r(err, sbuf, sizeof(sbuf));
	int pages_attempted = evlist->mmap_len / 1024, pages_max_per_user, printed = 0;

	switch (err) {
	case EPERM:
		sysctl__read_int("kernel/perf_event_mlock_kb", &pages_max_per_user);
		printed += scnprintf(buf + printed, size - printed,
				     "Error:\t%s.\n"
				     "Hint:\tCheck /proc/sys/kernel/perf_event_mlock_kb (%d kB) setting.\n"
				     "Hint:\tTried using %zd kB.\n",
				     emsg, pages_max_per_user, pages_attempted);

		if (pages_attempted >= pages_max_per_user) {
			printed += scnprintf(buf + printed, size - printed,
					     "Hint:\tTry 'sudo sh -c \"echo %d > /proc/sys/kernel/perf_event_mlock_kb\"', or\n",
					     pages_max_per_user + pages_attempted);
		}

		printed += scnprintf(buf + printed, size - printed,
				     "Hint:\tTry using a smaller -m/--mmap-pages value.");
		break;
	default:
		scnprintf(buf, size, "%s", emsg);
		break;
	}

	return 0;
}

void perf_evlist__to_front(struct perf_evlist *evlist,
			   struct perf_evsel *move_evsel)
{
	struct perf_evsel *evsel, *n;
	LIST_HEAD(move);

	if (move_evsel == perf_evlist__first(evlist))
		return;

	evlist__for_each_safe(evlist, n, evsel) {
		if (evsel->leader == move_evsel->leader)
			list_move_tail(&evsel->node, &move);
	}

	list_splice(&move, &evlist->entries);
}

void perf_evlist__set_tracking_event(struct perf_evlist *evlist,
				     struct perf_evsel *tracking_evsel)
{
	struct perf_evsel *evsel;

	if (tracking_evsel->tracking)
		return;

	evlist__for_each(evlist, evsel) {
		if (evsel != tracking_evsel)
			evsel->tracking = false;
	}

	tracking_evsel->tracking = true;
}