]> git.proxmox.com Git - mirror_ubuntu-focal-kernel.git/blame - tools/perf/builtin-trace.c
perf evlist: Introduce set_filter_pid method
[mirror_ubuntu-focal-kernel.git] / tools / perf / builtin-trace.c
CommitLineData
#include <traceevent/event-parse.h>
#include "builtin.h"
#include "util/color.h"
#include "util/debug.h"
#include "util/evlist.h"
#include "util/machine.h"
#include "util/session.h"
#include "util/thread.h"
#include "util/parse-options.h"
#include "util/strlist.h"
#include "util/intlist.h"
#include "util/thread_map.h"
#include "util/stat.h"
#include "trace-event.h"
#include "util/parse-events.h"

#include <libaudit.h>
#include <stdlib.h>
#include <string.h>
#include <sys/eventfd.h>
#include <sys/mman.h>
#include <linux/futex.h>
514f1c67 22
456857bd
IM
23/* For older distros: */
24#ifndef MAP_STACK
25# define MAP_STACK 0x20000
26#endif
27
28#ifndef MADV_HWPOISON
29# define MADV_HWPOISON 100
30#endif
31
32#ifndef MADV_MERGEABLE
33# define MADV_MERGEABLE 12
34#endif
35
36#ifndef MADV_UNMERGEABLE
37# define MADV_UNMERGEABLE 13
38#endif
39
79d26a6a
BH
40#ifndef EFD_SEMAPHORE
41# define EFD_SEMAPHORE 1
42#endif
43
77170988
ACM
44struct tp_field {
45 int offset;
46 union {
47 u64 (*integer)(struct tp_field *field, struct perf_sample *sample);
48 void *(*pointer)(struct tp_field *field, struct perf_sample *sample);
49 };
50};
51
52#define TP_UINT_FIELD(bits) \
53static u64 tp_field__u##bits(struct tp_field *field, struct perf_sample *sample) \
54{ \
55 return *(u##bits *)(sample->raw_data + field->offset); \
56}
57
58TP_UINT_FIELD(8);
59TP_UINT_FIELD(16);
60TP_UINT_FIELD(32);
61TP_UINT_FIELD(64);
62
63#define TP_UINT_FIELD__SWAPPED(bits) \
64static u64 tp_field__swapped_u##bits(struct tp_field *field, struct perf_sample *sample) \
65{ \
66 u##bits value = *(u##bits *)(sample->raw_data + field->offset); \
67 return bswap_##bits(value);\
68}
69
70TP_UINT_FIELD__SWAPPED(16);
71TP_UINT_FIELD__SWAPPED(32);
72TP_UINT_FIELD__SWAPPED(64);
73
74static int tp_field__init_uint(struct tp_field *field,
75 struct format_field *format_field,
76 bool needs_swap)
77{
78 field->offset = format_field->offset;
79
80 switch (format_field->size) {
81 case 1:
82 field->integer = tp_field__u8;
83 break;
84 case 2:
85 field->integer = needs_swap ? tp_field__swapped_u16 : tp_field__u16;
86 break;
87 case 4:
88 field->integer = needs_swap ? tp_field__swapped_u32 : tp_field__u32;
89 break;
90 case 8:
91 field->integer = needs_swap ? tp_field__swapped_u64 : tp_field__u64;
92 break;
93 default:
94 return -1;
95 }
96
97 return 0;
98}
99
100static void *tp_field__ptr(struct tp_field *field, struct perf_sample *sample)
101{
102 return sample->raw_data + field->offset;
103}
104
105static int tp_field__init_ptr(struct tp_field *field, struct format_field *format_field)
106{
107 field->offset = format_field->offset;
108 field->pointer = tp_field__ptr;
109 return 0;
110}
111
112struct syscall_tp {
113 struct tp_field id;
114 union {
115 struct tp_field args, ret;
116 };
117};
118
119static int perf_evsel__init_tp_uint_field(struct perf_evsel *evsel,
120 struct tp_field *field,
121 const char *name)
122{
123 struct format_field *format_field = perf_evsel__field(evsel, name);
124
125 if (format_field == NULL)
126 return -1;
127
128 return tp_field__init_uint(field, format_field, evsel->needs_swap);
129}
130
/*
 * Initialise the struct syscall_tp member @name (hung off evsel->priv) from
 * the tracepoint field of the same name, as an unsigned integer.
 * Evaluates to the result of perf_evsel__init_tp_uint_field().
 *
 * @evsel is parenthesised so that any pointer-valued expression may be
 * passed; note that it is evaluated twice.
 */
#define perf_evsel__init_sc_tp_uint_field(evsel, name) \
	({ struct syscall_tp *sc = (evsel)->priv;\
	   perf_evsel__init_tp_uint_field((evsel), &sc->name, #name); })
134
/*
 * Look up the tracepoint field called @name on @evsel and bind @field to it
 * as a pointer-accessed field.
 *
 * Returns -1 if the evsel has no such field, otherwise whatever
 * tp_field__init_ptr() returns.
 */
static int perf_evsel__init_tp_ptr_field(struct perf_evsel *evsel,
					 struct tp_field *field,
					 const char *name)
{
	struct format_field *fmt = perf_evsel__field(evsel, name);

	return fmt ? tp_field__init_ptr(field, fmt) : -1;
}
146
/*
 * Initialise the struct syscall_tp member @name (hung off evsel->priv) from
 * the tracepoint field of the same name, as a pointer-accessed field.
 * Evaluates to the result of perf_evsel__init_tp_ptr_field().
 *
 * @evsel is parenthesised so that any pointer-valued expression may be
 * passed; note that it is evaluated twice.
 */
#define perf_evsel__init_sc_tp_ptr_field(evsel, name) \
	({ struct syscall_tp *sc = (evsel)->priv;\
	   perf_evsel__init_tp_ptr_field((evsel), &sc->name, #name); })
150
151static void perf_evsel__delete_priv(struct perf_evsel *evsel)
152{
04662523 153 zfree(&evsel->priv);
77170988
ACM
154 perf_evsel__delete(evsel);
155}
156
96695d44
NK
157static int perf_evsel__init_syscall_tp(struct perf_evsel *evsel, void *handler)
158{
159 evsel->priv = malloc(sizeof(struct syscall_tp));
160 if (evsel->priv != NULL) {
161 if (perf_evsel__init_sc_tp_uint_field(evsel, id))
162 goto out_delete;
163
164 evsel->handler = handler;
165 return 0;
166 }
167
168 return -ENOMEM;
169
170out_delete:
04662523 171 zfree(&evsel->priv);
96695d44
NK
172 return -ENOENT;
173}
174
/*
 * Create the evsel for one of the syscall tracepoints.
 *
 * @direction is the tracepoint name ("sys_enter" or "sys_exit" at the call
 * sites in this file). The "raw_syscalls" subsystem is tried first; older
 * kernels (e.g., RHEL6) expose the same events under "syscalls", which is
 * used as a fallback.
 *
 * Returns the initialised evsel, or NULL if the tracepoint could not be
 * created or its syscall_tp private data could not be set up.
 */
static struct perf_evsel *perf_evsel__syscall_newtp(const char *direction, void *handler)
{
	struct perf_evsel *evsel = perf_evsel__newtp("raw_syscalls", direction);

	/* older kernel (e.g., RHEL6) use syscalls:{enter,exit} */
	if (!evsel)
		evsel = perf_evsel__newtp("syscalls", direction);

	if (!evsel)
		return NULL;

	if (perf_evsel__init_syscall_tp(evsel, handler)) {
		perf_evsel__delete_priv(evsel);
		return NULL;
	}

	return evsel;
}
194
/*
 * Read the integer syscall_tp field @name of @evsel out of @sample by
 * calling the reader installed in fields->name.integer.
 *
 * Macro arguments are parenthesised so that arbitrary expressions can be
 * passed for @evsel and @sample.
 */
#define perf_evsel__sc_tp_uint(evsel, name, sample) \
	({ struct syscall_tp *fields = (evsel)->priv; \
	   fields->name.integer(&fields->name, (sample)); })
198
/*
 * Obtain the address of the syscall_tp field @name of @evsel inside @sample
 * by calling the reader installed in fields->name.pointer.
 *
 * Macro arguments are parenthesised so that arbitrary expressions can be
 * passed for @evsel and @sample.
 */
#define perf_evsel__sc_tp_ptr(evsel, name, sample) \
	({ struct syscall_tp *fields = (evsel)->priv; \
	   fields->name.pointer(&fields->name, (sample)); })
202
203static int perf_evlist__add_syscall_newtp(struct perf_evlist *evlist,
204 void *sys_enter_handler,
205 void *sys_exit_handler)
206{
207 int ret = -1;
77170988
ACM
208 struct perf_evsel *sys_enter, *sys_exit;
209
ef503831 210 sys_enter = perf_evsel__syscall_newtp("sys_enter", sys_enter_handler);
77170988
ACM
211 if (sys_enter == NULL)
212 goto out;
213
214 if (perf_evsel__init_sc_tp_ptr_field(sys_enter, args))
215 goto out_delete_sys_enter;
216
ef503831 217 sys_exit = perf_evsel__syscall_newtp("sys_exit", sys_exit_handler);
77170988
ACM
218 if (sys_exit == NULL)
219 goto out_delete_sys_enter;
220
221 if (perf_evsel__init_sc_tp_uint_field(sys_exit, ret))
222 goto out_delete_sys_exit;
223
224 perf_evlist__add(evlist, sys_enter);
225 perf_evlist__add(evlist, sys_exit);
226
227 ret = 0;
228out:
229 return ret;
230
231out_delete_sys_exit:
232 perf_evsel__delete_priv(sys_exit);
233out_delete_sys_enter:
234 perf_evsel__delete_priv(sys_enter);
235 goto out;
236}
237
238
01533e97
ACM
239struct syscall_arg {
240 unsigned long val;
75b757ca
ACM
241 struct thread *thread;
242 struct trace *trace;
1f115cb7 243 void *parm;
01533e97
ACM
244 u8 idx;
245 u8 mask;
246};
247
/*
 * Table mapping small integers to names.
 *
 * @offset:     value that corresponds to entries[0]; it is subtracted from
 *              the argument before indexing
 * @nr_entries: number of slots in @entries
 * @entries:    the names, indexed by (value - @offset)
 */
struct strarray {
	int		offset;
	int		nr_entries;
	const char	**entries;
};
253
/*
 * Define strarray__<array>, a struct strarray wrapping the string table
 * @array, with entries[0] corresponding to value 0.
 */
#define DEFINE_STRARRAY(array) struct strarray strarray__##array = { \
	.entries    = array, \
	.nr_entries = ARRAY_SIZE(array), \
}
258
03e3adc9
ACM
/*
 * Define strarray__<array>, a struct strarray wrapping the string table
 * @array, with entries[0] corresponding to value @off.
 */
#define DEFINE_STRARRAY_OFFSET(array, off) struct strarray strarray__##array = { \
	.entries    = array, \
	.nr_entries = ARRAY_SIZE(array), \
	.offset	    = off, \
}
264
975b7c2f
ACM
265static size_t __syscall_arg__scnprintf_strarray(char *bf, size_t size,
266 const char *intfmt,
267 struct syscall_arg *arg)
1f115cb7 268{
1f115cb7 269 struct strarray *sa = arg->parm;
03e3adc9 270 int idx = arg->val - sa->offset;
1f115cb7
ACM
271
272 if (idx < 0 || idx >= sa->nr_entries)
975b7c2f 273 return scnprintf(bf, size, intfmt, arg->val);
1f115cb7
ACM
274
275 return scnprintf(bf, size, "%s", sa->entries[idx]);
276}
277
975b7c2f
ACM
/*
 * strarray beautifier: print the name for @arg from the table in arg->parm,
 * falling back to the value in decimal ("%d") when it has no name.
 */
static size_t syscall_arg__scnprintf_strarray(char *bf, size_t size,
					      struct syscall_arg *arg)
{
	static const char fallback_fmt[] = "%d";

	return __syscall_arg__scnprintf_strarray(bf, size, fallback_fmt, arg);
}
283
1f115cb7
ACM
284#define SCA_STRARRAY syscall_arg__scnprintf_strarray
285
844ae5b4
ACM
286#if defined(__i386__) || defined(__x86_64__)
287/*
288 * FIXME: Make this available to all arches as soon as the ioctl beautifier
289 * gets rewritten to support all arches.
290 */
78645cf3
ACM
/*
 * strarray beautifier for values conventionally shown in hex: print the name
 * for @arg from the table in arg->parm, falling back to "%#x" when it has no
 * name.
 */
static size_t syscall_arg__scnprintf_strhexarray(char *bf, size_t size,
						 struct syscall_arg *arg)
{
	static const char fallback_fmt[] = "%#x";

	return __syscall_arg__scnprintf_strarray(bf, size, fallback_fmt, arg);
}
296
297#define SCA_STRHEXARRAY syscall_arg__scnprintf_strhexarray
844ae5b4 298#endif /* defined(__i386__) || defined(__x86_64__) */
78645cf3 299
75b757ca
ACM
300static size_t syscall_arg__scnprintf_fd(char *bf, size_t size,
301 struct syscall_arg *arg);
302
303#define SCA_FD syscall_arg__scnprintf_fd
304
305static size_t syscall_arg__scnprintf_fd_at(char *bf, size_t size,
306 struct syscall_arg *arg)
307{
308 int fd = arg->val;
309
310 if (fd == AT_FDCWD)
311 return scnprintf(bf, size, "CWD");
312
313 return syscall_arg__scnprintf_fd(bf, size, arg);
314}
315
316#define SCA_FDAT syscall_arg__scnprintf_fd_at
317
318static size_t syscall_arg__scnprintf_close_fd(char *bf, size_t size,
319 struct syscall_arg *arg);
320
321#define SCA_CLOSE_FD syscall_arg__scnprintf_close_fd
322
6e7eeb51 323static size_t syscall_arg__scnprintf_hex(char *bf, size_t size,
01533e97 324 struct syscall_arg *arg)
13d4ff3e 325{
01533e97 326 return scnprintf(bf, size, "%#lx", arg->val);
13d4ff3e
ACM
327}
328
beccb2b5
ACM
329#define SCA_HEX syscall_arg__scnprintf_hex
330
6e7eeb51 331static size_t syscall_arg__scnprintf_mmap_prot(char *bf, size_t size,
01533e97 332 struct syscall_arg *arg)
ae685380 333{
01533e97 334 int printed = 0, prot = arg->val;
ae685380
ACM
335
336 if (prot == PROT_NONE)
337 return scnprintf(bf, size, "NONE");
338#define P_MMAP_PROT(n) \
339 if (prot & PROT_##n) { \
340 printed += scnprintf(bf + printed, size - printed, "%s%s", printed ? "|" : "", #n); \
341 prot &= ~PROT_##n; \
342 }
343
344 P_MMAP_PROT(EXEC);
345 P_MMAP_PROT(READ);
346 P_MMAP_PROT(WRITE);
347#ifdef PROT_SEM
348 P_MMAP_PROT(SEM);
349#endif
350 P_MMAP_PROT(GROWSDOWN);
351 P_MMAP_PROT(GROWSUP);
352#undef P_MMAP_PROT
353
354 if (prot)
355 printed += scnprintf(bf + printed, size - printed, "%s%#x", printed ? "|" : "", prot);
356
357 return printed;
358}
359
360#define SCA_MMAP_PROT syscall_arg__scnprintf_mmap_prot
361
6e7eeb51 362static size_t syscall_arg__scnprintf_mmap_flags(char *bf, size_t size,
01533e97 363 struct syscall_arg *arg)
941557e0 364{
01533e97 365 int printed = 0, flags = arg->val;
941557e0
ACM
366
367#define P_MMAP_FLAG(n) \
368 if (flags & MAP_##n) { \
369 printed += scnprintf(bf + printed, size - printed, "%s%s", printed ? "|" : "", #n); \
370 flags &= ~MAP_##n; \
371 }
372
373 P_MMAP_FLAG(SHARED);
374 P_MMAP_FLAG(PRIVATE);
41817815 375#ifdef MAP_32BIT
941557e0 376 P_MMAP_FLAG(32BIT);
41817815 377#endif
941557e0
ACM
378 P_MMAP_FLAG(ANONYMOUS);
379 P_MMAP_FLAG(DENYWRITE);
380 P_MMAP_FLAG(EXECUTABLE);
381 P_MMAP_FLAG(FILE);
382 P_MMAP_FLAG(FIXED);
383 P_MMAP_FLAG(GROWSDOWN);
f2935f3e 384#ifdef MAP_HUGETLB
941557e0 385 P_MMAP_FLAG(HUGETLB);
f2935f3e 386#endif
941557e0
ACM
387 P_MMAP_FLAG(LOCKED);
388 P_MMAP_FLAG(NONBLOCK);
389 P_MMAP_FLAG(NORESERVE);
390 P_MMAP_FLAG(POPULATE);
391 P_MMAP_FLAG(STACK);
392#ifdef MAP_UNINITIALIZED
393 P_MMAP_FLAG(UNINITIALIZED);
394#endif
395#undef P_MMAP_FLAG
396
397 if (flags)
398 printed += scnprintf(bf + printed, size - printed, "%s%#x", printed ? "|" : "", flags);
399
400 return printed;
401}
402
403#define SCA_MMAP_FLAGS syscall_arg__scnprintf_mmap_flags
404
86998dda
AS
405static size_t syscall_arg__scnprintf_mremap_flags(char *bf, size_t size,
406 struct syscall_arg *arg)
407{
408 int printed = 0, flags = arg->val;
409
410#define P_MREMAP_FLAG(n) \
411 if (flags & MREMAP_##n) { \
412 printed += scnprintf(bf + printed, size - printed, "%s%s", printed ? "|" : "", #n); \
413 flags &= ~MREMAP_##n; \
414 }
415
416 P_MREMAP_FLAG(MAYMOVE);
417#ifdef MREMAP_FIXED
418 P_MREMAP_FLAG(FIXED);
419#endif
420#undef P_MREMAP_FLAG
421
422 if (flags)
423 printed += scnprintf(bf + printed, size - printed, "%s%#x", printed ? "|" : "", flags);
424
425 return printed;
426}
427
428#define SCA_MREMAP_FLAGS syscall_arg__scnprintf_mremap_flags
429
6e7eeb51 430static size_t syscall_arg__scnprintf_madvise_behavior(char *bf, size_t size,
01533e97 431 struct syscall_arg *arg)
9e9716d1 432{
01533e97 433 int behavior = arg->val;
9e9716d1
ACM
434
435 switch (behavior) {
436#define P_MADV_BHV(n) case MADV_##n: return scnprintf(bf, size, #n)
437 P_MADV_BHV(NORMAL);
438 P_MADV_BHV(RANDOM);
439 P_MADV_BHV(SEQUENTIAL);
440 P_MADV_BHV(WILLNEED);
441 P_MADV_BHV(DONTNEED);
442 P_MADV_BHV(REMOVE);
443 P_MADV_BHV(DONTFORK);
444 P_MADV_BHV(DOFORK);
445 P_MADV_BHV(HWPOISON);
446#ifdef MADV_SOFT_OFFLINE
447 P_MADV_BHV(SOFT_OFFLINE);
448#endif
449 P_MADV_BHV(MERGEABLE);
450 P_MADV_BHV(UNMERGEABLE);
f2935f3e 451#ifdef MADV_HUGEPAGE
9e9716d1 452 P_MADV_BHV(HUGEPAGE);
f2935f3e
DA
453#endif
454#ifdef MADV_NOHUGEPAGE
9e9716d1 455 P_MADV_BHV(NOHUGEPAGE);
f2935f3e 456#endif
9e9716d1
ACM
457#ifdef MADV_DONTDUMP
458 P_MADV_BHV(DONTDUMP);
459#endif
460#ifdef MADV_DODUMP
461 P_MADV_BHV(DODUMP);
462#endif
463#undef P_MADV_PHV
464 default: break;
465 }
466
467 return scnprintf(bf, size, "%#x", behavior);
468}
469
470#define SCA_MADV_BHV syscall_arg__scnprintf_madvise_behavior
471
5cea6ff2
ACM
472static size_t syscall_arg__scnprintf_flock(char *bf, size_t size,
473 struct syscall_arg *arg)
474{
475 int printed = 0, op = arg->val;
476
477 if (op == 0)
478 return scnprintf(bf, size, "NONE");
479#define P_CMD(cmd) \
480 if ((op & LOCK_##cmd) == LOCK_##cmd) { \
481 printed += scnprintf(bf + printed, size - printed, "%s%s", printed ? "|" : "", #cmd); \
482 op &= ~LOCK_##cmd; \
483 }
484
485 P_CMD(SH);
486 P_CMD(EX);
487 P_CMD(NB);
488 P_CMD(UN);
489 P_CMD(MAND);
490 P_CMD(RW);
491 P_CMD(READ);
492 P_CMD(WRITE);
493#undef P_OP
494
495 if (op)
496 printed += scnprintf(bf + printed, size - printed, "%s%#x", printed ? "|" : "", op);
497
498 return printed;
499}
500
501#define SCA_FLOCK syscall_arg__scnprintf_flock
502
01533e97 503static size_t syscall_arg__scnprintf_futex_op(char *bf, size_t size, struct syscall_arg *arg)
f9da0b0c
ACM
504{
505 enum syscall_futex_args {
506 SCF_UADDR = (1 << 0),
507 SCF_OP = (1 << 1),
508 SCF_VAL = (1 << 2),
509 SCF_TIMEOUT = (1 << 3),
510 SCF_UADDR2 = (1 << 4),
511 SCF_VAL3 = (1 << 5),
512 };
01533e97 513 int op = arg->val;
f9da0b0c
ACM
514 int cmd = op & FUTEX_CMD_MASK;
515 size_t printed = 0;
516
517 switch (cmd) {
518#define P_FUTEX_OP(n) case FUTEX_##n: printed = scnprintf(bf, size, #n);
01533e97
ACM
519 P_FUTEX_OP(WAIT); arg->mask |= SCF_VAL3|SCF_UADDR2; break;
520 P_FUTEX_OP(WAKE); arg->mask |= SCF_VAL3|SCF_UADDR2|SCF_TIMEOUT; break;
521 P_FUTEX_OP(FD); arg->mask |= SCF_VAL3|SCF_UADDR2|SCF_TIMEOUT; break;
522 P_FUTEX_OP(REQUEUE); arg->mask |= SCF_VAL3|SCF_TIMEOUT; break;
523 P_FUTEX_OP(CMP_REQUEUE); arg->mask |= SCF_TIMEOUT; break;
524 P_FUTEX_OP(CMP_REQUEUE_PI); arg->mask |= SCF_TIMEOUT; break;
f9da0b0c 525 P_FUTEX_OP(WAKE_OP); break;
01533e97
ACM
526 P_FUTEX_OP(LOCK_PI); arg->mask |= SCF_VAL3|SCF_UADDR2|SCF_TIMEOUT; break;
527 P_FUTEX_OP(UNLOCK_PI); arg->mask |= SCF_VAL3|SCF_UADDR2|SCF_TIMEOUT; break;
528 P_FUTEX_OP(TRYLOCK_PI); arg->mask |= SCF_VAL3|SCF_UADDR2; break;
529 P_FUTEX_OP(WAIT_BITSET); arg->mask |= SCF_UADDR2; break;
530 P_FUTEX_OP(WAKE_BITSET); arg->mask |= SCF_UADDR2; break;
f9da0b0c
ACM
531 P_FUTEX_OP(WAIT_REQUEUE_PI); break;
532 default: printed = scnprintf(bf, size, "%#x", cmd); break;
533 }
534
535 if (op & FUTEX_PRIVATE_FLAG)
536 printed += scnprintf(bf + printed, size - printed, "|PRIV");
537
538 if (op & FUTEX_CLOCK_REALTIME)
539 printed += scnprintf(bf + printed, size - printed, "|CLKRT");
540
541 return printed;
542}
543
efe6b882
ACM
544#define SCA_FUTEX_OP syscall_arg__scnprintf_futex_op
545
03e3adc9
ACM
546static const char *epoll_ctl_ops[] = { "ADD", "DEL", "MOD", };
547static DEFINE_STRARRAY_OFFSET(epoll_ctl_ops, 1);
eac032c5 548
1f115cb7
ACM
549static const char *itimers[] = { "REAL", "VIRTUAL", "PROF", };
550static DEFINE_STRARRAY(itimers);
551
efe6b882
ACM
552static const char *whences[] = { "SET", "CUR", "END",
553#ifdef SEEK_DATA
554"DATA",
555#endif
556#ifdef SEEK_HOLE
557"HOLE",
558#endif
559};
560static DEFINE_STRARRAY(whences);
f9da0b0c 561
80f587d5
ACM
562static const char *fcntl_cmds[] = {
563 "DUPFD", "GETFD", "SETFD", "GETFL", "SETFL", "GETLK", "SETLK",
564 "SETLKW", "SETOWN", "GETOWN", "SETSIG", "GETSIG", "F_GETLK64",
565 "F_SETLK64", "F_SETLKW64", "F_SETOWN_EX", "F_GETOWN_EX",
566 "F_GETOWNER_UIDS",
567};
568static DEFINE_STRARRAY(fcntl_cmds);
569
c045bf02
ACM
570static const char *rlimit_resources[] = {
571 "CPU", "FSIZE", "DATA", "STACK", "CORE", "RSS", "NPROC", "NOFILE",
572 "MEMLOCK", "AS", "LOCKS", "SIGPENDING", "MSGQUEUE", "NICE", "RTPRIO",
573 "RTTIME",
574};
575static DEFINE_STRARRAY(rlimit_resources);
576
eb5b1b14
ACM
577static const char *sighow[] = { "BLOCK", "UNBLOCK", "SETMASK", };
578static DEFINE_STRARRAY(sighow);
579
4f8c1b74
DA
580static const char *clockid[] = {
581 "REALTIME", "MONOTONIC", "PROCESS_CPUTIME_ID", "THREAD_CPUTIME_ID",
582 "MONOTONIC_RAW", "REALTIME_COARSE", "MONOTONIC_COARSE",
583};
584static DEFINE_STRARRAY(clockid);
585
e10bce81
ACM
586static const char *socket_families[] = {
587 "UNSPEC", "LOCAL", "INET", "AX25", "IPX", "APPLETALK", "NETROM",
588 "BRIDGE", "ATMPVC", "X25", "INET6", "ROSE", "DECnet", "NETBEUI",
589 "SECURITY", "KEY", "NETLINK", "PACKET", "ASH", "ECONET", "ATMSVC",
590 "RDS", "SNA", "IRDA", "PPPOX", "WANPIPE", "LLC", "IB", "CAN", "TIPC",
591 "BLUETOOTH", "IUCV", "RXRPC", "ISDN", "PHONET", "IEEE802154", "CAIF",
592 "ALG", "NFC", "VSOCK",
593};
594static DEFINE_STRARRAY(socket_families);
595
a28b24b2
ACM
596#ifndef SOCK_TYPE_MASK
597#define SOCK_TYPE_MASK 0xf
598#endif
599
600static size_t syscall_arg__scnprintf_socket_type(char *bf, size_t size,
601 struct syscall_arg *arg)
602{
603 size_t printed;
604 int type = arg->val,
605 flags = type & ~SOCK_TYPE_MASK;
606
607 type &= SOCK_TYPE_MASK;
608 /*
609 * Can't use a strarray, MIPS may override for ABI reasons.
610 */
611 switch (type) {
612#define P_SK_TYPE(n) case SOCK_##n: printed = scnprintf(bf, size, #n); break;
613 P_SK_TYPE(STREAM);
614 P_SK_TYPE(DGRAM);
615 P_SK_TYPE(RAW);
616 P_SK_TYPE(RDM);
617 P_SK_TYPE(SEQPACKET);
618 P_SK_TYPE(DCCP);
619 P_SK_TYPE(PACKET);
620#undef P_SK_TYPE
621 default:
622 printed = scnprintf(bf, size, "%#x", type);
623 }
624
625#define P_SK_FLAG(n) \
626 if (flags & SOCK_##n) { \
627 printed += scnprintf(bf + printed, size - printed, "|%s", #n); \
628 flags &= ~SOCK_##n; \
629 }
630
631 P_SK_FLAG(CLOEXEC);
632 P_SK_FLAG(NONBLOCK);
633#undef P_SK_FLAG
634
635 if (flags)
636 printed += scnprintf(bf + printed, size - printed, "|%#x", flags);
637
638 return printed;
639}
640
641#define SCA_SK_TYPE syscall_arg__scnprintf_socket_type
642
b2cc99fd
ACM
643#ifndef MSG_PROBE
644#define MSG_PROBE 0x10
645#endif
b6e8f8f4
DA
646#ifndef MSG_WAITFORONE
647#define MSG_WAITFORONE 0x10000
648#endif
b2cc99fd
ACM
649#ifndef MSG_SENDPAGE_NOTLAST
650#define MSG_SENDPAGE_NOTLAST 0x20000
651#endif
652#ifndef MSG_FASTOPEN
653#define MSG_FASTOPEN 0x20000000
654#endif
655
656static size_t syscall_arg__scnprintf_msg_flags(char *bf, size_t size,
657 struct syscall_arg *arg)
658{
659 int printed = 0, flags = arg->val;
660
661 if (flags == 0)
662 return scnprintf(bf, size, "NONE");
663#define P_MSG_FLAG(n) \
664 if (flags & MSG_##n) { \
665 printed += scnprintf(bf + printed, size - printed, "%s%s", printed ? "|" : "", #n); \
666 flags &= ~MSG_##n; \
667 }
668
669 P_MSG_FLAG(OOB);
670 P_MSG_FLAG(PEEK);
671 P_MSG_FLAG(DONTROUTE);
672 P_MSG_FLAG(TRYHARD);
673 P_MSG_FLAG(CTRUNC);
674 P_MSG_FLAG(PROBE);
675 P_MSG_FLAG(TRUNC);
676 P_MSG_FLAG(DONTWAIT);
677 P_MSG_FLAG(EOR);
678 P_MSG_FLAG(WAITALL);
679 P_MSG_FLAG(FIN);
680 P_MSG_FLAG(SYN);
681 P_MSG_FLAG(CONFIRM);
682 P_MSG_FLAG(RST);
683 P_MSG_FLAG(ERRQUEUE);
684 P_MSG_FLAG(NOSIGNAL);
685 P_MSG_FLAG(MORE);
686 P_MSG_FLAG(WAITFORONE);
687 P_MSG_FLAG(SENDPAGE_NOTLAST);
688 P_MSG_FLAG(FASTOPEN);
689 P_MSG_FLAG(CMSG_CLOEXEC);
690#undef P_MSG_FLAG
691
692 if (flags)
693 printed += scnprintf(bf + printed, size - printed, "%s%#x", printed ? "|" : "", flags);
694
695 return printed;
696}
697
698#define SCA_MSG_FLAGS syscall_arg__scnprintf_msg_flags
699
51108999
ACM
700static size_t syscall_arg__scnprintf_access_mode(char *bf, size_t size,
701 struct syscall_arg *arg)
702{
703 size_t printed = 0;
704 int mode = arg->val;
705
706 if (mode == F_OK) /* 0 */
707 return scnprintf(bf, size, "F");
708#define P_MODE(n) \
709 if (mode & n##_OK) { \
710 printed += scnprintf(bf + printed, size - printed, "%s", #n); \
711 mode &= ~n##_OK; \
712 }
713
714 P_MODE(R);
715 P_MODE(W);
716 P_MODE(X);
717#undef P_MODE
718
719 if (mode)
720 printed += scnprintf(bf + printed, size - printed, "|%#x", mode);
721
722 return printed;
723}
724
725#define SCA_ACCMODE syscall_arg__scnprintf_access_mode
726
be65a89a 727static size_t syscall_arg__scnprintf_open_flags(char *bf, size_t size,
01533e97 728 struct syscall_arg *arg)
be65a89a 729{
01533e97 730 int printed = 0, flags = arg->val;
be65a89a
ACM
731
732 if (!(flags & O_CREAT))
01533e97 733 arg->mask |= 1 << (arg->idx + 1); /* Mask the mode parm */
be65a89a
ACM
734
735 if (flags == 0)
736 return scnprintf(bf, size, "RDONLY");
737#define P_FLAG(n) \
738 if (flags & O_##n) { \
739 printed += scnprintf(bf + printed, size - printed, "%s%s", printed ? "|" : "", #n); \
740 flags &= ~O_##n; \
741 }
742
743 P_FLAG(APPEND);
744 P_FLAG(ASYNC);
745 P_FLAG(CLOEXEC);
746 P_FLAG(CREAT);
747 P_FLAG(DIRECT);
748 P_FLAG(DIRECTORY);
749 P_FLAG(EXCL);
750 P_FLAG(LARGEFILE);
751 P_FLAG(NOATIME);
752 P_FLAG(NOCTTY);
753#ifdef O_NONBLOCK
754 P_FLAG(NONBLOCK);
755#elif O_NDELAY
756 P_FLAG(NDELAY);
757#endif
758#ifdef O_PATH
759 P_FLAG(PATH);
760#endif
761 P_FLAG(RDWR);
762#ifdef O_DSYNC
763 if ((flags & O_SYNC) == O_SYNC)
764 printed += scnprintf(bf + printed, size - printed, "%s%s", printed ? "|" : "", "SYNC");
765 else {
766 P_FLAG(DSYNC);
767 }
768#else
769 P_FLAG(SYNC);
770#endif
771 P_FLAG(TRUNC);
772 P_FLAG(WRONLY);
773#undef P_FLAG
774
775 if (flags)
776 printed += scnprintf(bf + printed, size - printed, "%s%#x", printed ? "|" : "", flags);
777
778 return printed;
779}
780
781#define SCA_OPEN_FLAGS syscall_arg__scnprintf_open_flags
782
49af9e93
ACM
783static size_t syscall_arg__scnprintf_eventfd_flags(char *bf, size_t size,
784 struct syscall_arg *arg)
785{
786 int printed = 0, flags = arg->val;
787
788 if (flags == 0)
789 return scnprintf(bf, size, "NONE");
790#define P_FLAG(n) \
791 if (flags & EFD_##n) { \
792 printed += scnprintf(bf + printed, size - printed, "%s%s", printed ? "|" : "", #n); \
793 flags &= ~EFD_##n; \
794 }
795
796 P_FLAG(SEMAPHORE);
797 P_FLAG(CLOEXEC);
798 P_FLAG(NONBLOCK);
799#undef P_FLAG
800
801 if (flags)
802 printed += scnprintf(bf + printed, size - printed, "%s%#x", printed ? "|" : "", flags);
803
804 return printed;
805}
806
807#define SCA_EFD_FLAGS syscall_arg__scnprintf_eventfd_flags
808
46cce19b
ACM
809static size_t syscall_arg__scnprintf_pipe_flags(char *bf, size_t size,
810 struct syscall_arg *arg)
811{
812 int printed = 0, flags = arg->val;
813
814#define P_FLAG(n) \
815 if (flags & O_##n) { \
816 printed += scnprintf(bf + printed, size - printed, "%s%s", printed ? "|" : "", #n); \
817 flags &= ~O_##n; \
818 }
819
820 P_FLAG(CLOEXEC);
821 P_FLAG(NONBLOCK);
822#undef P_FLAG
823
824 if (flags)
825 printed += scnprintf(bf + printed, size - printed, "%s%#x", printed ? "|" : "", flags);
826
827 return printed;
828}
829
830#define SCA_PIPE_FLAGS syscall_arg__scnprintf_pipe_flags
831
8bad5b0a
ACM
832static size_t syscall_arg__scnprintf_signum(char *bf, size_t size, struct syscall_arg *arg)
833{
834 int sig = arg->val;
835
836 switch (sig) {
837#define P_SIGNUM(n) case SIG##n: return scnprintf(bf, size, #n)
838 P_SIGNUM(HUP);
839 P_SIGNUM(INT);
840 P_SIGNUM(QUIT);
841 P_SIGNUM(ILL);
842 P_SIGNUM(TRAP);
843 P_SIGNUM(ABRT);
844 P_SIGNUM(BUS);
845 P_SIGNUM(FPE);
846 P_SIGNUM(KILL);
847 P_SIGNUM(USR1);
848 P_SIGNUM(SEGV);
849 P_SIGNUM(USR2);
850 P_SIGNUM(PIPE);
851 P_SIGNUM(ALRM);
852 P_SIGNUM(TERM);
8bad5b0a
ACM
853 P_SIGNUM(CHLD);
854 P_SIGNUM(CONT);
855 P_SIGNUM(STOP);
856 P_SIGNUM(TSTP);
857 P_SIGNUM(TTIN);
858 P_SIGNUM(TTOU);
859 P_SIGNUM(URG);
860 P_SIGNUM(XCPU);
861 P_SIGNUM(XFSZ);
862 P_SIGNUM(VTALRM);
863 P_SIGNUM(PROF);
864 P_SIGNUM(WINCH);
865 P_SIGNUM(IO);
866 P_SIGNUM(PWR);
867 P_SIGNUM(SYS);
02c5bb4a
BH
868#ifdef SIGEMT
869 P_SIGNUM(EMT);
870#endif
871#ifdef SIGSTKFLT
872 P_SIGNUM(STKFLT);
873#endif
874#ifdef SIGSWI
875 P_SIGNUM(SWI);
876#endif
8bad5b0a
ACM
877 default: break;
878 }
879
880 return scnprintf(bf, size, "%#x", sig);
881}
882
883#define SCA_SIGNUM syscall_arg__scnprintf_signum
884
844ae5b4
ACM
885#if defined(__i386__) || defined(__x86_64__)
886/*
887 * FIXME: Make this available to all arches.
888 */
78645cf3
ACM
889#define TCGETS 0x5401
890
891static const char *tioctls[] = {
892 "TCGETS", "TCSETS", "TCSETSW", "TCSETSF", "TCGETA", "TCSETA", "TCSETAW",
893 "TCSETAF", "TCSBRK", "TCXONC", "TCFLSH", "TIOCEXCL", "TIOCNXCL",
894 "TIOCSCTTY", "TIOCGPGRP", "TIOCSPGRP", "TIOCOUTQ", "TIOCSTI",
895 "TIOCGWINSZ", "TIOCSWINSZ", "TIOCMGET", "TIOCMBIS", "TIOCMBIC",
896 "TIOCMSET", "TIOCGSOFTCAR", "TIOCSSOFTCAR", "FIONREAD", "TIOCLINUX",
897 "TIOCCONS", "TIOCGSERIAL", "TIOCSSERIAL", "TIOCPKT", "FIONBIO",
898 "TIOCNOTTY", "TIOCSETD", "TIOCGETD", "TCSBRKP", [0x27] = "TIOCSBRK",
899 "TIOCCBRK", "TIOCGSID", "TCGETS2", "TCSETS2", "TCSETSW2", "TCSETSF2",
900 "TIOCGRS485", "TIOCSRS485", "TIOCGPTN", "TIOCSPTLCK",
901 "TIOCGDEV||TCGETX", "TCSETX", "TCSETXF", "TCSETXW", "TIOCSIG",
902 "TIOCVHANGUP", "TIOCGPKT", "TIOCGPTLCK", "TIOCGEXCL",
903 [0x50] = "FIONCLEX", "FIOCLEX", "FIOASYNC", "TIOCSERCONFIG",
904 "TIOCSERGWILD", "TIOCSERSWILD", "TIOCGLCKTRMIOS", "TIOCSLCKTRMIOS",
905 "TIOCSERGSTRUCT", "TIOCSERGETLSR", "TIOCSERGETMULTI", "TIOCSERSETMULTI",
906 "TIOCMIWAIT", "TIOCGICOUNT", [0x60] = "FIOQSIZE",
907};
908
909static DEFINE_STRARRAY_OFFSET(tioctls, 0x5401);
844ae5b4 910#endif /* defined(__i386__) || defined(__x86_64__) */
78645cf3 911
453350dd
ACM
/*
 * Shorthand for a syscall_fmt entry whose argument number @arg is printed
 * through SCA_STRARRAY using the table strarray__<array>.
 * @name is not used by the expansion; it only documents the argument's name
 * at the point of use.
 */
#define STRARRAY(arg, name, array) \
	  .arg_scnprintf = { [arg] = SCA_STRARRAY, }, \
	  .arg_parm	 = { [arg] = &strarray__##array, }
915
514f1c67
ACM
916static struct syscall_fmt {
917 const char *name;
aec1930b 918 const char *alias;
01533e97 919 size_t (*arg_scnprintf[6])(char *bf, size_t size, struct syscall_arg *arg);
1f115cb7 920 void *arg_parm[6];
514f1c67
ACM
921 bool errmsg;
922 bool timeout;
04b34729 923 bool hexret;
514f1c67 924} syscall_fmts[] = {
51108999
ACM
925 { .name = "access", .errmsg = true,
926 .arg_scnprintf = { [1] = SCA_ACCMODE, /* mode */ }, },
aec1930b 927 { .name = "arch_prctl", .errmsg = true, .alias = "prctl", },
beccb2b5
ACM
928 { .name = "brk", .hexret = true,
929 .arg_scnprintf = { [0] = SCA_HEX, /* brk */ }, },
4f8c1b74 930 { .name = "clock_gettime", .errmsg = true, STRARRAY(0, clk_id, clockid), },
75b757ca 931 { .name = "close", .errmsg = true,
48000a1a 932 .arg_scnprintf = { [0] = SCA_CLOSE_FD, /* fd */ }, },
a14bb860 933 { .name = "connect", .errmsg = true, },
75b757ca 934 { .name = "dup", .errmsg = true,
48000a1a 935 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 936 { .name = "dup2", .errmsg = true,
48000a1a 937 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 938 { .name = "dup3", .errmsg = true,
48000a1a 939 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
453350dd 940 { .name = "epoll_ctl", .errmsg = true, STRARRAY(1, op, epoll_ctl_ops), },
49af9e93
ACM
941 { .name = "eventfd2", .errmsg = true,
942 .arg_scnprintf = { [1] = SCA_EFD_FLAGS, /* flags */ }, },
75b757ca
ACM
943 { .name = "faccessat", .errmsg = true,
944 .arg_scnprintf = { [0] = SCA_FDAT, /* dfd */ }, },
945 { .name = "fadvise64", .errmsg = true,
48000a1a 946 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 947 { .name = "fallocate", .errmsg = true,
48000a1a 948 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 949 { .name = "fchdir", .errmsg = true,
48000a1a 950 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 951 { .name = "fchmod", .errmsg = true,
48000a1a 952 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 953 { .name = "fchmodat", .errmsg = true,
48000a1a 954 .arg_scnprintf = { [0] = SCA_FDAT, /* fd */ }, },
75b757ca 955 { .name = "fchown", .errmsg = true,
48000a1a 956 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 957 { .name = "fchownat", .errmsg = true,
48000a1a 958 .arg_scnprintf = { [0] = SCA_FDAT, /* fd */ }, },
75b757ca
ACM
959 { .name = "fcntl", .errmsg = true,
960 .arg_scnprintf = { [0] = SCA_FD, /* fd */
961 [1] = SCA_STRARRAY, /* cmd */ },
962 .arg_parm = { [1] = &strarray__fcntl_cmds, /* cmd */ }, },
963 { .name = "fdatasync", .errmsg = true,
48000a1a 964 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
5cea6ff2 965 { .name = "flock", .errmsg = true,
75b757ca
ACM
966 .arg_scnprintf = { [0] = SCA_FD, /* fd */
967 [1] = SCA_FLOCK, /* cmd */ }, },
968 { .name = "fsetxattr", .errmsg = true,
48000a1a 969 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 970 { .name = "fstat", .errmsg = true, .alias = "newfstat",
48000a1a 971 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 972 { .name = "fstatat", .errmsg = true, .alias = "newfstatat",
48000a1a 973 .arg_scnprintf = { [0] = SCA_FDAT, /* dfd */ }, },
75b757ca 974 { .name = "fstatfs", .errmsg = true,
48000a1a 975 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 976 { .name = "fsync", .errmsg = true,
48000a1a 977 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 978 { .name = "ftruncate", .errmsg = true,
48000a1a 979 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
f9da0b0c
ACM
980 { .name = "futex", .errmsg = true,
981 .arg_scnprintf = { [1] = SCA_FUTEX_OP, /* op */ }, },
75b757ca 982 { .name = "futimesat", .errmsg = true,
48000a1a 983 .arg_scnprintf = { [0] = SCA_FDAT, /* fd */ }, },
75b757ca 984 { .name = "getdents", .errmsg = true,
48000a1a 985 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 986 { .name = "getdents64", .errmsg = true,
48000a1a 987 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
453350dd
ACM
988 { .name = "getitimer", .errmsg = true, STRARRAY(0, which, itimers), },
989 { .name = "getrlimit", .errmsg = true, STRARRAY(0, resource, rlimit_resources), },
beccb2b5 990 { .name = "ioctl", .errmsg = true,
48000a1a 991 .arg_scnprintf = { [0] = SCA_FD, /* fd */
844ae5b4
ACM
992#if defined(__i386__) || defined(__x86_64__)
993/*
994 * FIXME: Make this available to all arches.
995 */
78645cf3
ACM
996 [1] = SCA_STRHEXARRAY, /* cmd */
997 [2] = SCA_HEX, /* arg */ },
998 .arg_parm = { [1] = &strarray__tioctls, /* cmd */ }, },
844ae5b4
ACM
999#else
1000 [2] = SCA_HEX, /* arg */ }, },
1001#endif
8bad5b0a
ACM
1002 { .name = "kill", .errmsg = true,
1003 .arg_scnprintf = { [1] = SCA_SIGNUM, /* sig */ }, },
75b757ca 1004 { .name = "linkat", .errmsg = true,
48000a1a 1005 .arg_scnprintf = { [0] = SCA_FDAT, /* fd */ }, },
75b757ca
ACM
1006 { .name = "lseek", .errmsg = true,
1007 .arg_scnprintf = { [0] = SCA_FD, /* fd */
1008 [2] = SCA_STRARRAY, /* whence */ },
1009 .arg_parm = { [2] = &strarray__whences, /* whence */ }, },
e5959683 1010 { .name = "lstat", .errmsg = true, .alias = "newlstat", },
9e9716d1
ACM
1011 { .name = "madvise", .errmsg = true,
1012 .arg_scnprintf = { [0] = SCA_HEX, /* start */
1013 [2] = SCA_MADV_BHV, /* behavior */ }, },
75b757ca 1014 { .name = "mkdirat", .errmsg = true,
48000a1a 1015 .arg_scnprintf = { [0] = SCA_FDAT, /* fd */ }, },
75b757ca 1016 { .name = "mknodat", .errmsg = true,
48000a1a 1017 .arg_scnprintf = { [0] = SCA_FDAT, /* fd */ }, },
3d903aa7
ACM
1018 { .name = "mlock", .errmsg = true,
1019 .arg_scnprintf = { [0] = SCA_HEX, /* addr */ }, },
1020 { .name = "mlockall", .errmsg = true,
1021 .arg_scnprintf = { [0] = SCA_HEX, /* addr */ }, },
beccb2b5 1022 { .name = "mmap", .hexret = true,
ae685380 1023 .arg_scnprintf = { [0] = SCA_HEX, /* addr */
941557e0 1024 [2] = SCA_MMAP_PROT, /* prot */
73faab3a
NK
1025 [3] = SCA_MMAP_FLAGS, /* flags */
1026 [4] = SCA_FD, /* fd */ }, },
beccb2b5 1027 { .name = "mprotect", .errmsg = true,
ae685380
ACM
1028 .arg_scnprintf = { [0] = SCA_HEX, /* start */
1029 [2] = SCA_MMAP_PROT, /* prot */ }, },
1030 { .name = "mremap", .hexret = true,
1031 .arg_scnprintf = { [0] = SCA_HEX, /* addr */
86998dda 1032 [3] = SCA_MREMAP_FLAGS, /* flags */
ae685380 1033 [4] = SCA_HEX, /* new_addr */ }, },
3d903aa7
ACM
1034 { .name = "munlock", .errmsg = true,
1035 .arg_scnprintf = { [0] = SCA_HEX, /* addr */ }, },
beccb2b5
ACM
1036 { .name = "munmap", .errmsg = true,
1037 .arg_scnprintf = { [0] = SCA_HEX, /* addr */ }, },
75b757ca 1038 { .name = "name_to_handle_at", .errmsg = true,
48000a1a 1039 .arg_scnprintf = { [0] = SCA_FDAT, /* dfd */ }, },
75b757ca 1040 { .name = "newfstatat", .errmsg = true,
48000a1a 1041 .arg_scnprintf = { [0] = SCA_FDAT, /* dfd */ }, },
be65a89a
ACM
1042 { .name = "open", .errmsg = true,
1043 .arg_scnprintf = { [1] = SCA_OPEN_FLAGS, /* flags */ }, },
31cd3855 1044 { .name = "open_by_handle_at", .errmsg = true,
75b757ca
ACM
1045 .arg_scnprintf = { [0] = SCA_FDAT, /* dfd */
1046 [2] = SCA_OPEN_FLAGS, /* flags */ }, },
31cd3855 1047 { .name = "openat", .errmsg = true,
75b757ca
ACM
1048 .arg_scnprintf = { [0] = SCA_FDAT, /* dfd */
1049 [2] = SCA_OPEN_FLAGS, /* flags */ }, },
46cce19b
ACM
1050 { .name = "pipe2", .errmsg = true,
1051 .arg_scnprintf = { [1] = SCA_PIPE_FLAGS, /* flags */ }, },
aec1930b
ACM
1052 { .name = "poll", .errmsg = true, .timeout = true, },
1053 { .name = "ppoll", .errmsg = true, .timeout = true, },
75b757ca 1054 { .name = "pread", .errmsg = true, .alias = "pread64",
48000a1a 1055 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 1056 { .name = "preadv", .errmsg = true, .alias = "pread",
48000a1a 1057 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
453350dd 1058 { .name = "prlimit64", .errmsg = true, STRARRAY(1, resource, rlimit_resources), },
75b757ca 1059 { .name = "pwrite", .errmsg = true, .alias = "pwrite64",
48000a1a 1060 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 1061 { .name = "pwritev", .errmsg = true,
48000a1a 1062 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 1063 { .name = "read", .errmsg = true,
48000a1a 1064 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 1065 { .name = "readlinkat", .errmsg = true,
48000a1a 1066 .arg_scnprintf = { [0] = SCA_FDAT, /* dfd */ }, },
75b757ca 1067 { .name = "readv", .errmsg = true,
48000a1a 1068 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
b2cc99fd
ACM
1069 { .name = "recvfrom", .errmsg = true,
1070 .arg_scnprintf = { [3] = SCA_MSG_FLAGS, /* flags */ }, },
1071 { .name = "recvmmsg", .errmsg = true,
1072 .arg_scnprintf = { [3] = SCA_MSG_FLAGS, /* flags */ }, },
1073 { .name = "recvmsg", .errmsg = true,
1074 .arg_scnprintf = { [2] = SCA_MSG_FLAGS, /* flags */ }, },
75b757ca 1075 { .name = "renameat", .errmsg = true,
48000a1a 1076 .arg_scnprintf = { [0] = SCA_FDAT, /* dfd */ }, },
8bad5b0a
ACM
1077 { .name = "rt_sigaction", .errmsg = true,
1078 .arg_scnprintf = { [0] = SCA_SIGNUM, /* sig */ }, },
453350dd 1079 { .name = "rt_sigprocmask", .errmsg = true, STRARRAY(0, how, sighow), },
8bad5b0a
ACM
1080 { .name = "rt_sigqueueinfo", .errmsg = true,
1081 .arg_scnprintf = { [1] = SCA_SIGNUM, /* sig */ }, },
1082 { .name = "rt_tgsigqueueinfo", .errmsg = true,
1083 .arg_scnprintf = { [2] = SCA_SIGNUM, /* sig */ }, },
aec1930b 1084 { .name = "select", .errmsg = true, .timeout = true, },
b2cc99fd
ACM
1085 { .name = "sendmmsg", .errmsg = true,
1086 .arg_scnprintf = { [3] = SCA_MSG_FLAGS, /* flags */ }, },
1087 { .name = "sendmsg", .errmsg = true,
1088 .arg_scnprintf = { [2] = SCA_MSG_FLAGS, /* flags */ }, },
1089 { .name = "sendto", .errmsg = true,
1090 .arg_scnprintf = { [3] = SCA_MSG_FLAGS, /* flags */ }, },
453350dd
ACM
1091 { .name = "setitimer", .errmsg = true, STRARRAY(0, which, itimers), },
1092 { .name = "setrlimit", .errmsg = true, STRARRAY(0, resource, rlimit_resources), },
75b757ca 1093 { .name = "shutdown", .errmsg = true,
48000a1a 1094 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
e10bce81 1095 { .name = "socket", .errmsg = true,
a28b24b2
ACM
1096 .arg_scnprintf = { [0] = SCA_STRARRAY, /* family */
1097 [1] = SCA_SK_TYPE, /* type */ },
07120aa5
ACM
1098 .arg_parm = { [0] = &strarray__socket_families, /* family */ }, },
1099 { .name = "socketpair", .errmsg = true,
1100 .arg_scnprintf = { [0] = SCA_STRARRAY, /* family */
1101 [1] = SCA_SK_TYPE, /* type */ },
e10bce81 1102 .arg_parm = { [0] = &strarray__socket_families, /* family */ }, },
aec1930b 1103 { .name = "stat", .errmsg = true, .alias = "newstat", },
75b757ca 1104 { .name = "symlinkat", .errmsg = true,
48000a1a 1105 .arg_scnprintf = { [0] = SCA_FDAT, /* dfd */ }, },
8bad5b0a
ACM
1106 { .name = "tgkill", .errmsg = true,
1107 .arg_scnprintf = { [2] = SCA_SIGNUM, /* sig */ }, },
1108 { .name = "tkill", .errmsg = true,
1109 .arg_scnprintf = { [1] = SCA_SIGNUM, /* sig */ }, },
e5959683 1110 { .name = "uname", .errmsg = true, .alias = "newuname", },
75b757ca
ACM
1111 { .name = "unlinkat", .errmsg = true,
1112 .arg_scnprintf = { [0] = SCA_FDAT, /* dfd */ }, },
1113 { .name = "utimensat", .errmsg = true,
1114 .arg_scnprintf = { [0] = SCA_FDAT, /* dirfd */ }, },
1115 { .name = "write", .errmsg = true,
48000a1a 1116 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
75b757ca 1117 { .name = "writev", .errmsg = true,
48000a1a 1118 .arg_scnprintf = { [0] = SCA_FD, /* fd */ }, },
514f1c67
ACM
1119};
1120
1121static int syscall_fmt__cmp(const void *name, const void *fmtp)
1122{
1123 const struct syscall_fmt *fmt = fmtp;
1124 return strcmp(name, fmt->name);
1125}
1126
1127static struct syscall_fmt *syscall_fmt__find(const char *name)
1128{
1129 const int nmemb = ARRAY_SIZE(syscall_fmts);
1130 return bsearch(name, syscall_fmts, nmemb, sizeof(struct syscall_fmt), syscall_fmt__cmp);
1131}
1132
/* Per-syscall-number information, filled in by trace__read_syscall_info(). */
struct syscall {
	/* "syscalls:sys_enter_<name>" (or alias) tracepoint format */
	struct event_format *tp_format;
	/* name returned by audit_syscall_to_name() */
	const char	    *name;
	/* excluded by the event qualifier list */
	bool		    filtered;
	/* true for "exit" and "exit_group" */
	bool		    is_exit;
	/* matching syscall_fmts[] entry, NULL if none */
	struct syscall_fmt  *fmt;
	/* per-argument formatters, one slot per tracepoint argument */
	size_t		    (**arg_scnprintf)(char *bf, size_t size, struct syscall_arg *arg);
	/* per-argument formatter parameters, borrowed from fmt->arg_parm */
	void		    **arg_parm;
};
1142
60c907ab
ACM
1143static size_t fprintf_duration(unsigned long t, FILE *fp)
1144{
1145 double duration = (double)t / NSEC_PER_MSEC;
1146 size_t printed = fprintf(fp, "(");
1147
1148 if (duration >= 1.0)
1149 printed += color_fprintf(fp, PERF_COLOR_RED, "%6.3f ms", duration);
1150 else if (duration >= 0.01)
1151 printed += color_fprintf(fp, PERF_COLOR_YELLOW, "%6.3f ms", duration);
1152 else
1153 printed += color_fprintf(fp, PERF_COLOR_NORMAL, "%6.3f ms", duration);
c24ff998 1154 return printed + fprintf(fp, "): ");
60c907ab
ACM
1155}
1156
752fde44
ACM
1157struct thread_trace {
1158 u64 entry_time;
1159 u64 exit_time;
1160 bool entry_pending;
efd5745e 1161 unsigned long nr_events;
a2ea67d7 1162 unsigned long pfmaj, pfmin;
752fde44 1163 char *entry_str;
1302d88e 1164 double runtime_ms;
75b757ca
ACM
1165 struct {
1166 int max;
1167 char **table;
1168 } paths;
bf2575c1
DA
1169
1170 struct intlist *syscall_stats;
752fde44
ACM
1171};
1172
1173static struct thread_trace *thread_trace__new(void)
1174{
75b757ca
ACM
1175 struct thread_trace *ttrace = zalloc(sizeof(struct thread_trace));
1176
1177 if (ttrace)
1178 ttrace->paths.max = -1;
1179
bf2575c1
DA
1180 ttrace->syscall_stats = intlist__new(NULL);
1181
75b757ca 1182 return ttrace;
752fde44
ACM
1183}
1184
c24ff998 1185static struct thread_trace *thread__trace(struct thread *thread, FILE *fp)
752fde44 1186{
efd5745e
ACM
1187 struct thread_trace *ttrace;
1188
752fde44
ACM
1189 if (thread == NULL)
1190 goto fail;
1191
89dceb22
NK
1192 if (thread__priv(thread) == NULL)
1193 thread__set_priv(thread, thread_trace__new());
48000a1a 1194
89dceb22 1195 if (thread__priv(thread) == NULL)
752fde44
ACM
1196 goto fail;
1197
89dceb22 1198 ttrace = thread__priv(thread);
efd5745e
ACM
1199 ++ttrace->nr_events;
1200
1201 return ttrace;
752fde44 1202fail:
c24ff998 1203 color_fprintf(fp, PERF_COLOR_RED,
752fde44
ACM
1204 "WARNING: not enough memory, dropping samples!\n");
1205 return NULL;
1206}
1207
598d02c5
SF
1208#define TRACE_PFMAJ (1 << 0)
1209#define TRACE_PFMIN (1 << 1)
1210
514f1c67 1211struct trace {
c24ff998 1212 struct perf_tool tool;
c522739d
ACM
1213 struct {
1214 int machine;
1215 int open_id;
1216 } audit;
514f1c67
ACM
1217 struct {
1218 int max;
1219 struct syscall *table;
1220 } syscalls;
b4006796 1221 struct record_opts opts;
14a052df 1222 struct perf_evlist *evlist;
8fb598e5 1223 struct machine *host;
e596663e 1224 struct thread *current;
752fde44 1225 u64 base_time;
c24ff998 1226 FILE *output;
efd5745e 1227 unsigned long nr_events;
b059efdf 1228 struct strlist *ev_qualifier;
c522739d 1229 const char *last_vfs_getname;
bdc89661
DA
1230 struct intlist *tid_list;
1231 struct intlist *pid_list;
98eafce6
ACM
1232 double duration_filter;
1233 double runtime_ms;
1234 struct {
1235 u64 vfs_getname,
1236 proc_getname;
1237 } stats;
1238 bool not_ev_qualifier;
1239 bool live;
1240 bool full_time;
1302d88e 1241 bool sched;
752fde44 1242 bool multiple_threads;
bf2575c1 1243 bool summary;
fd2eabaf 1244 bool summary_only;
50c95cbd 1245 bool show_comm;
c522739d 1246 bool show_tool_stats;
e281a960 1247 bool trace_syscalls;
598d02c5 1248 int trace_pgfaults;
514f1c67
ACM
1249};
1250
97119f37 1251static int trace__set_fd_pathname(struct thread *thread, int fd, const char *pathname)
75b757ca 1252{
89dceb22 1253 struct thread_trace *ttrace = thread__priv(thread);
75b757ca
ACM
1254
1255 if (fd > ttrace->paths.max) {
1256 char **npath = realloc(ttrace->paths.table, (fd + 1) * sizeof(char *));
1257
1258 if (npath == NULL)
1259 return -1;
1260
1261 if (ttrace->paths.max != -1) {
1262 memset(npath + ttrace->paths.max + 1, 0,
1263 (fd - ttrace->paths.max) * sizeof(char *));
1264 } else {
1265 memset(npath, 0, (fd + 1) * sizeof(char *));
1266 }
1267
1268 ttrace->paths.table = npath;
1269 ttrace->paths.max = fd;
1270 }
1271
1272 ttrace->paths.table[fd] = strdup(pathname);
1273
1274 return ttrace->paths.table[fd] != NULL ? 0 : -1;
1275}
1276
97119f37
ACM
1277static int thread__read_fd_path(struct thread *thread, int fd)
1278{
1279 char linkname[PATH_MAX], pathname[PATH_MAX];
1280 struct stat st;
1281 int ret;
1282
1283 if (thread->pid_ == thread->tid) {
1284 scnprintf(linkname, sizeof(linkname),
1285 "/proc/%d/fd/%d", thread->pid_, fd);
1286 } else {
1287 scnprintf(linkname, sizeof(linkname),
1288 "/proc/%d/task/%d/fd/%d", thread->pid_, thread->tid, fd);
1289 }
1290
1291 if (lstat(linkname, &st) < 0 || st.st_size + 1 > (off_t)sizeof(pathname))
1292 return -1;
1293
1294 ret = readlink(linkname, pathname, sizeof(pathname));
1295
1296 if (ret < 0 || ret > st.st_size)
1297 return -1;
1298
1299 pathname[ret] = '\0';
1300 return trace__set_fd_pathname(thread, fd, pathname);
1301}
1302
c522739d
ACM
1303static const char *thread__fd_path(struct thread *thread, int fd,
1304 struct trace *trace)
75b757ca 1305{
89dceb22 1306 struct thread_trace *ttrace = thread__priv(thread);
75b757ca
ACM
1307
1308 if (ttrace == NULL)
1309 return NULL;
1310
1311 if (fd < 0)
1312 return NULL;
1313
cdcd1e6b 1314 if ((fd > ttrace->paths.max || ttrace->paths.table[fd] == NULL)) {
c522739d
ACM
1315 if (!trace->live)
1316 return NULL;
1317 ++trace->stats.proc_getname;
cdcd1e6b 1318 if (thread__read_fd_path(thread, fd))
c522739d
ACM
1319 return NULL;
1320 }
75b757ca
ACM
1321
1322 return ttrace->paths.table[fd];
1323}
1324
1325static size_t syscall_arg__scnprintf_fd(char *bf, size_t size,
1326 struct syscall_arg *arg)
1327{
1328 int fd = arg->val;
1329 size_t printed = scnprintf(bf, size, "%d", fd);
c522739d 1330 const char *path = thread__fd_path(arg->thread, fd, arg->trace);
75b757ca
ACM
1331
1332 if (path)
1333 printed += scnprintf(bf + printed, size - printed, "<%s>", path);
1334
1335 return printed;
1336}
1337
1338static size_t syscall_arg__scnprintf_close_fd(char *bf, size_t size,
1339 struct syscall_arg *arg)
1340{
1341 int fd = arg->val;
1342 size_t printed = syscall_arg__scnprintf_fd(bf, size, arg);
89dceb22 1343 struct thread_trace *ttrace = thread__priv(arg->thread);
75b757ca 1344
04662523
ACM
1345 if (ttrace && fd >= 0 && fd <= ttrace->paths.max)
1346 zfree(&ttrace->paths.table[fd]);
75b757ca
ACM
1347
1348 return printed;
1349}
1350
ae9ed035
ACM
1351static bool trace__filter_duration(struct trace *trace, double t)
1352{
1353 return t < (trace->duration_filter * NSEC_PER_MSEC);
1354}
1355
752fde44
ACM
1356static size_t trace__fprintf_tstamp(struct trace *trace, u64 tstamp, FILE *fp)
1357{
1358 double ts = (double)(tstamp - trace->base_time) / NSEC_PER_MSEC;
1359
60c907ab 1360 return fprintf(fp, "%10.3f ", ts);
752fde44
ACM
1361}
1362
/*
 * Flags set from the signal handler. They are volatile sig_atomic_t because
 * that is the only object type the C standard lets a handler store to with
 * a well-defined result, and because volatile stops the compiler from
 * caching them in code that polls the flags.
 */
static volatile sig_atomic_t done = false;
static volatile sig_atomic_t interrupted = false;

/*
 * Signal handler: request termination, and record whether the request came
 * from SIGINT.
 */
static void sig_handler(int sig)
{
	done = true;
	interrupted = sig == SIGINT;
}
1371
752fde44 1372static size_t trace__fprintf_entry_head(struct trace *trace, struct thread *thread,
60c907ab 1373 u64 duration, u64 tstamp, FILE *fp)
752fde44
ACM
1374{
1375 size_t printed = trace__fprintf_tstamp(trace, tstamp, fp);
60c907ab 1376 printed += fprintf_duration(duration, fp);
752fde44 1377
50c95cbd
ACM
1378 if (trace->multiple_threads) {
1379 if (trace->show_comm)
1902efe7 1380 printed += fprintf(fp, "%.14s/", thread__comm_str(thread));
38051234 1381 printed += fprintf(fp, "%d ", thread->tid);
50c95cbd 1382 }
752fde44
ACM
1383
1384 return printed;
1385}
1386
c24ff998 1387static int trace__process_event(struct trace *trace, struct machine *machine,
162f0bef 1388 union perf_event *event, struct perf_sample *sample)
752fde44
ACM
1389{
1390 int ret = 0;
1391
1392 switch (event->header.type) {
1393 case PERF_RECORD_LOST:
c24ff998 1394 color_fprintf(trace->output, PERF_COLOR_RED,
752fde44 1395 "LOST %" PRIu64 " events!\n", event->lost.lost);
162f0bef 1396 ret = machine__process_lost_event(machine, event, sample);
752fde44 1397 default:
162f0bef 1398 ret = machine__process_event(machine, event, sample);
752fde44
ACM
1399 break;
1400 }
1401
1402 return ret;
1403}
1404
c24ff998 1405static int trace__tool_process(struct perf_tool *tool,
752fde44 1406 union perf_event *event,
162f0bef 1407 struct perf_sample *sample,
752fde44
ACM
1408 struct machine *machine)
1409{
c24ff998 1410 struct trace *trace = container_of(tool, struct trace, tool);
162f0bef 1411 return trace__process_event(trace, machine, event, sample);
752fde44
ACM
1412}
1413
1414static int trace__symbols_init(struct trace *trace, struct perf_evlist *evlist)
1415{
0a7e6d1b 1416 int err = symbol__init(NULL);
752fde44
ACM
1417
1418 if (err)
1419 return err;
1420
8fb598e5
DA
1421 trace->host = machine__new_host();
1422 if (trace->host == NULL)
1423 return -ENOMEM;
752fde44 1424
a33fbd56
ACM
1425 err = __machine__synthesize_threads(trace->host, &trace->tool, &trace->opts.target,
1426 evlist->threads, trace__tool_process, false);
752fde44
ACM
1427 if (err)
1428 symbol__exit();
1429
1430 return err;
1431}
1432
13d4ff3e
ACM
1433static int syscall__set_arg_fmts(struct syscall *sc)
1434{
1435 struct format_field *field;
1436 int idx = 0;
1437
1438 sc->arg_scnprintf = calloc(sc->tp_format->format.nr_fields - 1, sizeof(void *));
1439 if (sc->arg_scnprintf == NULL)
1440 return -1;
1441
1f115cb7
ACM
1442 if (sc->fmt)
1443 sc->arg_parm = sc->fmt->arg_parm;
1444
13d4ff3e 1445 for (field = sc->tp_format->format.fields->next; field; field = field->next) {
beccb2b5
ACM
1446 if (sc->fmt && sc->fmt->arg_scnprintf[idx])
1447 sc->arg_scnprintf[idx] = sc->fmt->arg_scnprintf[idx];
1448 else if (field->flags & FIELD_IS_POINTER)
13d4ff3e
ACM
1449 sc->arg_scnprintf[idx] = syscall_arg__scnprintf_hex;
1450 ++idx;
1451 }
1452
1453 return 0;
1454}
1455
514f1c67
ACM
1456static int trace__read_syscall_info(struct trace *trace, int id)
1457{
1458 char tp_name[128];
1459 struct syscall *sc;
c522739d 1460 const char *name = audit_syscall_to_name(id, trace->audit.machine);
3a531260
ACM
1461
1462 if (name == NULL)
1463 return -1;
514f1c67
ACM
1464
1465 if (id > trace->syscalls.max) {
1466 struct syscall *nsyscalls = realloc(trace->syscalls.table, (id + 1) * sizeof(*sc));
1467
1468 if (nsyscalls == NULL)
1469 return -1;
1470
1471 if (trace->syscalls.max != -1) {
1472 memset(nsyscalls + trace->syscalls.max + 1, 0,
1473 (id - trace->syscalls.max) * sizeof(*sc));
1474 } else {
1475 memset(nsyscalls, 0, (id + 1) * sizeof(*sc));
1476 }
1477
1478 trace->syscalls.table = nsyscalls;
1479 trace->syscalls.max = id;
1480 }
1481
1482 sc = trace->syscalls.table + id;
3a531260 1483 sc->name = name;
2ae3a312 1484
b059efdf
ACM
1485 if (trace->ev_qualifier) {
1486 bool in = strlist__find(trace->ev_qualifier, name) != NULL;
1487
1488 if (!(in ^ trace->not_ev_qualifier)) {
1489 sc->filtered = true;
1490 /*
1491 * No need to do read tracepoint information since this will be
1492 * filtered out.
1493 */
1494 return 0;
1495 }
2ae3a312
ACM
1496 }
1497
3a531260 1498 sc->fmt = syscall_fmt__find(sc->name);
514f1c67 1499
aec1930b 1500 snprintf(tp_name, sizeof(tp_name), "sys_enter_%s", sc->name);
97978b3e 1501 sc->tp_format = trace_event__tp_format("syscalls", tp_name);
aec1930b
ACM
1502
1503 if (sc->tp_format == NULL && sc->fmt && sc->fmt->alias) {
1504 snprintf(tp_name, sizeof(tp_name), "sys_enter_%s", sc->fmt->alias);
97978b3e 1505 sc->tp_format = trace_event__tp_format("syscalls", tp_name);
aec1930b 1506 }
514f1c67 1507
13d4ff3e
ACM
1508 if (sc->tp_format == NULL)
1509 return -1;
1510
5089f20e
ACM
1511 sc->is_exit = !strcmp(name, "exit_group") || !strcmp(name, "exit");
1512
13d4ff3e 1513 return syscall__set_arg_fmts(sc);
514f1c67
ACM
1514}
1515
752fde44 1516static size_t syscall__scnprintf_args(struct syscall *sc, char *bf, size_t size,
75b757ca
ACM
1517 unsigned long *args, struct trace *trace,
1518 struct thread *thread)
514f1c67 1519{
514f1c67
ACM
1520 size_t printed = 0;
1521
1522 if (sc->tp_format != NULL) {
1523 struct format_field *field;
01533e97
ACM
1524 u8 bit = 1;
1525 struct syscall_arg arg = {
75b757ca
ACM
1526 .idx = 0,
1527 .mask = 0,
1528 .trace = trace,
1529 .thread = thread,
01533e97 1530 };
6e7eeb51
ACM
1531
1532 for (field = sc->tp_format->format.fields->next; field;
01533e97
ACM
1533 field = field->next, ++arg.idx, bit <<= 1) {
1534 if (arg.mask & bit)
6e7eeb51 1535 continue;
4aa58232
ACM
1536 /*
1537 * Suppress this argument if its value is zero and
1538 * and we don't have a string associated in an
1539 * strarray for it.
1540 */
1541 if (args[arg.idx] == 0 &&
1542 !(sc->arg_scnprintf &&
1543 sc->arg_scnprintf[arg.idx] == SCA_STRARRAY &&
1544 sc->arg_parm[arg.idx]))
22ae5cf1
ACM
1545 continue;
1546
752fde44 1547 printed += scnprintf(bf + printed, size - printed,
13d4ff3e 1548 "%s%s: ", printed ? ", " : "", field->name);
01533e97
ACM
1549 if (sc->arg_scnprintf && sc->arg_scnprintf[arg.idx]) {
1550 arg.val = args[arg.idx];
1f115cb7
ACM
1551 if (sc->arg_parm)
1552 arg.parm = sc->arg_parm[arg.idx];
01533e97
ACM
1553 printed += sc->arg_scnprintf[arg.idx](bf + printed,
1554 size - printed, &arg);
6e7eeb51 1555 } else {
13d4ff3e 1556 printed += scnprintf(bf + printed, size - printed,
01533e97 1557 "%ld", args[arg.idx]);
6e7eeb51 1558 }
514f1c67
ACM
1559 }
1560 } else {
01533e97
ACM
1561 int i = 0;
1562
514f1c67 1563 while (i < 6) {
752fde44
ACM
1564 printed += scnprintf(bf + printed, size - printed,
1565 "%sarg%d: %ld",
1566 printed ? ", " : "", i, args[i]);
514f1c67
ACM
1567 ++i;
1568 }
1569 }
1570
1571 return printed;
1572}
1573
/* Signature of the per-evsel sample handlers called by trace__process_sample(). */
typedef int (*tracepoint_handler)(struct trace *trace,
				  struct perf_evsel *evsel,
				  union perf_event *event,
				  struct perf_sample *sample);
1577
1578static struct syscall *trace__syscall_info(struct trace *trace,
bf2575c1 1579 struct perf_evsel *evsel, int id)
ba3d7dee 1580{
ba3d7dee
ACM
1581
1582 if (id < 0) {
adaa18bf
ACM
1583
1584 /*
1585 * XXX: Noticed on x86_64, reproduced as far back as 3.0.36, haven't tried
1586 * before that, leaving at a higher verbosity level till that is
1587 * explained. Reproduced with plain ftrace with:
1588 *
1589 * echo 1 > /t/events/raw_syscalls/sys_exit/enable
1590 * grep "NR -1 " /t/trace_pipe
1591 *
1592 * After generating some load on the machine.
1593 */
1594 if (verbose > 1) {
1595 static u64 n;
1596 fprintf(trace->output, "Invalid syscall %d id, skipping (%s, %" PRIu64 ") ...\n",
1597 id, perf_evsel__name(evsel), ++n);
1598 }
ba3d7dee
ACM
1599 return NULL;
1600 }
1601
1602 if ((id > trace->syscalls.max || trace->syscalls.table[id].name == NULL) &&
1603 trace__read_syscall_info(trace, id))
1604 goto out_cant_read;
1605
1606 if ((id > trace->syscalls.max || trace->syscalls.table[id].name == NULL))
1607 goto out_cant_read;
1608
1609 return &trace->syscalls.table[id];
1610
1611out_cant_read:
7c304ee0
ACM
1612 if (verbose) {
1613 fprintf(trace->output, "Problems reading syscall %d", id);
1614 if (id <= trace->syscalls.max && trace->syscalls.table[id].name != NULL)
1615 fprintf(trace->output, "(%s)", trace->syscalls.table[id].name);
1616 fputs(" information\n", trace->output);
1617 }
ba3d7dee
ACM
1618 return NULL;
1619}
1620
bf2575c1
DA
1621static void thread__update_stats(struct thread_trace *ttrace,
1622 int id, struct perf_sample *sample)
1623{
1624 struct int_node *inode;
1625 struct stats *stats;
1626 u64 duration = 0;
1627
1628 inode = intlist__findnew(ttrace->syscall_stats, id);
1629 if (inode == NULL)
1630 return;
1631
1632 stats = inode->priv;
1633 if (stats == NULL) {
1634 stats = malloc(sizeof(struct stats));
1635 if (stats == NULL)
1636 return;
1637 init_stats(stats);
1638 inode->priv = stats;
1639 }
1640
1641 if (ttrace->entry_time && sample->time > ttrace->entry_time)
1642 duration = sample->time - ttrace->entry_time;
1643
1644 update_stats(stats, duration);
1645}
1646
e596663e
ACM
1647static int trace__printf_interrupted_entry(struct trace *trace, struct perf_sample *sample)
1648{
1649 struct thread_trace *ttrace;
1650 u64 duration;
1651 size_t printed;
1652
1653 if (trace->current == NULL)
1654 return 0;
1655
1656 ttrace = thread__priv(trace->current);
1657
1658 if (!ttrace->entry_pending)
1659 return 0;
1660
1661 duration = sample->time - ttrace->entry_time;
1662
1663 printed = trace__fprintf_entry_head(trace, trace->current, duration, sample->time, trace->output);
1664 printed += fprintf(trace->output, "%-70s) ...\n", ttrace->entry_str);
1665 ttrace->entry_pending = false;
1666
1667 return printed;
1668}
1669
ba3d7dee 1670static int trace__sys_enter(struct trace *trace, struct perf_evsel *evsel,
0c82adcf 1671 union perf_event *event __maybe_unused,
ba3d7dee
ACM
1672 struct perf_sample *sample)
1673{
752fde44 1674 char *msg;
ba3d7dee 1675 void *args;
752fde44 1676 size_t printed = 0;
2ae3a312 1677 struct thread *thread;
77170988 1678 int id = perf_evsel__sc_tp_uint(evsel, id, sample);
bf2575c1 1679 struct syscall *sc = trace__syscall_info(trace, evsel, id);
2ae3a312
ACM
1680 struct thread_trace *ttrace;
1681
1682 if (sc == NULL)
1683 return -1;
ba3d7dee 1684
2ae3a312
ACM
1685 if (sc->filtered)
1686 return 0;
1687
8fb598e5 1688 thread = machine__findnew_thread(trace->host, sample->pid, sample->tid);
c24ff998 1689 ttrace = thread__trace(thread, trace->output);
2ae3a312 1690 if (ttrace == NULL)
ba3d7dee
ACM
1691 return -1;
1692
77170988 1693 args = perf_evsel__sc_tp_ptr(evsel, args, sample);
752fde44
ACM
1694
1695 if (ttrace->entry_str == NULL) {
1696 ttrace->entry_str = malloc(1024);
1697 if (!ttrace->entry_str)
1698 return -1;
1699 }
1700
e596663e
ACM
1701 printed += trace__printf_interrupted_entry(trace, sample);
1702
752fde44
ACM
1703 ttrace->entry_time = sample->time;
1704 msg = ttrace->entry_str;
1705 printed += scnprintf(msg + printed, 1024 - printed, "%s(", sc->name);
1706
75b757ca
ACM
1707 printed += syscall__scnprintf_args(sc, msg + printed, 1024 - printed,
1708 args, trace, thread);
752fde44 1709
5089f20e 1710 if (sc->is_exit) {
fd2eabaf 1711 if (!trace->duration_filter && !trace->summary_only) {
c24ff998
ACM
1712 trace__fprintf_entry_head(trace, thread, 1, sample->time, trace->output);
1713 fprintf(trace->output, "%-70s\n", ttrace->entry_str);
ae9ed035 1714 }
752fde44
ACM
1715 } else
1716 ttrace->entry_pending = true;
ba3d7dee 1717
e596663e
ACM
1718 trace->current = thread;
1719
ba3d7dee
ACM
1720 return 0;
1721}
1722
1723static int trace__sys_exit(struct trace *trace, struct perf_evsel *evsel,
0c82adcf 1724 union perf_event *event __maybe_unused,
ba3d7dee
ACM
1725 struct perf_sample *sample)
1726{
2c82c3ad 1727 long ret;
60c907ab 1728 u64 duration = 0;
2ae3a312 1729 struct thread *thread;
77170988 1730 int id = perf_evsel__sc_tp_uint(evsel, id, sample);
bf2575c1 1731 struct syscall *sc = trace__syscall_info(trace, evsel, id);
2ae3a312
ACM
1732 struct thread_trace *ttrace;
1733
1734 if (sc == NULL)
1735 return -1;
ba3d7dee 1736
2ae3a312
ACM
1737 if (sc->filtered)
1738 return 0;
1739
8fb598e5 1740 thread = machine__findnew_thread(trace->host, sample->pid, sample->tid);
c24ff998 1741 ttrace = thread__trace(thread, trace->output);
2ae3a312 1742 if (ttrace == NULL)
ba3d7dee
ACM
1743 return -1;
1744
bf2575c1
DA
1745 if (trace->summary)
1746 thread__update_stats(ttrace, id, sample);
1747
77170988 1748 ret = perf_evsel__sc_tp_uint(evsel, ret, sample);
ba3d7dee 1749
c522739d
ACM
1750 if (id == trace->audit.open_id && ret >= 0 && trace->last_vfs_getname) {
1751 trace__set_fd_pathname(thread, ret, trace->last_vfs_getname);
1752 trace->last_vfs_getname = NULL;
1753 ++trace->stats.vfs_getname;
1754 }
1755
752fde44
ACM
1756 ttrace->exit_time = sample->time;
1757
ae9ed035 1758 if (ttrace->entry_time) {
60c907ab 1759 duration = sample->time - ttrace->entry_time;
ae9ed035
ACM
1760 if (trace__filter_duration(trace, duration))
1761 goto out;
1762 } else if (trace->duration_filter)
1763 goto out;
60c907ab 1764
fd2eabaf
DA
1765 if (trace->summary_only)
1766 goto out;
1767
c24ff998 1768 trace__fprintf_entry_head(trace, thread, duration, sample->time, trace->output);
752fde44
ACM
1769
1770 if (ttrace->entry_pending) {
c24ff998 1771 fprintf(trace->output, "%-70s", ttrace->entry_str);
752fde44 1772 } else {
c24ff998
ACM
1773 fprintf(trace->output, " ... [");
1774 color_fprintf(trace->output, PERF_COLOR_YELLOW, "continued");
1775 fprintf(trace->output, "]: %s()", sc->name);
752fde44
ACM
1776 }
1777
da3c9a44
ACM
1778 if (sc->fmt == NULL) {
1779signed_print:
2c82c3ad 1780 fprintf(trace->output, ") = %ld", ret);
da3c9a44 1781 } else if (ret < 0 && sc->fmt->errmsg) {
942a91ed 1782 char bf[STRERR_BUFSIZE];
ba3d7dee
ACM
1783 const char *emsg = strerror_r(-ret, bf, sizeof(bf)),
1784 *e = audit_errno_to_name(-ret);
1785
c24ff998 1786 fprintf(trace->output, ") = -1 %s %s", e, emsg);
da3c9a44 1787 } else if (ret == 0 && sc->fmt->timeout)
c24ff998 1788 fprintf(trace->output, ") = 0 Timeout");
04b34729 1789 else if (sc->fmt->hexret)
2c82c3ad 1790 fprintf(trace->output, ") = %#lx", ret);
ba3d7dee 1791 else
da3c9a44 1792 goto signed_print;
ba3d7dee 1793
c24ff998 1794 fputc('\n', trace->output);
ae9ed035 1795out:
752fde44
ACM
1796 ttrace->entry_pending = false;
1797
ba3d7dee
ACM
1798 return 0;
1799}
1800
c522739d 1801static int trace__vfs_getname(struct trace *trace, struct perf_evsel *evsel,
0c82adcf 1802 union perf_event *event __maybe_unused,
c522739d
ACM
1803 struct perf_sample *sample)
1804{
1805 trace->last_vfs_getname = perf_evsel__rawptr(evsel, sample, "pathname");
1806 return 0;
1807}
1808
1302d88e 1809static int trace__sched_stat_runtime(struct trace *trace, struct perf_evsel *evsel,
0c82adcf 1810 union perf_event *event __maybe_unused,
1302d88e
ACM
1811 struct perf_sample *sample)
1812{
1813 u64 runtime = perf_evsel__intval(evsel, sample, "runtime");
1814 double runtime_ms = (double)runtime / NSEC_PER_MSEC;
8fb598e5 1815 struct thread *thread = machine__findnew_thread(trace->host,
314add6b
AH
1816 sample->pid,
1817 sample->tid);
c24ff998 1818 struct thread_trace *ttrace = thread__trace(thread, trace->output);
1302d88e
ACM
1819
1820 if (ttrace == NULL)
1821 goto out_dump;
1822
1823 ttrace->runtime_ms += runtime_ms;
1824 trace->runtime_ms += runtime_ms;
1825 return 0;
1826
1827out_dump:
c24ff998 1828 fprintf(trace->output, "%s: comm=%s,pid=%u,runtime=%" PRIu64 ",vruntime=%" PRIu64 ")\n",
1302d88e
ACM
1829 evsel->name,
1830 perf_evsel__strval(evsel, sample, "comm"),
1831 (pid_t)perf_evsel__intval(evsel, sample, "pid"),
1832 runtime,
1833 perf_evsel__intval(evsel, sample, "vruntime"));
1834 return 0;
1835}
1836
14a052df
ACM
1837static int trace__event_handler(struct trace *trace, struct perf_evsel *evsel,
1838 union perf_event *event __maybe_unused,
1839 struct perf_sample *sample)
1840{
1841 trace__printf_interrupted_entry(trace, sample);
1842 trace__fprintf_tstamp(trace, sample->time, trace->output);
0808921a
ACM
1843
1844 if (trace->trace_syscalls)
1845 fprintf(trace->output, "( ): ");
1846
1847 fprintf(trace->output, "%s:", evsel->name);
14a052df
ACM
1848
1849 if (evsel->tp_format) {
1850 event_format__fprintf(evsel->tp_format, sample->cpu,
1851 sample->raw_data, sample->raw_size,
1852 trace->output);
1853 }
1854
1855 fprintf(trace->output, ")\n");
1856 return 0;
1857}
1858
598d02c5
SF
1859static void print_location(FILE *f, struct perf_sample *sample,
1860 struct addr_location *al,
1861 bool print_dso, bool print_sym)
1862{
1863
1864 if ((verbose || print_dso) && al->map)
1865 fprintf(f, "%s@", al->map->dso->long_name);
1866
1867 if ((verbose || print_sym) && al->sym)
4414a3c5 1868 fprintf(f, "%s+0x%" PRIx64, al->sym->name,
598d02c5
SF
1869 al->addr - al->sym->start);
1870 else if (al->map)
4414a3c5 1871 fprintf(f, "0x%" PRIx64, al->addr);
598d02c5 1872 else
4414a3c5 1873 fprintf(f, "0x%" PRIx64, sample->addr);
598d02c5
SF
1874}
1875
1876static int trace__pgfault(struct trace *trace,
1877 struct perf_evsel *evsel,
1878 union perf_event *event,
1879 struct perf_sample *sample)
1880{
1881 struct thread *thread;
1882 u8 cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
1883 struct addr_location al;
1884 char map_type = 'd';
a2ea67d7 1885 struct thread_trace *ttrace;
598d02c5
SF
1886
1887 thread = machine__findnew_thread(trace->host, sample->pid, sample->tid);
a2ea67d7
SF
1888 ttrace = thread__trace(thread, trace->output);
1889 if (ttrace == NULL)
1890 return -1;
1891
1892 if (evsel->attr.config == PERF_COUNT_SW_PAGE_FAULTS_MAJ)
1893 ttrace->pfmaj++;
1894 else
1895 ttrace->pfmin++;
1896
1897 if (trace->summary_only)
1898 return 0;
598d02c5 1899
bb871a9c 1900 thread__find_addr_location(thread, cpumode, MAP__FUNCTION,
598d02c5
SF
1901 sample->ip, &al);
1902
1903 trace__fprintf_entry_head(trace, thread, 0, sample->time, trace->output);
1904
1905 fprintf(trace->output, "%sfault [",
1906 evsel->attr.config == PERF_COUNT_SW_PAGE_FAULTS_MAJ ?
1907 "maj" : "min");
1908
1909 print_location(trace->output, sample, &al, false, true);
1910
1911 fprintf(trace->output, "] => ");
1912
bb871a9c 1913 thread__find_addr_location(thread, cpumode, MAP__VARIABLE,
598d02c5
SF
1914 sample->addr, &al);
1915
1916 if (!al.map) {
bb871a9c 1917 thread__find_addr_location(thread, cpumode,
598d02c5
SF
1918 MAP__FUNCTION, sample->addr, &al);
1919
1920 if (al.map)
1921 map_type = 'x';
1922 else
1923 map_type = '?';
1924 }
1925
1926 print_location(trace->output, sample, &al, true, false);
1927
1928 fprintf(trace->output, " (%c%c)\n", map_type, al.level);
1929
1930 return 0;
1931}
1932
bdc89661
DA
1933static bool skip_sample(struct trace *trace, struct perf_sample *sample)
1934{
1935 if ((trace->pid_list && intlist__find(trace->pid_list, sample->pid)) ||
1936 (trace->tid_list && intlist__find(trace->tid_list, sample->tid)))
1937 return false;
1938
1939 if (trace->pid_list || trace->tid_list)
1940 return true;
1941
1942 return false;
1943}
1944
6810fc91 1945static int trace__process_sample(struct perf_tool *tool,
0c82adcf 1946 union perf_event *event,
6810fc91
DA
1947 struct perf_sample *sample,
1948 struct perf_evsel *evsel,
1949 struct machine *machine __maybe_unused)
1950{
1951 struct trace *trace = container_of(tool, struct trace, tool);
1952 int err = 0;
1953
744a9719 1954 tracepoint_handler handler = evsel->handler;
6810fc91 1955
bdc89661
DA
1956 if (skip_sample(trace, sample))
1957 return 0;
1958
4bb09192 1959 if (!trace->full_time && trace->base_time == 0)
6810fc91
DA
1960 trace->base_time = sample->time;
1961
3160565f
DA
1962 if (handler) {
1963 ++trace->nr_events;
0c82adcf 1964 handler(trace, evsel, event, sample);
3160565f 1965 }
6810fc91
DA
1966
1967 return err;
1968}
1969
bdc89661
DA
1970static int parse_target_str(struct trace *trace)
1971{
1972 if (trace->opts.target.pid) {
1973 trace->pid_list = intlist__new(trace->opts.target.pid);
1974 if (trace->pid_list == NULL) {
1975 pr_err("Error parsing process id string\n");
1976 return -EINVAL;
1977 }
1978 }
1979
1980 if (trace->opts.target.tid) {
1981 trace->tid_list = intlist__new(trace->opts.target.tid);
1982 if (trace->tid_list == NULL) {
1983 pr_err("Error parsing thread id string\n");
1984 return -EINVAL;
1985 }
1986 }
1987
1988 return 0;
1989}
1990
1e28fe0a 1991static int trace__record(struct trace *trace, int argc, const char **argv)
5e2485b1
DA
1992{
1993 unsigned int rec_argc, i, j;
1994 const char **rec_argv;
1995 const char * const record_args[] = {
1996 "record",
1997 "-R",
1998 "-m", "1024",
1999 "-c", "1",
5e2485b1
DA
2000 };
2001
1e28fe0a
SF
2002 const char * const sc_args[] = { "-e", };
2003 unsigned int sc_args_nr = ARRAY_SIZE(sc_args);
2004 const char * const majpf_args[] = { "-e", "major-faults" };
2005 unsigned int majpf_args_nr = ARRAY_SIZE(majpf_args);
2006 const char * const minpf_args[] = { "-e", "minor-faults" };
2007 unsigned int minpf_args_nr = ARRAY_SIZE(minpf_args);
2008
9aca7f17 2009 /* +1 is for the event string below */
1e28fe0a
SF
2010 rec_argc = ARRAY_SIZE(record_args) + sc_args_nr + 1 +
2011 majpf_args_nr + minpf_args_nr + argc;
5e2485b1
DA
2012 rec_argv = calloc(rec_argc + 1, sizeof(char *));
2013
2014 if (rec_argv == NULL)
2015 return -ENOMEM;
2016
1e28fe0a 2017 j = 0;
5e2485b1 2018 for (i = 0; i < ARRAY_SIZE(record_args); i++)
1e28fe0a
SF
2019 rec_argv[j++] = record_args[i];
2020
e281a960
SF
2021 if (trace->trace_syscalls) {
2022 for (i = 0; i < sc_args_nr; i++)
2023 rec_argv[j++] = sc_args[i];
2024
2025 /* event string may be different for older kernels - e.g., RHEL6 */
2026 if (is_valid_tracepoint("raw_syscalls:sys_enter"))
2027 rec_argv[j++] = "raw_syscalls:sys_enter,raw_syscalls:sys_exit";
2028 else if (is_valid_tracepoint("syscalls:sys_enter"))
2029 rec_argv[j++] = "syscalls:sys_enter,syscalls:sys_exit";
2030 else {
2031 pr_err("Neither raw_syscalls nor syscalls events exist.\n");
2032 return -1;
2033 }
9aca7f17 2034 }
9aca7f17 2035
1e28fe0a
SF
2036 if (trace->trace_pgfaults & TRACE_PFMAJ)
2037 for (i = 0; i < majpf_args_nr; i++)
2038 rec_argv[j++] = majpf_args[i];
2039
2040 if (trace->trace_pgfaults & TRACE_PFMIN)
2041 for (i = 0; i < minpf_args_nr; i++)
2042 rec_argv[j++] = minpf_args[i];
2043
2044 for (i = 0; i < (unsigned int)argc; i++)
2045 rec_argv[j++] = argv[i];
5e2485b1 2046
1e28fe0a 2047 return cmd_record(j, rec_argv, NULL);
5e2485b1
DA
2048}
2049
bf2575c1
DA
2050static size_t trace__fprintf_thread_summary(struct trace *trace, FILE *fp);
2051
c522739d
ACM
2052static void perf_evlist__add_vfs_getname(struct perf_evlist *evlist)
2053{
ef503831 2054 struct perf_evsel *evsel = perf_evsel__newtp("probe", "vfs_getname");
c522739d
ACM
2055 if (evsel == NULL)
2056 return;
2057
2058 if (perf_evsel__field(evsel, "pathname") == NULL) {
2059 perf_evsel__delete(evsel);
2060 return;
2061 }
2062
744a9719 2063 evsel->handler = trace__vfs_getname;
c522739d
ACM
2064 perf_evlist__add(evlist, evsel);
2065}
2066
598d02c5
SF
2067static int perf_evlist__add_pgfault(struct perf_evlist *evlist,
2068 u64 config)
2069{
2070 struct perf_evsel *evsel;
2071 struct perf_event_attr attr = {
2072 .type = PERF_TYPE_SOFTWARE,
2073 .mmap_data = 1,
598d02c5
SF
2074 };
2075
2076 attr.config = config;
0524798c 2077 attr.sample_period = 1;
598d02c5
SF
2078
2079 event_attr_init(&attr);
2080
2081 evsel = perf_evsel__new(&attr);
2082 if (!evsel)
2083 return -ENOMEM;
2084
2085 evsel->handler = trace__pgfault;
2086 perf_evlist__add(evlist, evsel);
2087
2088 return 0;
2089}
2090
f15eb531 2091static int trace__run(struct trace *trace, int argc, const char **argv)
514f1c67 2092{
14a052df 2093 struct perf_evlist *evlist = trace->evlist;
ba3d7dee 2094 struct perf_evsel *evsel;
efd5745e
ACM
2095 int err = -1, i;
2096 unsigned long before;
f15eb531 2097 const bool forks = argc > 0;
46fb3c21 2098 bool draining = false;
514f1c67 2099
75b757ca
ACM
2100 trace->live = true;
2101
e281a960
SF
2102 if (trace->trace_syscalls &&
2103 perf_evlist__add_syscall_newtp(evlist, trace__sys_enter,
2104 trace__sys_exit))
801c67b0 2105 goto out_error_raw_syscalls;
514f1c67 2106
e281a960
SF
2107 if (trace->trace_syscalls)
2108 perf_evlist__add_vfs_getname(evlist);
c522739d 2109
598d02c5 2110 if ((trace->trace_pgfaults & TRACE_PFMAJ) &&
e2726d99 2111 perf_evlist__add_pgfault(evlist, PERF_COUNT_SW_PAGE_FAULTS_MAJ)) {
5ed08dae 2112 goto out_error_mem;
e2726d99 2113 }
598d02c5
SF
2114
2115 if ((trace->trace_pgfaults & TRACE_PFMIN) &&
2116 perf_evlist__add_pgfault(evlist, PERF_COUNT_SW_PAGE_FAULTS_MIN))
5ed08dae 2117 goto out_error_mem;
598d02c5 2118
1302d88e 2119 if (trace->sched &&
2cc990ba
ACM
2120 perf_evlist__add_newtp(evlist, "sched", "sched_stat_runtime",
2121 trace__sched_stat_runtime))
2122 goto out_error_sched_stat_runtime;
1302d88e 2123
514f1c67
ACM
2124 err = perf_evlist__create_maps(evlist, &trace->opts.target);
2125 if (err < 0) {
c24ff998 2126 fprintf(trace->output, "Problems parsing the target to trace, check your options!\n");
514f1c67
ACM
2127 goto out_delete_evlist;
2128 }
2129
752fde44
ACM
2130 err = trace__symbols_init(trace, evlist);
2131 if (err < 0) {
c24ff998 2132 fprintf(trace->output, "Problems initializing symbol libraries!\n");
03ad9747 2133 goto out_delete_evlist;
752fde44
ACM
2134 }
2135
f77a9518 2136 perf_evlist__config(evlist, &trace->opts);
514f1c67 2137
f15eb531
NK
2138 signal(SIGCHLD, sig_handler);
2139 signal(SIGINT, sig_handler);
2140
2141 if (forks) {
6ef73ec4 2142 err = perf_evlist__prepare_workload(evlist, &trace->opts.target,
735f7e0b 2143 argv, false, NULL);
f15eb531 2144 if (err < 0) {
c24ff998 2145 fprintf(trace->output, "Couldn't run the workload!\n");
03ad9747 2146 goto out_delete_evlist;
f15eb531
NK
2147 }
2148 }
2149
514f1c67 2150 err = perf_evlist__open(evlist);
a8f23d8f
ACM
2151 if (err < 0)
2152 goto out_error_open;
514f1c67 2153
f885037e 2154 err = perf_evlist__mmap(evlist, trace->opts.mmap_pages, false);
e09b18d4
ACM
2155 if (err < 0)
2156 goto out_error_mmap;
514f1c67 2157
f15eb531
NK
2158 if (forks)
2159 perf_evlist__start_workload(evlist);
f7aa222f
ACM
2160 else
2161 perf_evlist__enable(evlist);
f15eb531 2162
42052bea
ACM
2163 trace->multiple_threads = evlist->threads->map[0] == -1 ||
2164 evlist->threads->nr > 1 ||
2165 perf_evlist__first(evlist)->attr.inherit;
514f1c67 2166again:
efd5745e 2167 before = trace->nr_events;
514f1c67
ACM
2168
2169 for (i = 0; i < evlist->nr_mmaps; i++) {
2170 union perf_event *event;
2171
2172 while ((event = perf_evlist__mmap_read(evlist, i)) != NULL) {
2173 const u32 type = event->header.type;
ba3d7dee 2174 tracepoint_handler handler;
514f1c67 2175 struct perf_sample sample;
514f1c67 2176
efd5745e 2177 ++trace->nr_events;
514f1c67 2178
514f1c67
ACM
2179 err = perf_evlist__parse_sample(evlist, event, &sample);
2180 if (err) {
c24ff998 2181 fprintf(trace->output, "Can't parse sample, err = %d, skipping...\n", err);
8e50d384 2182 goto next_event;
514f1c67
ACM
2183 }
2184
4bb09192 2185 if (!trace->full_time && trace->base_time == 0)
752fde44
ACM
2186 trace->base_time = sample.time;
2187
2188 if (type != PERF_RECORD_SAMPLE) {
162f0bef 2189 trace__process_event(trace, trace->host, event, &sample);
752fde44
ACM
2190 continue;
2191 }
2192
514f1c67
ACM
2193 evsel = perf_evlist__id2evsel(evlist, sample.id);
2194 if (evsel == NULL) {
c24ff998 2195 fprintf(trace->output, "Unknown tp ID %" PRIu64 ", skipping...\n", sample.id);
8e50d384 2196 goto next_event;
514f1c67
ACM
2197 }
2198
598d02c5
SF
2199 if (evsel->attr.type == PERF_TYPE_TRACEPOINT &&
2200 sample.raw_data == NULL) {
c24ff998 2201 fprintf(trace->output, "%s sample with no payload for tid: %d, cpu %d, raw_size=%d, skipping...\n",
fc551f8d
ACM
2202 perf_evsel__name(evsel), sample.tid,
2203 sample.cpu, sample.raw_size);
8e50d384 2204 goto next_event;
fc551f8d
ACM
2205 }
2206
744a9719 2207 handler = evsel->handler;
0c82adcf 2208 handler(trace, evsel, event, &sample);
8e50d384
ZZ
2209next_event:
2210 perf_evlist__mmap_consume(evlist, i);
20c5f10e 2211
ba209f85
ACM
2212 if (interrupted)
2213 goto out_disable;
514f1c67
ACM
2214 }
2215 }
2216
efd5745e 2217 if (trace->nr_events == before) {
ba209f85 2218 int timeout = done ? 100 : -1;
f15eb531 2219
46fb3c21
ACM
2220 if (!draining && perf_evlist__poll(evlist, timeout) > 0) {
2221 if (perf_evlist__filter_pollfd(evlist, POLLERR | POLLHUP) == 0)
2222 draining = true;
2223
ba209f85 2224 goto again;
46fb3c21 2225 }
ba209f85
ACM
2226 } else {
2227 goto again;
f15eb531
NK
2228 }
2229
ba209f85
ACM
2230out_disable:
2231 perf_evlist__disable(evlist);
514f1c67 2232
c522739d
ACM
2233 if (!err) {
2234 if (trace->summary)
2235 trace__fprintf_thread_summary(trace, trace->output);
2236
2237 if (trace->show_tool_stats) {
2238 fprintf(trace->output, "Stats:\n "
2239 " vfs_getname : %" PRIu64 "\n"
2240 " proc_getname: %" PRIu64 "\n",
2241 trace->stats.vfs_getname,
2242 trace->stats.proc_getname);
2243 }
2244 }
bf2575c1 2245
514f1c67
ACM
2246out_delete_evlist:
2247 perf_evlist__delete(evlist);
14a052df 2248 trace->evlist = NULL;
75b757ca 2249 trace->live = false;
514f1c67 2250 return err;
6ef068cb
ACM
2251{
2252 char errbuf[BUFSIZ];
a8f23d8f 2253
2cc990ba
ACM
2254out_error_sched_stat_runtime:
2255 debugfs__strerror_open_tp(errno, errbuf, sizeof(errbuf), "sched", "sched_stat_runtime");
2256 goto out_error;
2257
801c67b0 2258out_error_raw_syscalls:
2cc990ba 2259 debugfs__strerror_open_tp(errno, errbuf, sizeof(errbuf), "raw_syscalls", "sys_(enter|exit)");
a8f23d8f
ACM
2260 goto out_error;
2261
e09b18d4
ACM
2262out_error_mmap:
2263 perf_evlist__strerror_mmap(evlist, errno, errbuf, sizeof(errbuf));
2264 goto out_error;
2265
a8f23d8f
ACM
2266out_error_open:
2267 perf_evlist__strerror_open(evlist, errno, errbuf, sizeof(errbuf));
2268
2269out_error:
6ef068cb 2270 fprintf(trace->output, "%s\n", errbuf);
87f91868 2271 goto out_delete_evlist;
514f1c67 2272}
5ed08dae
ACM
2273out_error_mem:
2274 fprintf(trace->output, "Not enough memory to run!\n");
2275 goto out_delete_evlist;
a8f23d8f 2276}
514f1c67 2277
6810fc91
DA
2278static int trace__replay(struct trace *trace)
2279{
2280 const struct perf_evsel_str_handler handlers[] = {
c522739d 2281 { "probe:vfs_getname", trace__vfs_getname, },
6810fc91 2282 };
f5fc1412
JO
2283 struct perf_data_file file = {
2284 .path = input_name,
2285 .mode = PERF_DATA_MODE_READ,
2286 };
6810fc91 2287 struct perf_session *session;
003824e8 2288 struct perf_evsel *evsel;
6810fc91
DA
2289 int err = -1;
2290
2291 trace->tool.sample = trace__process_sample;
2292 trace->tool.mmap = perf_event__process_mmap;
384c671e 2293 trace->tool.mmap2 = perf_event__process_mmap2;
6810fc91
DA
2294 trace->tool.comm = perf_event__process_comm;
2295 trace->tool.exit = perf_event__process_exit;
2296 trace->tool.fork = perf_event__process_fork;
2297 trace->tool.attr = perf_event__process_attr;
2298 trace->tool.tracing_data = perf_event__process_tracing_data;
2299 trace->tool.build_id = perf_event__process_build_id;
2300
0a8cb85c 2301 trace->tool.ordered_events = true;
6810fc91
DA
2302 trace->tool.ordering_requires_timestamps = true;
2303
2304 /* add tid to output */
2305 trace->multiple_threads = true;
2306
f5fc1412 2307 session = perf_session__new(&file, false, &trace->tool);
6810fc91 2308 if (session == NULL)
52e02834 2309 return -1;
6810fc91 2310
0a7e6d1b 2311 if (symbol__init(&session->header.env) < 0)
cb2ffae2
NK
2312 goto out;
2313
8fb598e5
DA
2314 trace->host = &session->machines.host;
2315
6810fc91
DA
2316 err = perf_session__set_tracepoints_handlers(session, handlers);
2317 if (err)
2318 goto out;
2319
003824e8
NK
2320 evsel = perf_evlist__find_tracepoint_by_name(session->evlist,
2321 "raw_syscalls:sys_enter");
9aca7f17
DA
2322 /* older kernels have syscalls tp versus raw_syscalls */
2323 if (evsel == NULL)
2324 evsel = perf_evlist__find_tracepoint_by_name(session->evlist,
2325 "syscalls:sys_enter");
003824e8 2326
e281a960
SF
2327 if (evsel &&
2328 (perf_evsel__init_syscall_tp(evsel, trace__sys_enter) < 0 ||
2329 perf_evsel__init_sc_tp_ptr_field(evsel, args))) {
003824e8
NK
2330 pr_err("Error during initialize raw_syscalls:sys_enter event\n");
2331 goto out;
2332 }
2333
2334 evsel = perf_evlist__find_tracepoint_by_name(session->evlist,
2335 "raw_syscalls:sys_exit");
9aca7f17
DA
2336 if (evsel == NULL)
2337 evsel = perf_evlist__find_tracepoint_by_name(session->evlist,
2338 "syscalls:sys_exit");
e281a960
SF
2339 if (evsel &&
2340 (perf_evsel__init_syscall_tp(evsel, trace__sys_exit) < 0 ||
2341 perf_evsel__init_sc_tp_uint_field(evsel, ret))) {
003824e8 2342 pr_err("Error during initialize raw_syscalls:sys_exit event\n");
6810fc91
DA
2343 goto out;
2344 }
2345
1e28fe0a
SF
2346 evlist__for_each(session->evlist, evsel) {
2347 if (evsel->attr.type == PERF_TYPE_SOFTWARE &&
2348 (evsel->attr.config == PERF_COUNT_SW_PAGE_FAULTS_MAJ ||
2349 evsel->attr.config == PERF_COUNT_SW_PAGE_FAULTS_MIN ||
2350 evsel->attr.config == PERF_COUNT_SW_PAGE_FAULTS))
2351 evsel->handler = trace__pgfault;
2352 }
2353
bdc89661
DA
2354 err = parse_target_str(trace);
2355 if (err != 0)
2356 goto out;
2357
6810fc91
DA
2358 setup_pager();
2359
2360 err = perf_session__process_events(session, &trace->tool);
2361 if (err)
2362 pr_err("Failed to process events, error %d", err);
2363
bf2575c1
DA
2364 else if (trace->summary)
2365 trace__fprintf_thread_summary(trace, trace->output);
2366
6810fc91
DA
2367out:
2368 perf_session__delete(session);
2369
2370 return err;
2371}
2372
1302d88e
ACM
/*
 * Print the heading of the per-thread summary to @fp.
 *
 * Returns what fprintf() reported, converted to size_t.
 */
static size_t trace__fprintf_threads_header(FILE *fp)
{
	return fprintf(fp, "\n Summary of events:\n\n");
}
2381
2382static size_t thread__dump_stats(struct thread_trace *ttrace,
2383 struct trace *trace, FILE *fp)
2384{
2385 struct stats *stats;
2386 size_t printed = 0;
2387 struct syscall *sc;
2388 struct int_node *inode = intlist__first(ttrace->syscall_stats);
2389
2390 if (inode == NULL)
2391 return 0;
2392
2393 printed += fprintf(fp, "\n");
2394
27a778b5
PE
2395 printed += fprintf(fp, " syscall calls min avg max stddev\n");
2396 printed += fprintf(fp, " (msec) (msec) (msec) (%%)\n");
2397 printed += fprintf(fp, " --------------- -------- --------- --------- --------- ------\n");
99ff7150 2398
bf2575c1
DA
2399 /* each int_node is a syscall */
2400 while (inode) {
2401 stats = inode->priv;
2402 if (stats) {
2403 double min = (double)(stats->min) / NSEC_PER_MSEC;
2404 double max = (double)(stats->max) / NSEC_PER_MSEC;
2405 double avg = avg_stats(stats);
2406 double pct;
2407 u64 n = (u64) stats->n;
2408
2409 pct = avg ? 100.0 * stddev_stats(stats)/avg : 0.0;
2410 avg /= NSEC_PER_MSEC;
2411
2412 sc = &trace->syscalls.table[inode->i];
99ff7150 2413 printed += fprintf(fp, " %-15s", sc->name);
27a778b5 2414 printed += fprintf(fp, " %8" PRIu64 " %9.3f %9.3f",
7f7a4138 2415 n, min, avg);
27a778b5 2416 printed += fprintf(fp, " %9.3f %9.2f%%\n", max, pct);
bf2575c1
DA
2417 }
2418
2419 inode = intlist__next(inode);
2420 }
2421
2422 printed += fprintf(fp, "\n\n");
1302d88e
ACM
2423
2424 return printed;
2425}
2426
896cbb56
DA
/*
 * Context handed to trace__fprintf_one_thread() through the void *priv
 * argument of machine__for_each_thread().
 */
struct summary_data {
	FILE *fp;		/* stream the summary is written to */
	struct trace *trace;	/* tracer whose threads are being summarized */
	size_t printed;		/* running total of fprintf() results */
};
2433
2434static int trace__fprintf_one_thread(struct thread *thread, void *priv)
2435{
2436 struct summary_data *data = priv;
2437 FILE *fp = data->fp;
2438 size_t printed = data->printed;
2439 struct trace *trace = data->trace;
89dceb22 2440 struct thread_trace *ttrace = thread__priv(thread);
896cbb56
DA
2441 double ratio;
2442
2443 if (ttrace == NULL)
2444 return 0;
2445
2446 ratio = (double)ttrace->nr_events / trace->nr_events * 100.0;
2447
15e65c69 2448 printed += fprintf(fp, " %s (%d), ", thread__comm_str(thread), thread->tid);
99ff7150 2449 printed += fprintf(fp, "%lu events, ", ttrace->nr_events);
15e65c69 2450 printed += fprintf(fp, "%.1f%%", ratio);
a2ea67d7
SF
2451 if (ttrace->pfmaj)
2452 printed += fprintf(fp, ", %lu majfaults", ttrace->pfmaj);
2453 if (ttrace->pfmin)
2454 printed += fprintf(fp, ", %lu minfaults", ttrace->pfmin);
99ff7150 2455 printed += fprintf(fp, ", %.3f msec\n", ttrace->runtime_ms);
bf2575c1 2456 printed += thread__dump_stats(ttrace, trace, fp);
896cbb56
DA
2457
2458 data->printed += printed;
2459
2460 return 0;
2461}
2462
1302d88e
ACM
2463static size_t trace__fprintf_thread_summary(struct trace *trace, FILE *fp)
2464{
896cbb56
DA
2465 struct summary_data data = {
2466 .fp = fp,
2467 .trace = trace
2468 };
2469 data.printed = trace__fprintf_threads_header(fp);
1302d88e 2470
896cbb56
DA
2471 machine__for_each_thread(trace->host, trace__fprintf_one_thread, &data);
2472
2473 return data.printed;
1302d88e
ACM
2474}
2475
ae9ed035
ACM
2476static int trace__set_duration(const struct option *opt, const char *str,
2477 int unset __maybe_unused)
2478{
2479 struct trace *trace = opt->value;
2480
2481 trace->duration_filter = atof(str);
2482 return 0;
2483}
2484
c24ff998
ACM
2485static int trace__open_output(struct trace *trace, const char *filename)
2486{
2487 struct stat st;
2488
2489 if (!stat(filename, &st) && st.st_size) {
2490 char oldname[PATH_MAX];
2491
2492 scnprintf(oldname, sizeof(oldname), "%s.old", filename);
2493 unlink(oldname);
2494 rename(filename, oldname);
2495 }
2496
2497 trace->output = fopen(filename, "w");
2498
2499 return trace->output == NULL ? -errno : 0;
2500}
2501
598d02c5
SF
2502static int parse_pagefaults(const struct option *opt, const char *str,
2503 int unset __maybe_unused)
2504{
2505 int *trace_pgfaults = opt->value;
2506
2507 if (strcmp(str, "all") == 0)
2508 *trace_pgfaults |= TRACE_PFMAJ | TRACE_PFMIN;
2509 else if (strcmp(str, "maj") == 0)
2510 *trace_pgfaults |= TRACE_PFMAJ;
2511 else if (strcmp(str, "min") == 0)
2512 *trace_pgfaults |= TRACE_PFMIN;
2513 else
2514 return -1;
2515
2516 return 0;
2517}
2518
14a052df
ACM
2519static void evlist__set_evsel_handler(struct perf_evlist *evlist, void *handler)
2520{
2521 struct perf_evsel *evsel;
2522
2523 evlist__for_each(evlist, evsel)
2524 evsel->handler = handler;
2525}
2526
514f1c67
ACM
2527int cmd_trace(int argc, const char **argv, const char *prefix __maybe_unused)
2528{
2529 const char * const trace_usage[] = {
f15eb531
NK
2530 "perf trace [<options>] [<command>]",
2531 "perf trace [<options>] -- <command> [<options>]",
5e2485b1
DA
2532 "perf trace record [<options>] [<command>]",
2533 "perf trace record [<options>] -- <command> [<options>]",
514f1c67
ACM
2534 NULL
2535 };
2536 struct trace trace = {
c522739d
ACM
2537 .audit = {
2538 .machine = audit_detect_machine(),
2539 .open_id = audit_name_to_syscall("open", trace.audit.machine),
2540 },
514f1c67
ACM
2541 .syscalls = {
2542 . max = -1,
2543 },
2544 .opts = {
2545 .target = {
2546 .uid = UINT_MAX,
2547 .uses_mmap = true,
2548 },
2549 .user_freq = UINT_MAX,
2550 .user_interval = ULLONG_MAX,
509051ea 2551 .no_buffering = true,
38d5447d 2552 .mmap_pages = UINT_MAX,
514f1c67 2553 },
c24ff998 2554 .output = stdout,
50c95cbd 2555 .show_comm = true,
e281a960 2556 .trace_syscalls = true,
514f1c67 2557 };
c24ff998 2558 const char *output_name = NULL;
2ae3a312 2559 const char *ev_qualifier_str = NULL;
514f1c67 2560 const struct option trace_options[] = {
14a052df
ACM
2561 OPT_CALLBACK(0, "event", &trace.evlist, "event",
2562 "event selector. use 'perf list' to list available events",
2563 parse_events_option),
50c95cbd
ACM
2564 OPT_BOOLEAN(0, "comm", &trace.show_comm,
2565 "show the thread COMM next to its id"),
c522739d 2566 OPT_BOOLEAN(0, "tool_stats", &trace.show_tool_stats, "show tool stats"),
2ae3a312
ACM
2567 OPT_STRING('e', "expr", &ev_qualifier_str, "expr",
2568 "list of events to trace"),
c24ff998 2569 OPT_STRING('o', "output", &output_name, "file", "output file name"),
6810fc91 2570 OPT_STRING('i', "input", &input_name, "file", "Analyze events in file"),
514f1c67
ACM
2571 OPT_STRING('p', "pid", &trace.opts.target.pid, "pid",
2572 "trace events on existing process id"),
ac9be8ee 2573 OPT_STRING('t', "tid", &trace.opts.target.tid, "tid",
514f1c67 2574 "trace events on existing thread id"),
ac9be8ee 2575 OPT_BOOLEAN('a', "all-cpus", &trace.opts.target.system_wide,
514f1c67 2576 "system-wide collection from all CPUs"),
ac9be8ee 2577 OPT_STRING('C', "cpu", &trace.opts.target.cpu_list, "cpu",
514f1c67 2578 "list of cpus to monitor"),
6810fc91 2579 OPT_BOOLEAN(0, "no-inherit", &trace.opts.no_inherit,
514f1c67 2580 "child tasks do not inherit counters"),
994a1f78
JO
2581 OPT_CALLBACK('m', "mmap-pages", &trace.opts.mmap_pages, "pages",
2582 "number of mmap data pages",
2583 perf_evlist__parse_mmap_pages),
ac9be8ee 2584 OPT_STRING('u', "uid", &trace.opts.target.uid_str, "user",
514f1c67 2585 "user to profile"),
ae9ed035
ACM
2586 OPT_CALLBACK(0, "duration", &trace, "float",
2587 "show only events with duration > N.M ms",
2588 trace__set_duration),
1302d88e 2589 OPT_BOOLEAN(0, "sched", &trace.sched, "show blocking scheduler events"),
7c304ee0 2590 OPT_INCR('v', "verbose", &verbose, "be more verbose"),
4bb09192
DA
2591 OPT_BOOLEAN('T', "time", &trace.full_time,
2592 "Show full timestamp, not time relative to first start"),
fd2eabaf
DA
2593 OPT_BOOLEAN('s', "summary", &trace.summary_only,
2594 "Show only syscall summary with statistics"),
2595 OPT_BOOLEAN('S', "with-summary", &trace.summary,
2596 "Show all syscalls and summary with statistics"),
598d02c5
SF
2597 OPT_CALLBACK_DEFAULT('F', "pf", &trace.trace_pgfaults, "all|maj|min",
2598 "Trace pagefaults", parse_pagefaults, "maj"),
e281a960 2599 OPT_BOOLEAN(0, "syscalls", &trace.trace_syscalls, "Trace syscalls"),
514f1c67
ACM
2600 OPT_END()
2601 };
2602 int err;
32caf0d1 2603 char bf[BUFSIZ];
514f1c67 2604
14a052df
ACM
2605 trace.evlist = perf_evlist__new();
2606 if (trace.evlist == NULL)
2607 return -ENOMEM;
2608
2609 if (trace.evlist == NULL) {
2610 pr_err("Not enough memory to run!\n");
2611 goto out;
2612 }
2613
1e28fe0a
SF
2614 argc = parse_options(argc, argv, trace_options, trace_usage,
2615 PARSE_OPT_STOP_AT_NON_OPTION);
fd2eabaf 2616
598d02c5
SF
2617 if (trace.trace_pgfaults) {
2618 trace.opts.sample_address = true;
2619 trace.opts.sample_time = true;
2620 }
2621
14a052df
ACM
2622 if (trace.evlist->nr_entries > 0)
2623 evlist__set_evsel_handler(trace.evlist, trace__event_handler);
2624
1e28fe0a
SF
2625 if ((argc >= 1) && (strcmp(argv[0], "record") == 0))
2626 return trace__record(&trace, argc-1, &argv[1]);
2627
2628 /* summary_only implies summary option, but don't overwrite summary if set */
2629 if (trace.summary_only)
2630 trace.summary = trace.summary_only;
2631
726f3234
ACM
2632 if (!trace.trace_syscalls && !trace.trace_pgfaults &&
2633 trace.evlist->nr_entries == 0 /* Was --events used? */) {
e281a960
SF
2634 pr_err("Please specify something to trace.\n");
2635 return -1;
2636 }
2637
c24ff998
ACM
2638 if (output_name != NULL) {
2639 err = trace__open_output(&trace, output_name);
2640 if (err < 0) {
2641 perror("failed to create output file");
2642 goto out;
2643 }
2644 }
2645
2ae3a312 2646 if (ev_qualifier_str != NULL) {
b059efdf
ACM
2647 const char *s = ev_qualifier_str;
2648
2649 trace.not_ev_qualifier = *s == '!';
2650 if (trace.not_ev_qualifier)
2651 ++s;
2652 trace.ev_qualifier = strlist__new(true, s);
2ae3a312 2653 if (trace.ev_qualifier == NULL) {
c24ff998
ACM
2654 fputs("Not enough memory to parse event qualifier",
2655 trace.output);
2656 err = -ENOMEM;
2657 goto out_close;
2ae3a312
ACM
2658 }
2659 }
2660
602ad878 2661 err = target__validate(&trace.opts.target);
32caf0d1 2662 if (err) {
602ad878 2663 target__strerror(&trace.opts.target, err, bf, sizeof(bf));
c24ff998
ACM
2664 fprintf(trace.output, "%s", bf);
2665 goto out_close;
32caf0d1
NK
2666 }
2667
602ad878 2668 err = target__parse_uid(&trace.opts.target);
514f1c67 2669 if (err) {
602ad878 2670 target__strerror(&trace.opts.target, err, bf, sizeof(bf));
c24ff998
ACM
2671 fprintf(trace.output, "%s", bf);
2672 goto out_close;
514f1c67
ACM
2673 }
2674
602ad878 2675 if (!argc && target__none(&trace.opts.target))
ee76120e
NK
2676 trace.opts.target.system_wide = true;
2677
6810fc91
DA
2678 if (input_name)
2679 err = trace__replay(&trace);
2680 else
2681 err = trace__run(&trace, argc, argv);
1302d88e 2682
c24ff998
ACM
2683out_close:
2684 if (output_name != NULL)
2685 fclose(trace.output);
2686out:
1302d88e 2687 return err;
514f1c67 2688}