]> git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blame - kernel/trace/trace.c
tracing: Add hist trigger 'execname' modifier
[mirror_ubuntu-jammy-kernel.git] / kernel / trace / trace.c
CommitLineData
bc0c38d1
SR
1/*
2 * ring buffer based function tracer
3 *
2b6080f2 4 * Copyright (C) 2007-2012 Steven Rostedt <srostedt@redhat.com>
bc0c38d1
SR
5 * Copyright (C) 2008 Ingo Molnar <mingo@redhat.com>
6 *
7 * Originally taken from the RT patch by:
8 * Arnaldo Carvalho de Melo <acme@redhat.com>
9 *
10 * Based on code from the latency_tracer, that is:
11 * Copyright (C) 2004-2006 Ingo Molnar
6d49e352 12 * Copyright (C) 2004 Nadia Yvette Chambers
bc0c38d1 13 */
2cadf913 14#include <linux/ring_buffer.h>
273b281f 15#include <generated/utsrelease.h>
2cadf913
SR
16#include <linux/stacktrace.h>
17#include <linux/writeback.h>
bc0c38d1
SR
18#include <linux/kallsyms.h>
19#include <linux/seq_file.h>
3f5a54e3 20#include <linux/notifier.h>
2cadf913 21#include <linux/irqflags.h>
bc0c38d1 22#include <linux/debugfs.h>
8434dc93 23#include <linux/tracefs.h>
4c11d7ae 24#include <linux/pagemap.h>
bc0c38d1
SR
25#include <linux/hardirq.h>
26#include <linux/linkage.h>
27#include <linux/uaccess.h>
2cadf913 28#include <linux/kprobes.h>
bc0c38d1
SR
29#include <linux/ftrace.h>
30#include <linux/module.h>
31#include <linux/percpu.h>
2cadf913 32#include <linux/splice.h>
3f5a54e3 33#include <linux/kdebug.h>
5f0c6c03 34#include <linux/string.h>
f76180bc 35#include <linux/mount.h>
7e53bd42 36#include <linux/rwsem.h>
5a0e3ad6 37#include <linux/slab.h>
bc0c38d1
SR
38#include <linux/ctype.h>
39#include <linux/init.h>
2a2cc8f7 40#include <linux/poll.h>
b892e5c8 41#include <linux/nmi.h>
bc0c38d1 42#include <linux/fs.h>
8bd75c77 43#include <linux/sched/rt.h>
86387f7e 44
bc0c38d1 45#include "trace.h"
f0868d1e 46#include "trace_output.h"
bc0c38d1 47
73c5162a
SR
48/*
49 * On boot up, the ring buffer is set to the minimum size, so that
50 * we do not waste memory on systems that are not using tracing.
51 */
55034cd6 52bool ring_buffer_expanded;
73c5162a 53
8e1b82e0
FW
54/*
55 * We need to change this state when a selftest is running.
ff32504f
FW
56 * A selftest will lurk into the ring-buffer to count the
57 * entries inserted during the selftest although some concurrent
5e1607a0 58 * insertions into the ring-buffer such as trace_printk could occur
ff32504f
FW
59 * at the same time, giving false positive or negative results.
60 */
8e1b82e0 61static bool __read_mostly tracing_selftest_running;
ff32504f 62
b2821ae6
SR
63/*
64 * If a tracer is running, we do not want to run SELFTEST.
65 */
020e5f85 66bool __read_mostly tracing_selftest_disabled;
b2821ae6 67
0daa2302
SRRH
68/* Pipe tracepoints to printk */
69struct trace_iterator *tracepoint_print_iter;
70int tracepoint_printk;
71
adf9f195
FW
72/* For tracers that don't implement custom flags */
73static struct tracer_opt dummy_tracer_opt[] = {
74 { }
75};
76
8c1a49ae
SRRH
77static int
78dummy_set_flag(struct trace_array *tr, u32 old_flags, u32 bit, int set)
adf9f195
FW
79{
80 return 0;
81}
0f048701 82
7ffbd48d
SR
83/*
84 * To prevent the comm cache from being overwritten when no
85 * tracing is active, only save the comm when a trace event
86 * occurred.
87 */
88static DEFINE_PER_CPU(bool, trace_cmdline_save);
89
0f048701
SR
90/*
91 * Kill all tracing for good (never come back).
92 * It is initialized to 1 but will turn to zero if the initialization
93 * of the tracer is successful. But that is the only place that sets
94 * this back to zero.
95 */
4fd27358 96static int tracing_disabled = 1;
0f048701 97
955b61e5 98cpumask_var_t __read_mostly tracing_buffer_mask;
ab46428c 99
944ac425
SR
100/*
101 * ftrace_dump_on_oops - variable to dump ftrace buffer on oops
102 *
103 * If there is an oops (or kernel panic) and the ftrace_dump_on_oops
104 * is set, then ftrace_dump is called. This will output the contents
105 * of the ftrace buffers to the console. This is very useful for
106 * capturing traces that lead to crashes and outputting it to a
107 * serial console.
108 *
109 * It is default off, but you can enable it with either specifying
110 * "ftrace_dump_on_oops" in the kernel command line, or setting
cecbca96
FW
111 * /proc/sys/kernel/ftrace_dump_on_oops
112 * Set 1 if you want to dump buffers of all CPUs
113 * Set 2 if you want to dump the buffer of the CPU that triggered oops
944ac425 114 */
cecbca96
FW
115
116enum ftrace_dump_mode ftrace_dump_on_oops;
944ac425 117
de7edd31
SRRH
118/* When set, tracing will stop when a WARN*() is hit */
119int __disable_trace_on_warning;
120
9828413d
SRRH
121#ifdef CONFIG_TRACE_ENUM_MAP_FILE
122/* Map of enums to their values, for "enum_map" file */
123struct trace_enum_map_head {
124 struct module *mod;
125 unsigned long length;
126};
127
128union trace_enum_map_item;
129
130struct trace_enum_map_tail {
131 /*
132 * "end" is first and points to NULL as it must be different
133 * than "mod" or "enum_string"
134 */
135 union trace_enum_map_item *next;
136 const char *end; /* points to NULL */
137};
138
139static DEFINE_MUTEX(trace_enum_mutex);
140
141/*
142 * The trace_enum_maps are saved in an array with two extra elements,
143 * one at the beginning, and one at the end. The beginning item contains
144 * the count of the saved maps (head.length), and the module they
145 * belong to if not built in (head.mod). The ending item contains a
146 * pointer to the next array of saved enum_map items.
147 */
148union trace_enum_map_item {
149 struct trace_enum_map map;
150 struct trace_enum_map_head head;
151 struct trace_enum_map_tail tail;
152};
153
154static union trace_enum_map_item *trace_enum_maps;
155#endif /* CONFIG_TRACE_ENUM_MAP_FILE */
156
607e2ea1 157static int tracing_set_tracer(struct trace_array *tr, const char *buf);
b2821ae6 158
ee6c2c1b
LZ
159#define MAX_TRACER_SIZE 100
160static char bootup_tracer_buf[MAX_TRACER_SIZE] __initdata;
b2821ae6 161static char *default_bootup_tracer;
d9e54076 162
55034cd6
SRRH
163static bool allocate_snapshot;
164
1beee96b 165static int __init set_cmdline_ftrace(char *str)
d9e54076 166{
67012ab1 167 strlcpy(bootup_tracer_buf, str, MAX_TRACER_SIZE);
b2821ae6 168 default_bootup_tracer = bootup_tracer_buf;
73c5162a 169 /* We are using ftrace early, expand it */
55034cd6 170 ring_buffer_expanded = true;
d9e54076
PZ
171 return 1;
172}
1beee96b 173__setup("ftrace=", set_cmdline_ftrace);
d9e54076 174
944ac425
SR
175static int __init set_ftrace_dump_on_oops(char *str)
176{
cecbca96
FW
177 if (*str++ != '=' || !*str) {
178 ftrace_dump_on_oops = DUMP_ALL;
179 return 1;
180 }
181
182 if (!strcmp("orig_cpu", str)) {
183 ftrace_dump_on_oops = DUMP_ORIG;
184 return 1;
185 }
186
187 return 0;
944ac425
SR
188}
189__setup("ftrace_dump_on_oops", set_ftrace_dump_on_oops);
60a11774 190
de7edd31
SRRH
191static int __init stop_trace_on_warning(char *str)
192{
933ff9f2
LCG
193 if ((strcmp(str, "=0") != 0 && strcmp(str, "=off") != 0))
194 __disable_trace_on_warning = 1;
de7edd31
SRRH
195 return 1;
196}
933ff9f2 197__setup("traceoff_on_warning", stop_trace_on_warning);
de7edd31 198
3209cff4 199static int __init boot_alloc_snapshot(char *str)
55034cd6
SRRH
200{
201 allocate_snapshot = true;
202 /* We also need the main ring buffer expanded */
203 ring_buffer_expanded = true;
204 return 1;
205}
3209cff4 206__setup("alloc_snapshot", boot_alloc_snapshot);
55034cd6 207
7bcfaf54
SR
208
209static char trace_boot_options_buf[MAX_TRACER_SIZE] __initdata;
7bcfaf54
SR
210
211static int __init set_trace_boot_options(char *str)
212{
67012ab1 213 strlcpy(trace_boot_options_buf, str, MAX_TRACER_SIZE);
7bcfaf54
SR
214 return 0;
215}
216__setup("trace_options=", set_trace_boot_options);
217
e1e232ca
SR
218static char trace_boot_clock_buf[MAX_TRACER_SIZE] __initdata;
219static char *trace_boot_clock __initdata;
220
221static int __init set_trace_boot_clock(char *str)
222{
223 strlcpy(trace_boot_clock_buf, str, MAX_TRACER_SIZE);
224 trace_boot_clock = trace_boot_clock_buf;
225 return 0;
226}
227__setup("trace_clock=", set_trace_boot_clock);
228
0daa2302
SRRH
229static int __init set_tracepoint_printk(char *str)
230{
231 if ((strcmp(str, "=0") != 0 && strcmp(str, "=off") != 0))
232 tracepoint_printk = 1;
233 return 1;
234}
235__setup("tp_printk", set_tracepoint_printk);
de7edd31 236
cf8e3474 237unsigned long long ns2usecs(cycle_t nsec)
bc0c38d1
SR
238{
239 nsec += 500;
240 do_div(nsec, 1000);
241 return nsec;
242}
243
983f938a
SRRH
244/* trace_flags holds trace_options default values */
245#define TRACE_DEFAULT_FLAGS \
246 (FUNCTION_DEFAULT_FLAGS | \
247 TRACE_ITER_PRINT_PARENT | TRACE_ITER_PRINTK | \
248 TRACE_ITER_ANNOTATE | TRACE_ITER_CONTEXT_INFO | \
249 TRACE_ITER_RECORD_CMD | TRACE_ITER_OVERWRITE | \
250 TRACE_ITER_IRQ_INFO | TRACE_ITER_MARKERS)
251
16270145
SRRH
252/* trace_options that are only supported by global_trace */
253#define TOP_LEVEL_TRACE_FLAGS (TRACE_ITER_PRINTK | \
254 TRACE_ITER_PRINTK_MSGONLY | TRACE_ITER_RECORD_CMD)
255
256
4fcdae83
SR
257/*
258 * The global_trace is the descriptor that holds the tracing
259 * buffers for the live tracing. For each CPU, it contains
260 * a link list of pages that will store trace entries. The
261 * page descriptor of the pages in the memory is used to hold
262 * the link list by linking the lru item in the page descriptor
263 * to each of the pages in the buffer per CPU.
264 *
265 * For each active CPU there is a data field that holds the
266 * pages for the buffer for that CPU. Each CPU has the same number
267 * of pages allocated for its buffer.
268 */
983f938a
SRRH
269static struct trace_array global_trace = {
270 .trace_flags = TRACE_DEFAULT_FLAGS,
271};
bc0c38d1 272
ae63b31e 273LIST_HEAD(ftrace_trace_arrays);
bc0c38d1 274
ff451961
SRRH
275int trace_array_get(struct trace_array *this_tr)
276{
277 struct trace_array *tr;
278 int ret = -ENODEV;
279
280 mutex_lock(&trace_types_lock);
281 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
282 if (tr == this_tr) {
283 tr->ref++;
284 ret = 0;
285 break;
286 }
287 }
288 mutex_unlock(&trace_types_lock);
289
290 return ret;
291}
292
293static void __trace_array_put(struct trace_array *this_tr)
294{
295 WARN_ON(!this_tr->ref);
296 this_tr->ref--;
297}
298
299void trace_array_put(struct trace_array *this_tr)
300{
301 mutex_lock(&trace_types_lock);
302 __trace_array_put(this_tr);
303 mutex_unlock(&trace_types_lock);
304}
305
7f1d2f82 306int filter_check_discard(struct trace_event_file *file, void *rec,
f306cc82
TZ
307 struct ring_buffer *buffer,
308 struct ring_buffer_event *event)
eb02ce01 309{
5d6ad960 310 if (unlikely(file->flags & EVENT_FILE_FL_FILTERED) &&
f306cc82
TZ
311 !filter_match_preds(file->filter, rec)) {
312 ring_buffer_discard_commit(buffer, event);
313 return 1;
314 }
315
316 return 0;
317}
318EXPORT_SYMBOL_GPL(filter_check_discard);
319
2425bcb9 320int call_filter_check_discard(struct trace_event_call *call, void *rec,
f306cc82
TZ
321 struct ring_buffer *buffer,
322 struct ring_buffer_event *event)
323{
324 if (unlikely(call->flags & TRACE_EVENT_FL_FILTERED) &&
325 !filter_match_preds(call->filter, rec)) {
326 ring_buffer_discard_commit(buffer, event);
327 return 1;
328 }
329
330 return 0;
eb02ce01 331}
f306cc82 332EXPORT_SYMBOL_GPL(call_filter_check_discard);
eb02ce01 333
ad1438a0 334static cycle_t buffer_ftrace_now(struct trace_buffer *buf, int cpu)
37886f6a
SR
335{
336 u64 ts;
337
338 /* Early boot up does not have a buffer yet */
9457158b 339 if (!buf->buffer)
37886f6a
SR
340 return trace_clock_local();
341
9457158b
AL
342 ts = ring_buffer_time_stamp(buf->buffer, cpu);
343 ring_buffer_normalize_time_stamp(buf->buffer, cpu, &ts);
37886f6a
SR
344
345 return ts;
346}
bc0c38d1 347
9457158b
AL
348cycle_t ftrace_now(int cpu)
349{
350 return buffer_ftrace_now(&global_trace.trace_buffer, cpu);
351}
352
10246fa3
SRRH
353/**
354 * tracing_is_enabled - Show if global_trace has been disabled
355 *
356 * Shows if the global trace has been enabled or not. It uses the
357 * mirror flag "buffer_disabled" to be used in fast paths such as for
358 * the irqsoff tracer. But it may be inaccurate due to races. If you
359 * need to know the accurate state, use tracing_is_on() which is a little
360 * slower, but accurate.
361 */
9036990d
SR
362int tracing_is_enabled(void)
363{
10246fa3
SRRH
364 /*
365 * For quick access (irqsoff uses this in fast path), just
366 * return the mirror variable of the state of the ring buffer.
367 * It's a little racy, but we don't really care.
368 */
369 smp_rmb();
370 return !global_trace.buffer_disabled;
9036990d
SR
371}
372
4fcdae83 373/*
3928a8a2
SR
374 * trace_buf_size is the size in bytes that is allocated
375 * for a buffer. Note, the number of bytes is always rounded
376 * to page size.
3f5a54e3
SR
377 *
378 * This number is purposely set to a low number of 16384.
379 * If the dump on oops happens, it will be much appreciated
380 * to not have to wait for all that output. Anyway this can be
381 * boot time and run time configurable.
4fcdae83 382 */
3928a8a2 383#define TRACE_BUF_SIZE_DEFAULT 1441792UL /* 16384 * 88 (sizeof(entry)) */
3f5a54e3 384
3928a8a2 385static unsigned long trace_buf_size = TRACE_BUF_SIZE_DEFAULT;
bc0c38d1 386
4fcdae83 387/* trace_types holds a link list of available tracers. */
bc0c38d1 388static struct tracer *trace_types __read_mostly;
4fcdae83 389
4fcdae83
SR
390/*
391 * trace_types_lock is used to protect the trace_types list.
4fcdae83 392 */
a8227415 393DEFINE_MUTEX(trace_types_lock);
4fcdae83 394
7e53bd42
LJ
395/*
396 * serialize the access of the ring buffer
397 *
398 * ring buffer serializes readers, but it is low level protection.
399 * The validity of the events (which returns by ring_buffer_peek() ..etc)
400 * are not protected by ring buffer.
401 *
402 * The content of events may become garbage if we allow other process consumes
403 * these events concurrently:
404 * A) the page of the consumed events may become a normal page
405 * (not reader page) in ring buffer, and this page will be rewritten
406 * by events producer.
407 * B) The page of the consumed events may become a page for splice_read,
408 * and this page will be returned to system.
409 *
410 * These primitives allow multi process access to different cpu ring buffer
411 * concurrently.
412 *
413 * These primitives don't distinguish read-only and read-consume access.
414 * Multi read-only access are also serialized.
415 */
416
417#ifdef CONFIG_SMP
418static DECLARE_RWSEM(all_cpu_access_lock);
419static DEFINE_PER_CPU(struct mutex, cpu_access_lock);
420
421static inline void trace_access_lock(int cpu)
422{
ae3b5093 423 if (cpu == RING_BUFFER_ALL_CPUS) {
7e53bd42
LJ
424 /* gain it for accessing the whole ring buffer. */
425 down_write(&all_cpu_access_lock);
426 } else {
427 /* gain it for accessing a cpu ring buffer. */
428
ae3b5093 429 /* Firstly block other trace_access_lock(RING_BUFFER_ALL_CPUS). */
7e53bd42
LJ
430 down_read(&all_cpu_access_lock);
431
432 /* Secondly block other access to this @cpu ring buffer. */
433 mutex_lock(&per_cpu(cpu_access_lock, cpu));
434 }
435}
436
437static inline void trace_access_unlock(int cpu)
438{
ae3b5093 439 if (cpu == RING_BUFFER_ALL_CPUS) {
7e53bd42
LJ
440 up_write(&all_cpu_access_lock);
441 } else {
442 mutex_unlock(&per_cpu(cpu_access_lock, cpu));
443 up_read(&all_cpu_access_lock);
444 }
445}
446
447static inline void trace_access_lock_init(void)
448{
449 int cpu;
450
451 for_each_possible_cpu(cpu)
452 mutex_init(&per_cpu(cpu_access_lock, cpu));
453}
454
455#else
456
457static DEFINE_MUTEX(access_lock);
458
459static inline void trace_access_lock(int cpu)
460{
461 (void)cpu;
462 mutex_lock(&access_lock);
463}
464
465static inline void trace_access_unlock(int cpu)
466{
467 (void)cpu;
468 mutex_unlock(&access_lock);
469}
470
471static inline void trace_access_lock_init(void)
472{
473}
474
475#endif
476
d78a4614
SRRH
477#ifdef CONFIG_STACKTRACE
478static void __ftrace_trace_stack(struct ring_buffer *buffer,
479 unsigned long flags,
480 int skip, int pc, struct pt_regs *regs);
2d34f489
SRRH
481static inline void ftrace_trace_stack(struct trace_array *tr,
482 struct ring_buffer *buffer,
73dddbb5
SRRH
483 unsigned long flags,
484 int skip, int pc, struct pt_regs *regs);
ca475e83 485
d78a4614
SRRH
486#else
487static inline void __ftrace_trace_stack(struct ring_buffer *buffer,
488 unsigned long flags,
489 int skip, int pc, struct pt_regs *regs)
490{
491}
2d34f489
SRRH
492static inline void ftrace_trace_stack(struct trace_array *tr,
493 struct ring_buffer *buffer,
73dddbb5
SRRH
494 unsigned long flags,
495 int skip, int pc, struct pt_regs *regs)
ca475e83
SRRH
496{
497}
498
d78a4614
SRRH
499#endif
500
5280bcef 501static void tracer_tracing_on(struct trace_array *tr)
10246fa3
SRRH
502{
503 if (tr->trace_buffer.buffer)
504 ring_buffer_record_on(tr->trace_buffer.buffer);
505 /*
506 * This flag is looked at when buffers haven't been allocated
507 * yet, or by some tracers (like irqsoff), that just want to
508 * know if the ring buffer has been disabled, but it can handle
509 * races of where it gets disabled but we still do a record.
510 * As the check is in the fast path of the tracers, it is more
511 * important to be fast than accurate.
512 */
513 tr->buffer_disabled = 0;
514 /* Make the flag seen by readers */
515 smp_wmb();
516}
517
499e5470
SR
518/**
519 * tracing_on - enable tracing buffers
520 *
521 * This function enables tracing buffers that may have been
522 * disabled with tracing_off.
523 */
524void tracing_on(void)
525{
10246fa3 526 tracer_tracing_on(&global_trace);
499e5470
SR
527}
528EXPORT_SYMBOL_GPL(tracing_on);
529
09ae7234
SRRH
530/**
531 * __trace_puts - write a constant string into the trace buffer.
532 * @ip: The address of the caller
533 * @str: The constant string to write
534 * @size: The size of the string.
535 */
536int __trace_puts(unsigned long ip, const char *str, int size)
537{
538 struct ring_buffer_event *event;
539 struct ring_buffer *buffer;
540 struct print_entry *entry;
541 unsigned long irq_flags;
542 int alloc;
8abfb872
J
543 int pc;
544
983f938a 545 if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
f0160a5a
J
546 return 0;
547
8abfb872 548 pc = preempt_count();
09ae7234 549
3132e107
SRRH
550 if (unlikely(tracing_selftest_running || tracing_disabled))
551 return 0;
552
09ae7234
SRRH
553 alloc = sizeof(*entry) + size + 2; /* possible \n added */
554
555 local_save_flags(irq_flags);
556 buffer = global_trace.trace_buffer.buffer;
557 event = trace_buffer_lock_reserve(buffer, TRACE_PRINT, alloc,
8abfb872 558 irq_flags, pc);
09ae7234
SRRH
559 if (!event)
560 return 0;
561
562 entry = ring_buffer_event_data(event);
563 entry->ip = ip;
564
565 memcpy(&entry->buf, str, size);
566
567 /* Add a newline if necessary */
568 if (entry->buf[size - 1] != '\n') {
569 entry->buf[size] = '\n';
570 entry->buf[size + 1] = '\0';
571 } else
572 entry->buf[size] = '\0';
573
574 __buffer_unlock_commit(buffer, event);
2d34f489 575 ftrace_trace_stack(&global_trace, buffer, irq_flags, 4, pc, NULL);
09ae7234
SRRH
576
577 return size;
578}
579EXPORT_SYMBOL_GPL(__trace_puts);
580
581/**
582 * __trace_bputs - write the pointer to a constant string into trace buffer
583 * @ip: The address of the caller
584 * @str: The constant string to write to the buffer to
585 */
586int __trace_bputs(unsigned long ip, const char *str)
587{
588 struct ring_buffer_event *event;
589 struct ring_buffer *buffer;
590 struct bputs_entry *entry;
591 unsigned long irq_flags;
592 int size = sizeof(struct bputs_entry);
8abfb872
J
593 int pc;
594
983f938a 595 if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
f0160a5a
J
596 return 0;
597
8abfb872 598 pc = preempt_count();
09ae7234 599
3132e107
SRRH
600 if (unlikely(tracing_selftest_running || tracing_disabled))
601 return 0;
602
09ae7234
SRRH
603 local_save_flags(irq_flags);
604 buffer = global_trace.trace_buffer.buffer;
605 event = trace_buffer_lock_reserve(buffer, TRACE_BPUTS, size,
8abfb872 606 irq_flags, pc);
09ae7234
SRRH
607 if (!event)
608 return 0;
609
610 entry = ring_buffer_event_data(event);
611 entry->ip = ip;
612 entry->str = str;
613
614 __buffer_unlock_commit(buffer, event);
2d34f489 615 ftrace_trace_stack(&global_trace, buffer, irq_flags, 4, pc, NULL);
09ae7234
SRRH
616
617 return 1;
618}
619EXPORT_SYMBOL_GPL(__trace_bputs);
620
ad909e21
SRRH
621#ifdef CONFIG_TRACER_SNAPSHOT
622/**
623 * tracing_snapshot - take a snapshot of the current buffer.
624 *
625 * This causes a swap between the snapshot buffer and the current live
626 * tracing buffer. You can use this to take snapshots of the live
627 * trace when some condition is triggered, but continue to trace.
628 *
629 * Note, make sure to allocate the snapshot with either
630 * a tracing_snapshot_alloc(), or by doing it manually
631 * with: echo 1 > /sys/kernel/debug/tracing/snapshot
632 *
633 * If the snapshot buffer is not allocated, it will stop tracing.
634 * Basically making a permanent snapshot.
635 */
636void tracing_snapshot(void)
637{
638 struct trace_array *tr = &global_trace;
639 struct tracer *tracer = tr->current_trace;
640 unsigned long flags;
641
1b22e382
SRRH
642 if (in_nmi()) {
643 internal_trace_puts("*** SNAPSHOT CALLED FROM NMI CONTEXT ***\n");
644 internal_trace_puts("*** snapshot is being ignored ***\n");
645 return;
646 }
647
ad909e21 648 if (!tr->allocated_snapshot) {
ca268da6
SRRH
649 internal_trace_puts("*** SNAPSHOT NOT ALLOCATED ***\n");
650 internal_trace_puts("*** stopping trace here! ***\n");
ad909e21
SRRH
651 tracing_off();
652 return;
653 }
654
655 /* Note, snapshot can not be used when the tracer uses it */
656 if (tracer->use_max_tr) {
ca268da6
SRRH
657 internal_trace_puts("*** LATENCY TRACER ACTIVE ***\n");
658 internal_trace_puts("*** Can not use snapshot (sorry) ***\n");
ad909e21
SRRH
659 return;
660 }
661
662 local_irq_save(flags);
663 update_max_tr(tr, current, smp_processor_id());
664 local_irq_restore(flags);
665}
1b22e382 666EXPORT_SYMBOL_GPL(tracing_snapshot);
ad909e21
SRRH
667
668static int resize_buffer_duplicate_size(struct trace_buffer *trace_buf,
669 struct trace_buffer *size_buf, int cpu_id);
3209cff4
SRRH
670static void set_buffer_entries(struct trace_buffer *buf, unsigned long val);
671
672static int alloc_snapshot(struct trace_array *tr)
673{
674 int ret;
675
676 if (!tr->allocated_snapshot) {
677
678 /* allocate spare buffer */
679 ret = resize_buffer_duplicate_size(&tr->max_buffer,
680 &tr->trace_buffer, RING_BUFFER_ALL_CPUS);
681 if (ret < 0)
682 return ret;
683
684 tr->allocated_snapshot = true;
685 }
686
687 return 0;
688}
689
ad1438a0 690static void free_snapshot(struct trace_array *tr)
3209cff4
SRRH
691{
692 /*
693 * We don't free the ring buffer. instead, resize it because
694 * The max_tr ring buffer has some state (e.g. ring->clock) and
695 * we want preserve it.
696 */
697 ring_buffer_resize(tr->max_buffer.buffer, 1, RING_BUFFER_ALL_CPUS);
698 set_buffer_entries(&tr->max_buffer, 1);
699 tracing_reset_online_cpus(&tr->max_buffer);
700 tr->allocated_snapshot = false;
701}
ad909e21 702
93e31ffb
TZ
703/**
704 * tracing_alloc_snapshot - allocate snapshot buffer.
705 *
706 * This only allocates the snapshot buffer if it isn't already
707 * allocated - it doesn't also take a snapshot.
708 *
709 * This is meant to be used in cases where the snapshot buffer needs
710 * to be set up for events that can't sleep but need to be able to
711 * trigger a snapshot.
712 */
713int tracing_alloc_snapshot(void)
714{
715 struct trace_array *tr = &global_trace;
716 int ret;
717
718 ret = alloc_snapshot(tr);
719 WARN_ON(ret < 0);
720
721 return ret;
722}
723EXPORT_SYMBOL_GPL(tracing_alloc_snapshot);
724
ad909e21
SRRH
725/**
726 * tracing_snapshot_alloc - allocate and take a snapshot of the current buffer.
727 *
728 * This is similar to tracing_snapshot(), but it will allocate the
729 * snapshot buffer if it isn't already allocated. Use this only
730 * where it is safe to sleep, as the allocation may sleep.
731 *
732 * This causes a swap between the snapshot buffer and the current live
733 * tracing buffer. You can use this to take snapshots of the live
734 * trace when some condition is triggered, but continue to trace.
735 */
void tracing_snapshot_alloc(void)
{
	/* Only take the snapshot if the buffer could be set up. */
	if (tracing_alloc_snapshot() >= 0)
		tracing_snapshot();
}
EXPORT_SYMBOL_GPL(tracing_snapshot_alloc);
ad909e21
SRRH
747#else
748void tracing_snapshot(void)
749{
750 WARN_ONCE(1, "Snapshot feature not enabled, but internal snapshot used");
751}
1b22e382 752EXPORT_SYMBOL_GPL(tracing_snapshot);
93e31ffb
TZ
753int tracing_alloc_snapshot(void)
754{
755 WARN_ONCE(1, "Snapshot feature not enabled, but snapshot allocation used");
756 return -ENODEV;
757}
758EXPORT_SYMBOL_GPL(tracing_alloc_snapshot);
ad909e21
SRRH
759void tracing_snapshot_alloc(void)
760{
761 /* Give warning */
762 tracing_snapshot();
763}
1b22e382 764EXPORT_SYMBOL_GPL(tracing_snapshot_alloc);
ad909e21
SRRH
765#endif /* CONFIG_TRACER_SNAPSHOT */
766
5280bcef 767static void tracer_tracing_off(struct trace_array *tr)
10246fa3
SRRH
768{
769 if (tr->trace_buffer.buffer)
770 ring_buffer_record_off(tr->trace_buffer.buffer);
771 /*
772 * This flag is looked at when buffers haven't been allocated
773 * yet, or by some tracers (like irqsoff), that just want to
774 * know if the ring buffer has been disabled, but it can handle
775 * races of where it gets disabled but we still do a record.
776 * As the check is in the fast path of the tracers, it is more
777 * important to be fast than accurate.
778 */
779 tr->buffer_disabled = 1;
780 /* Make the flag seen by readers */
781 smp_wmb();
782}
783
499e5470
SR
784/**
785 * tracing_off - turn off tracing buffers
786 *
787 * This function stops the tracing buffers from recording data.
788 * It does not disable any overhead the tracers themselves may
789 * be causing. This function simply causes all recording to
790 * the ring buffers to fail.
791 */
792void tracing_off(void)
793{
10246fa3 794 tracer_tracing_off(&global_trace);
499e5470
SR
795}
796EXPORT_SYMBOL_GPL(tracing_off);
797
de7edd31
SRRH
798void disable_trace_on_warning(void)
799{
800 if (__disable_trace_on_warning)
801 tracing_off();
802}
803
10246fa3
SRRH
804/**
805 * tracer_tracing_is_on - show real state of ring buffer enabled
806 * @tr : the trace array to know if ring buffer is enabled
807 *
808 * Shows real state of the ring buffer if it is enabled or not.
809 */
5280bcef 810static int tracer_tracing_is_on(struct trace_array *tr)
10246fa3
SRRH
811{
812 if (tr->trace_buffer.buffer)
813 return ring_buffer_record_is_on(tr->trace_buffer.buffer);
814 return !tr->buffer_disabled;
815}
816
499e5470
SR
817/**
818 * tracing_is_on - show state of ring buffers enabled
819 */
820int tracing_is_on(void)
821{
10246fa3 822 return tracer_tracing_is_on(&global_trace);
499e5470
SR
823}
824EXPORT_SYMBOL_GPL(tracing_is_on);
825
3928a8a2 826static int __init set_buf_size(char *str)
bc0c38d1 827{
3928a8a2 828 unsigned long buf_size;
c6caeeb1 829
bc0c38d1
SR
830 if (!str)
831 return 0;
9d612bef 832 buf_size = memparse(str, &str);
c6caeeb1 833 /* nr_entries can not be zero */
9d612bef 834 if (buf_size == 0)
c6caeeb1 835 return 0;
3928a8a2 836 trace_buf_size = buf_size;
bc0c38d1
SR
837 return 1;
838}
3928a8a2 839__setup("trace_buf_size=", set_buf_size);
bc0c38d1 840
0e950173
TB
841static int __init set_tracing_thresh(char *str)
842{
87abb3b1 843 unsigned long threshold;
0e950173
TB
844 int ret;
845
846 if (!str)
847 return 0;
bcd83ea6 848 ret = kstrtoul(str, 0, &threshold);
0e950173
TB
849 if (ret < 0)
850 return 0;
87abb3b1 851 tracing_thresh = threshold * 1000;
0e950173
TB
852 return 1;
853}
854__setup("tracing_thresh=", set_tracing_thresh);
855
57f50be1
SR
/* Convert @nsecs to microseconds, truncating any remainder. */
unsigned long nsecs_to_usecs(unsigned long nsecs)
{
	const unsigned long nsecs_per_usec = 1000;

	return nsecs / nsecs_per_usec;
}
860
a3418a36
SRRH
861/*
862 * TRACE_FLAGS is defined as a tuple matching bit masks with strings.
863 * It uses C(a, b) where 'a' is the enum name and 'b' is the string that
864 * matches it. By defining "C(a, b) b", TRACE_FLAGS becomes a list
865 * of strings in the order that the enums were defined.
866 */
867#undef C
868#define C(a, b) b
869
4fcdae83 870/* These must match the bit positions in trace_iterator_flags */
bc0c38d1 871static const char *trace_options[] = {
a3418a36 872 TRACE_FLAGS
bc0c38d1
SR
873 NULL
874};
875
5079f326
Z
876static struct {
877 u64 (*func)(void);
878 const char *name;
8be0709f 879 int in_ns; /* is this clock in nanoseconds? */
5079f326 880} trace_clocks[] = {
1b3e5c09
TG
881 { trace_clock_local, "local", 1 },
882 { trace_clock_global, "global", 1 },
883 { trace_clock_counter, "counter", 0 },
e7fda6c4 884 { trace_clock_jiffies, "uptime", 0 },
1b3e5c09
TG
885 { trace_clock, "perf", 1 },
886 { ktime_get_mono_fast_ns, "mono", 1 },
aabfa5f2 887 { ktime_get_raw_fast_ns, "mono_raw", 1 },
8cbd9cc6 888 ARCH_TRACE_CLOCKS
5079f326
Z
889};
890
b63f39ea 891/*
892 * trace_parser_get_init - gets the buffer for trace parser
893 */
894int trace_parser_get_init(struct trace_parser *parser, int size)
895{
896 memset(parser, 0, sizeof(*parser));
897
898 parser->buffer = kmalloc(size, GFP_KERNEL);
899 if (!parser->buffer)
900 return 1;
901
902 parser->size = size;
903 return 0;
904}
905
906/*
907 * trace_parser_put - frees the buffer for trace parser
908 */
909void trace_parser_put(struct trace_parser *parser)
910{
911 kfree(parser->buffer);
912}
913
914/*
915 * trace_get_user - reads the user input string separated by space
916 * (matched by isspace(ch))
917 *
918 * For each string found the 'struct trace_parser' is updated,
919 * and the function returns.
920 *
921 * Returns number of bytes read.
922 *
923 * See kernel/trace/trace.h for 'struct trace_parser' details.
924 */
925int trace_get_user(struct trace_parser *parser, const char __user *ubuf,
926 size_t cnt, loff_t *ppos)
927{
928 char ch;
929 size_t read = 0;
930 ssize_t ret;
931
932 if (!*ppos)
933 trace_parser_clear(parser);
934
935 ret = get_user(ch, ubuf++);
936 if (ret)
937 goto out;
938
939 read++;
940 cnt--;
941
942 /*
943 * The parser is not finished with the last write,
944 * continue reading the user input without skipping spaces.
945 */
946 if (!parser->cont) {
947 /* skip white space */
948 while (cnt && isspace(ch)) {
949 ret = get_user(ch, ubuf++);
950 if (ret)
951 goto out;
952 read++;
953 cnt--;
954 }
955
956 /* only spaces were written */
957 if (isspace(ch)) {
958 *ppos += read;
959 ret = read;
960 goto out;
961 }
962
963 parser->idx = 0;
964 }
965
966 /* read the non-space input */
967 while (cnt && !isspace(ch)) {
3c235a33 968 if (parser->idx < parser->size - 1)
b63f39ea 969 parser->buffer[parser->idx++] = ch;
970 else {
971 ret = -EINVAL;
972 goto out;
973 }
974 ret = get_user(ch, ubuf++);
975 if (ret)
976 goto out;
977 read++;
978 cnt--;
979 }
980
981 /* We either got finished input or we have to wait for another call. */
982 if (isspace(ch)) {
983 parser->buffer[parser->idx] = 0;
984 parser->cont = false;
057db848 985 } else if (parser->idx < parser->size - 1) {
b63f39ea 986 parser->cont = true;
987 parser->buffer[parser->idx++] = ch;
057db848
SR
988 } else {
989 ret = -EINVAL;
990 goto out;
b63f39ea 991 }
992
993 *ppos += read;
994 ret = read;
995
996out:
997 return ret;
998}
999
3a161d99 1000/* TODO add a seq_buf_to_buffer() */
b8b94265 1001static ssize_t trace_seq_to_buffer(struct trace_seq *s, void *buf, size_t cnt)
3c56819b
EGM
1002{
1003 int len;
3c56819b 1004
5ac48378 1005 if (trace_seq_used(s) <= s->seq.readpos)
3c56819b
EGM
1006 return -EBUSY;
1007
5ac48378 1008 len = trace_seq_used(s) - s->seq.readpos;
3c56819b
EGM
1009 if (cnt > len)
1010 cnt = len;
3a161d99 1011 memcpy(buf, s->buffer + s->seq.readpos, cnt);
3c56819b 1012
3a161d99 1013 s->seq.readpos += cnt;
3c56819b
EGM
1014 return cnt;
1015}
1016
0e950173
TB
1017unsigned long __read_mostly tracing_thresh;
1018
5d4a9dba 1019#ifdef CONFIG_TRACER_MAX_TRACE
5d4a9dba
SR
1020/*
1021 * Copy the new maximum trace into the separate maximum-trace
1022 * structure. (this way the maximum trace is permanently saved,
1023 * for later retrieval via /sys/kernel/debug/tracing/latency_trace)
1024 */
1025static void
1026__update_max_tr(struct trace_array *tr, struct task_struct *tsk, int cpu)
1027{
12883efb
SRRH
1028 struct trace_buffer *trace_buf = &tr->trace_buffer;
1029 struct trace_buffer *max_buf = &tr->max_buffer;
1030 struct trace_array_cpu *data = per_cpu_ptr(trace_buf->data, cpu);
1031 struct trace_array_cpu *max_data = per_cpu_ptr(max_buf->data, cpu);
5d4a9dba 1032
12883efb
SRRH
1033 max_buf->cpu = cpu;
1034 max_buf->time_start = data->preempt_timestamp;
5d4a9dba 1035
6d9b3fa5 1036 max_data->saved_latency = tr->max_latency;
8248ac05
SR
1037 max_data->critical_start = data->critical_start;
1038 max_data->critical_end = data->critical_end;
5d4a9dba 1039
1acaa1b2 1040 memcpy(max_data->comm, tsk->comm, TASK_COMM_LEN);
8248ac05 1041 max_data->pid = tsk->pid;
f17a5194
SRRH
1042 /*
1043 * If tsk == current, then use current_uid(), as that does not use
1044 * RCU. The irq tracer can be called out of RCU scope.
1045 */
1046 if (tsk == current)
1047 max_data->uid = current_uid();
1048 else
1049 max_data->uid = task_uid(tsk);
1050
8248ac05
SR
1051 max_data->nice = tsk->static_prio - 20 - MAX_RT_PRIO;
1052 max_data->policy = tsk->policy;
1053 max_data->rt_priority = tsk->rt_priority;
5d4a9dba
SR
1054
1055 /* record this tasks comm */
1056 tracing_record_cmdline(tsk);
1057}
1058
4fcdae83
SR
1059/**
1060 * update_max_tr - snapshot all trace buffers from global_trace to max_tr
1061 * @tr: tracer
1062 * @tsk: the task with the latency
1063 * @cpu: The cpu that initiated the trace.
1064 *
1065 * Flip the buffers between the @tr and the max_tr and record information
1066 * about which task was the cause of this latency.
1067 */
e309b41d 1068void
bc0c38d1
SR
1069update_max_tr(struct trace_array *tr, struct task_struct *tsk, int cpu)
1070{
2721e72d 1071 struct ring_buffer *buf;
bc0c38d1 1072
2b6080f2 1073 if (tr->stop_count)
b8de7bd1
SR
1074 return;
1075
4c11d7ae 1076 WARN_ON_ONCE(!irqs_disabled());
34600f0e 1077
45ad21ca 1078 if (!tr->allocated_snapshot) {
debdd57f 1079 /* Only the nop tracer should hit this when disabling */
2b6080f2 1080 WARN_ON_ONCE(tr->current_trace != &nop_trace);
34600f0e 1081 return;
debdd57f 1082 }
34600f0e 1083
0b9b12c1 1084 arch_spin_lock(&tr->max_lock);
3928a8a2 1085
12883efb
SRRH
1086 buf = tr->trace_buffer.buffer;
1087 tr->trace_buffer.buffer = tr->max_buffer.buffer;
1088 tr->max_buffer.buffer = buf;
3928a8a2 1089
bc0c38d1 1090 __update_max_tr(tr, tsk, cpu);
0b9b12c1 1091 arch_spin_unlock(&tr->max_lock);
bc0c38d1
SR
1092}
1093
1094/**
1095 * update_max_tr_single - only copy one trace over, and reset the rest
1096 * @tr - tracer
1097 * @tsk - task with the latency
1098 * @cpu - the cpu of the buffer to copy.
4fcdae83
SR
1099 *
1100 * Flip the trace of a single CPU buffer between the @tr and the max_tr.
bc0c38d1 1101 */
e309b41d 1102void
bc0c38d1
SR
1103update_max_tr_single(struct trace_array *tr, struct task_struct *tsk, int cpu)
1104{
3928a8a2 1105 int ret;
bc0c38d1 1106
2b6080f2 1107 if (tr->stop_count)
b8de7bd1
SR
1108 return;
1109
4c11d7ae 1110 WARN_ON_ONCE(!irqs_disabled());
6c24499f 1111 if (!tr->allocated_snapshot) {
2930e04d 1112 /* Only the nop tracer should hit this when disabling */
9e8529af 1113 WARN_ON_ONCE(tr->current_trace != &nop_trace);
ef710e10 1114 return;
2930e04d 1115 }
ef710e10 1116
0b9b12c1 1117 arch_spin_lock(&tr->max_lock);
bc0c38d1 1118
12883efb 1119 ret = ring_buffer_swap_cpu(tr->max_buffer.buffer, tr->trace_buffer.buffer, cpu);
3928a8a2 1120
e8165dbb
SR
1121 if (ret == -EBUSY) {
1122 /*
1123 * We failed to swap the buffer due to a commit taking
1124 * place on this CPU. We fail to record, but we reset
1125 * the max trace buffer (no one writes directly to it)
1126 * and flag that it failed.
1127 */
12883efb 1128 trace_array_printk_buf(tr->max_buffer.buffer, _THIS_IP_,
e8165dbb
SR
1129 "Failed to swap buffers due to commit in progress\n");
1130 }
1131
e8165dbb 1132 WARN_ON_ONCE(ret && ret != -EAGAIN && ret != -EBUSY);
bc0c38d1
SR
1133
1134 __update_max_tr(tr, tsk, cpu);
0b9b12c1 1135 arch_spin_unlock(&tr->max_lock);
bc0c38d1 1136}
5d4a9dba 1137#endif /* CONFIG_TRACER_MAX_TRACE */
bc0c38d1 1138
e30f53aa 1139static int wait_on_pipe(struct trace_iterator *iter, bool full)
0d5c6e1c 1140{
15693458
SRRH
1141 /* Iterators are static, they should be filled or empty */
1142 if (trace_buffer_iter(iter, iter->cpu_file))
8b8b3683 1143 return 0;
0d5c6e1c 1144
e30f53aa
RV
1145 return ring_buffer_wait(iter->trace_buffer->buffer, iter->cpu_file,
1146 full);
0d5c6e1c
SR
1147}
1148
f4e781c0
SRRH
#ifdef CONFIG_FTRACE_STARTUP_TEST
/*
 * Run the selftest of @type against the global trace array.
 *
 * The trace buffer is reset and @type is temporarily installed as the
 * current tracer so that it can run some internal tracing and verify that
 * everything is in order. A tracer that fails is not registered by the
 * caller.
 *
 * Returns 0 when there is no selftest to run (or selftests are disabled)
 * or when the test passed, -1 when it failed.
 */
static int run_tracer_selftest(struct tracer *type)
{
	struct trace_array *tr = &global_trace;
	struct tracer *prev_tracer = tr->current_trace;
	int ret;

	if (tracing_selftest_disabled || !type->selftest)
		return 0;

	tracing_reset_online_cpus(&tr->trace_buffer);

	tr->current_trace = type;

#ifdef CONFIG_TRACER_MAX_TRACE
	if (type->use_max_tr) {
		/* If we expanded the buffers, make sure the max is expanded too */
		if (ring_buffer_expanded)
			ring_buffer_resize(tr->max_buffer.buffer, trace_buf_size,
					   RING_BUFFER_ALL_CPUS);
		tr->allocated_snapshot = true;
	}
#endif

	/* The test initializes, enables and resets the tracer itself. */
	pr_info("Testing tracer %s: ", type->name);
	ret = type->selftest(type, tr);
	tr->current_trace = prev_tracer;

	if (ret) {
		printk(KERN_CONT "FAILED!\n");
		/* Add the warning after printing 'FAILED' */
		WARN_ON(1);
		return -1;
	}

	/* Only reset on passing, to avoid touching corrupted buffers */
	tracing_reset_online_cpus(&tr->trace_buffer);

#ifdef CONFIG_TRACER_MAX_TRACE
	if (type->use_max_tr) {
		tr->allocated_snapshot = false;

		/* Shrink the max buffer again */
		if (ring_buffer_expanded)
			ring_buffer_resize(tr->max_buffer.buffer, 1,
					   RING_BUFFER_ALL_CPUS);
	}
#endif

	printk(KERN_CONT "PASSED\n");
	return 0;
}
#else
/* Selftests are compiled out: every tracer passes trivially. */
static inline int run_tracer_selftest(struct tracer *type)
{
	return 0;
}
#endif /* CONFIG_FTRACE_STARTUP_TEST */
0d5c6e1c 1214
41d9c0be
SRRH
1215static void add_tracer_options(struct trace_array *tr, struct tracer *t);
1216
a4d1e688
JW
1217static void __init apply_trace_boot_options(void);
1218
4fcdae83
SR
1219/**
1220 * register_tracer - register a tracer with the ftrace system.
1221 * @type - the plugin for the tracer
1222 *
1223 * Register a new plugin tracer.
1224 */
a4d1e688 1225int __init register_tracer(struct tracer *type)
bc0c38d1
SR
1226{
1227 struct tracer *t;
bc0c38d1
SR
1228 int ret = 0;
1229
1230 if (!type->name) {
1231 pr_info("Tracer must have a name\n");
1232 return -1;
1233 }
1234
24a461d5 1235 if (strlen(type->name) >= MAX_TRACER_SIZE) {
ee6c2c1b
LZ
1236 pr_info("Tracer has a name longer than %d\n", MAX_TRACER_SIZE);
1237 return -1;
1238 }
1239
bc0c38d1 1240 mutex_lock(&trace_types_lock);
86fa2f60 1241
8e1b82e0
FW
1242 tracing_selftest_running = true;
1243
bc0c38d1
SR
1244 for (t = trace_types; t; t = t->next) {
1245 if (strcmp(type->name, t->name) == 0) {
1246 /* already found */
ee6c2c1b 1247 pr_info("Tracer %s already registered\n",
bc0c38d1
SR
1248 type->name);
1249 ret = -1;
1250 goto out;
1251 }
1252 }
1253
adf9f195
FW
1254 if (!type->set_flag)
1255 type->set_flag = &dummy_set_flag;
d39cdd20
CH
1256 if (!type->flags) {
1257 /*allocate a dummy tracer_flags*/
1258 type->flags = kmalloc(sizeof(*type->flags), GFP_KERNEL);
c8ca003b
CH
1259 if (!type->flags) {
1260 ret = -ENOMEM;
1261 goto out;
1262 }
d39cdd20
CH
1263 type->flags->val = 0;
1264 type->flags->opts = dummy_tracer_opt;
1265 } else
adf9f195
FW
1266 if (!type->flags->opts)
1267 type->flags->opts = dummy_tracer_opt;
6eaaa5d5 1268
d39cdd20
CH
1269 /* store the tracer for __set_tracer_option */
1270 type->flags->trace = type;
1271
f4e781c0
SRRH
1272 ret = run_tracer_selftest(type);
1273 if (ret < 0)
1274 goto out;
60a11774 1275
bc0c38d1
SR
1276 type->next = trace_types;
1277 trace_types = type;
41d9c0be 1278 add_tracer_options(&global_trace, type);
60a11774 1279
bc0c38d1 1280 out:
8e1b82e0 1281 tracing_selftest_running = false;
bc0c38d1
SR
1282 mutex_unlock(&trace_types_lock);
1283
dac74940
SR
1284 if (ret || !default_bootup_tracer)
1285 goto out_unlock;
1286
ee6c2c1b 1287 if (strncmp(default_bootup_tracer, type->name, MAX_TRACER_SIZE))
dac74940
SR
1288 goto out_unlock;
1289
1290 printk(KERN_INFO "Starting tracer '%s'\n", type->name);
1291 /* Do we want this tracer to start on bootup? */
607e2ea1 1292 tracing_set_tracer(&global_trace, type->name);
dac74940 1293 default_bootup_tracer = NULL;
a4d1e688
JW
1294
1295 apply_trace_boot_options();
1296
dac74940 1297 /* disable other selftests, since this will break it. */
55034cd6 1298 tracing_selftest_disabled = true;
b2821ae6 1299#ifdef CONFIG_FTRACE_STARTUP_TEST
dac74940
SR
1300 printk(KERN_INFO "Disabling FTRACE selftests due to running tracer '%s'\n",
1301 type->name);
b2821ae6 1302#endif
b2821ae6 1303
dac74940 1304 out_unlock:
bc0c38d1
SR
1305 return ret;
1306}
1307
12883efb 1308void tracing_reset(struct trace_buffer *buf, int cpu)
f633903a 1309{
12883efb 1310 struct ring_buffer *buffer = buf->buffer;
f633903a 1311
a5416411
HT
1312 if (!buffer)
1313 return;
1314
f633903a
SR
1315 ring_buffer_record_disable(buffer);
1316
1317 /* Make sure all commits have finished */
1318 synchronize_sched();
68179686 1319 ring_buffer_reset_cpu(buffer, cpu);
f633903a
SR
1320
1321 ring_buffer_record_enable(buffer);
1322}
1323
12883efb 1324void tracing_reset_online_cpus(struct trace_buffer *buf)
213cc060 1325{
12883efb 1326 struct ring_buffer *buffer = buf->buffer;
213cc060
PE
1327 int cpu;
1328
a5416411
HT
1329 if (!buffer)
1330 return;
1331
621968cd
SR
1332 ring_buffer_record_disable(buffer);
1333
1334 /* Make sure all commits have finished */
1335 synchronize_sched();
1336
9457158b 1337 buf->time_start = buffer_ftrace_now(buf, buf->cpu);
213cc060
PE
1338
1339 for_each_online_cpu(cpu)
68179686 1340 ring_buffer_reset_cpu(buffer, cpu);
621968cd
SR
1341
1342 ring_buffer_record_enable(buffer);
213cc060
PE
1343}
1344
09d8091c 1345/* Must have trace_types_lock held */
873c642f 1346void tracing_reset_all_online_cpus(void)
9456f0fa 1347{
873c642f
SRRH
1348 struct trace_array *tr;
1349
873c642f 1350 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
12883efb
SRRH
1351 tracing_reset_online_cpus(&tr->trace_buffer);
1352#ifdef CONFIG_TRACER_MAX_TRACE
1353 tracing_reset_online_cpus(&tr->max_buffer);
1354#endif
873c642f 1355 }
9456f0fa
SR
1356}
1357
939c7a4f 1358#define SAVED_CMDLINES_DEFAULT 128
2c7eea4c 1359#define NO_CMDLINE_MAP UINT_MAX
edc35bd7 1360static arch_spinlock_t trace_cmdline_lock = __ARCH_SPIN_LOCK_UNLOCKED;
939c7a4f
YY
1361struct saved_cmdlines_buffer {
1362 unsigned map_pid_to_cmdline[PID_MAX_DEFAULT+1];
1363 unsigned *map_cmdline_to_pid;
1364 unsigned cmdline_num;
1365 int cmdline_idx;
1366 char *saved_cmdlines;
1367};
1368static struct saved_cmdlines_buffer *savedcmd;
25b0b44a 1369
25b0b44a 1370/* temporary disable recording */
4fd27358 1371static atomic_t trace_record_cmdline_disabled __read_mostly;
bc0c38d1 1372
939c7a4f
YY
1373static inline char *get_saved_cmdlines(int idx)
1374{
1375 return &savedcmd->saved_cmdlines[idx * TASK_COMM_LEN];
1376}
1377
1378static inline void set_cmdline(int idx, const char *cmdline)
bc0c38d1 1379{
939c7a4f
YY
1380 memcpy(get_saved_cmdlines(idx), cmdline, TASK_COMM_LEN);
1381}
1382
1383static int allocate_cmdlines_buffer(unsigned int val,
1384 struct saved_cmdlines_buffer *s)
1385{
1386 s->map_cmdline_to_pid = kmalloc(val * sizeof(*s->map_cmdline_to_pid),
1387 GFP_KERNEL);
1388 if (!s->map_cmdline_to_pid)
1389 return -ENOMEM;
1390
1391 s->saved_cmdlines = kmalloc(val * TASK_COMM_LEN, GFP_KERNEL);
1392 if (!s->saved_cmdlines) {
1393 kfree(s->map_cmdline_to_pid);
1394 return -ENOMEM;
1395 }
1396
1397 s->cmdline_idx = 0;
1398 s->cmdline_num = val;
1399 memset(&s->map_pid_to_cmdline, NO_CMDLINE_MAP,
1400 sizeof(s->map_pid_to_cmdline));
1401 memset(s->map_cmdline_to_pid, NO_CMDLINE_MAP,
1402 val * sizeof(*s->map_cmdline_to_pid));
1403
1404 return 0;
1405}
1406
1407static int trace_create_savedcmd(void)
1408{
1409 int ret;
1410
a6af8fbf 1411 savedcmd = kmalloc(sizeof(*savedcmd), GFP_KERNEL);
939c7a4f
YY
1412 if (!savedcmd)
1413 return -ENOMEM;
1414
1415 ret = allocate_cmdlines_buffer(SAVED_CMDLINES_DEFAULT, savedcmd);
1416 if (ret < 0) {
1417 kfree(savedcmd);
1418 savedcmd = NULL;
1419 return -ENOMEM;
1420 }
1421
1422 return 0;
bc0c38d1
SR
1423}
1424
b5130b1e
CE
1425int is_tracing_stopped(void)
1426{
2b6080f2 1427 return global_trace.stop_count;
b5130b1e
CE
1428}
1429
0f048701
SR
1430/**
1431 * tracing_start - quick start of the tracer
1432 *
1433 * If tracing is enabled but was stopped by tracing_stop,
1434 * this will start the tracer back up.
1435 */
1436void tracing_start(void)
1437{
1438 struct ring_buffer *buffer;
1439 unsigned long flags;
1440
1441 if (tracing_disabled)
1442 return;
1443
2b6080f2
SR
1444 raw_spin_lock_irqsave(&global_trace.start_lock, flags);
1445 if (--global_trace.stop_count) {
1446 if (global_trace.stop_count < 0) {
b06a8301
SR
1447 /* Someone screwed up their debugging */
1448 WARN_ON_ONCE(1);
2b6080f2 1449 global_trace.stop_count = 0;
b06a8301 1450 }
0f048701
SR
1451 goto out;
1452 }
1453
a2f80714 1454 /* Prevent the buffers from switching */
0b9b12c1 1455 arch_spin_lock(&global_trace.max_lock);
0f048701 1456
12883efb 1457 buffer = global_trace.trace_buffer.buffer;
0f048701
SR
1458 if (buffer)
1459 ring_buffer_record_enable(buffer);
1460
12883efb
SRRH
1461#ifdef CONFIG_TRACER_MAX_TRACE
1462 buffer = global_trace.max_buffer.buffer;
0f048701
SR
1463 if (buffer)
1464 ring_buffer_record_enable(buffer);
12883efb 1465#endif
0f048701 1466
0b9b12c1 1467 arch_spin_unlock(&global_trace.max_lock);
a2f80714 1468
0f048701 1469 out:
2b6080f2
SR
1470 raw_spin_unlock_irqrestore(&global_trace.start_lock, flags);
1471}
1472
1473static void tracing_start_tr(struct trace_array *tr)
1474{
1475 struct ring_buffer *buffer;
1476 unsigned long flags;
1477
1478 if (tracing_disabled)
1479 return;
1480
1481 /* If global, we need to also start the max tracer */
1482 if (tr->flags & TRACE_ARRAY_FL_GLOBAL)
1483 return tracing_start();
1484
1485 raw_spin_lock_irqsave(&tr->start_lock, flags);
1486
1487 if (--tr->stop_count) {
1488 if (tr->stop_count < 0) {
1489 /* Someone screwed up their debugging */
1490 WARN_ON_ONCE(1);
1491 tr->stop_count = 0;
1492 }
1493 goto out;
1494 }
1495
12883efb 1496 buffer = tr->trace_buffer.buffer;
2b6080f2
SR
1497 if (buffer)
1498 ring_buffer_record_enable(buffer);
1499
1500 out:
1501 raw_spin_unlock_irqrestore(&tr->start_lock, flags);
0f048701
SR
1502}
1503
1504/**
1505 * tracing_stop - quick stop of the tracer
1506 *
1507 * Light weight way to stop tracing. Use in conjunction with
1508 * tracing_start.
1509 */
1510void tracing_stop(void)
1511{
1512 struct ring_buffer *buffer;
1513 unsigned long flags;
1514
2b6080f2
SR
1515 raw_spin_lock_irqsave(&global_trace.start_lock, flags);
1516 if (global_trace.stop_count++)
0f048701
SR
1517 goto out;
1518
a2f80714 1519 /* Prevent the buffers from switching */
0b9b12c1 1520 arch_spin_lock(&global_trace.max_lock);
a2f80714 1521
12883efb 1522 buffer = global_trace.trace_buffer.buffer;
0f048701
SR
1523 if (buffer)
1524 ring_buffer_record_disable(buffer);
1525
12883efb
SRRH
1526#ifdef CONFIG_TRACER_MAX_TRACE
1527 buffer = global_trace.max_buffer.buffer;
0f048701
SR
1528 if (buffer)
1529 ring_buffer_record_disable(buffer);
12883efb 1530#endif
0f048701 1531
0b9b12c1 1532 arch_spin_unlock(&global_trace.max_lock);
a2f80714 1533
0f048701 1534 out:
2b6080f2
SR
1535 raw_spin_unlock_irqrestore(&global_trace.start_lock, flags);
1536}
1537
1538static void tracing_stop_tr(struct trace_array *tr)
1539{
1540 struct ring_buffer *buffer;
1541 unsigned long flags;
1542
1543 /* If global, we need to also stop the max tracer */
1544 if (tr->flags & TRACE_ARRAY_FL_GLOBAL)
1545 return tracing_stop();
1546
1547 raw_spin_lock_irqsave(&tr->start_lock, flags);
1548 if (tr->stop_count++)
1549 goto out;
1550
12883efb 1551 buffer = tr->trace_buffer.buffer;
2b6080f2
SR
1552 if (buffer)
1553 ring_buffer_record_disable(buffer);
1554
1555 out:
1556 raw_spin_unlock_irqrestore(&tr->start_lock, flags);
0f048701
SR
1557}
1558
e309b41d 1559void trace_stop_cmdline_recording(void);
bc0c38d1 1560
379cfdac 1561static int trace_save_cmdline(struct task_struct *tsk)
bc0c38d1 1562{
a635cf04 1563 unsigned pid, idx;
bc0c38d1
SR
1564
1565 if (!tsk->pid || unlikely(tsk->pid > PID_MAX_DEFAULT))
379cfdac 1566 return 0;
bc0c38d1
SR
1567
1568 /*
1569 * It's not the end of the world if we don't get
1570 * the lock, but we also don't want to spin
1571 * nor do we want to disable interrupts,
1572 * so if we miss here, then better luck next time.
1573 */
0199c4e6 1574 if (!arch_spin_trylock(&trace_cmdline_lock))
379cfdac 1575 return 0;
bc0c38d1 1576
939c7a4f 1577 idx = savedcmd->map_pid_to_cmdline[tsk->pid];
2c7eea4c 1578 if (idx == NO_CMDLINE_MAP) {
939c7a4f 1579 idx = (savedcmd->cmdline_idx + 1) % savedcmd->cmdline_num;
bc0c38d1 1580
a635cf04
CE
1581 /*
1582 * Check whether the cmdline buffer at idx has a pid
1583 * mapped. We are going to overwrite that entry so we
1584 * need to clear the map_pid_to_cmdline. Otherwise we
1585 * would read the new comm for the old pid.
1586 */
939c7a4f 1587 pid = savedcmd->map_cmdline_to_pid[idx];
a635cf04 1588 if (pid != NO_CMDLINE_MAP)
939c7a4f 1589 savedcmd->map_pid_to_cmdline[pid] = NO_CMDLINE_MAP;
bc0c38d1 1590
939c7a4f
YY
1591 savedcmd->map_cmdline_to_pid[idx] = tsk->pid;
1592 savedcmd->map_pid_to_cmdline[tsk->pid] = idx;
bc0c38d1 1593
939c7a4f 1594 savedcmd->cmdline_idx = idx;
bc0c38d1
SR
1595 }
1596
939c7a4f 1597 set_cmdline(idx, tsk->comm);
bc0c38d1 1598
0199c4e6 1599 arch_spin_unlock(&trace_cmdline_lock);
379cfdac
SRRH
1600
1601 return 1;
bc0c38d1
SR
1602}
1603
4c27e756 1604static void __trace_find_cmdline(int pid, char comm[])
bc0c38d1 1605{
bc0c38d1
SR
1606 unsigned map;
1607
4ca53085
SR
1608 if (!pid) {
1609 strcpy(comm, "<idle>");
1610 return;
1611 }
bc0c38d1 1612
74bf4076
SR
1613 if (WARN_ON_ONCE(pid < 0)) {
1614 strcpy(comm, "<XXX>");
1615 return;
1616 }
1617
4ca53085
SR
1618 if (pid > PID_MAX_DEFAULT) {
1619 strcpy(comm, "<...>");
1620 return;
1621 }
bc0c38d1 1622
939c7a4f 1623 map = savedcmd->map_pid_to_cmdline[pid];
50d88758 1624 if (map != NO_CMDLINE_MAP)
939c7a4f 1625 strcpy(comm, get_saved_cmdlines(map));
50d88758
TG
1626 else
1627 strcpy(comm, "<...>");
4c27e756
SRRH
1628}
1629
1630void trace_find_cmdline(int pid, char comm[])
1631{
1632 preempt_disable();
1633 arch_spin_lock(&trace_cmdline_lock);
1634
1635 __trace_find_cmdline(pid, comm);
bc0c38d1 1636
0199c4e6 1637 arch_spin_unlock(&trace_cmdline_lock);
5b6045a9 1638 preempt_enable();
bc0c38d1
SR
1639}
1640
e309b41d 1641void tracing_record_cmdline(struct task_struct *tsk)
bc0c38d1 1642{
0fb9656d 1643 if (atomic_read(&trace_record_cmdline_disabled) || !tracing_is_on())
bc0c38d1
SR
1644 return;
1645
7ffbd48d
SR
1646 if (!__this_cpu_read(trace_cmdline_save))
1647 return;
1648
379cfdac
SRRH
1649 if (trace_save_cmdline(tsk))
1650 __this_cpu_write(trace_cmdline_save, false);
bc0c38d1
SR
1651}
1652
45dcd8b8 1653void
38697053
SR
1654tracing_generic_entry_update(struct trace_entry *entry, unsigned long flags,
1655 int pc)
bc0c38d1
SR
1656{
1657 struct task_struct *tsk = current;
bc0c38d1 1658
777e208d
SR
1659 entry->preempt_count = pc & 0xff;
1660 entry->pid = (tsk) ? tsk->pid : 0;
1661 entry->flags =
9244489a 1662#ifdef CONFIG_TRACE_IRQFLAGS_SUPPORT
2e2ca155 1663 (irqs_disabled_flags(flags) ? TRACE_FLAG_IRQS_OFF : 0) |
9244489a
SR
1664#else
1665 TRACE_FLAG_IRQS_NOSUPPORT |
1666#endif
7e6867bf 1667 ((pc & NMI_MASK ) ? TRACE_FLAG_NMI : 0) |
bc0c38d1
SR
1668 ((pc & HARDIRQ_MASK) ? TRACE_FLAG_HARDIRQ : 0) |
1669 ((pc & SOFTIRQ_MASK) ? TRACE_FLAG_SOFTIRQ : 0) |
e5137b50
PZ
1670 (tif_need_resched() ? TRACE_FLAG_NEED_RESCHED : 0) |
1671 (test_preempt_need_resched() ? TRACE_FLAG_PREEMPT_RESCHED : 0);
bc0c38d1 1672}
f413cdb8 1673EXPORT_SYMBOL_GPL(tracing_generic_entry_update);
bc0c38d1 1674
e77405ad
SR
1675struct ring_buffer_event *
1676trace_buffer_lock_reserve(struct ring_buffer *buffer,
1677 int type,
1678 unsigned long len,
1679 unsigned long flags, int pc)
51a763dd
ACM
1680{
1681 struct ring_buffer_event *event;
1682
e77405ad 1683 event = ring_buffer_lock_reserve(buffer, len);
51a763dd
ACM
1684 if (event != NULL) {
1685 struct trace_entry *ent = ring_buffer_event_data(event);
1686
1687 tracing_generic_entry_update(ent, flags, pc);
1688 ent->type = type;
1689 }
1690
1691 return event;
1692}
51a763dd 1693
7ffbd48d
SR
1694void
1695__buffer_unlock_commit(struct ring_buffer *buffer, struct ring_buffer_event *event)
1696{
1697 __this_cpu_write(trace_cmdline_save, true);
1698 ring_buffer_unlock_commit(buffer, event);
1699}
1700
b7f0c959
SRRH
1701void trace_buffer_unlock_commit(struct trace_array *tr,
1702 struct ring_buffer *buffer,
1703 struct ring_buffer_event *event,
1704 unsigned long flags, int pc)
51a763dd 1705{
7ffbd48d 1706 __buffer_unlock_commit(buffer, event);
51a763dd 1707
2d34f489 1708 ftrace_trace_stack(tr, buffer, flags, 6, pc, NULL);
e77405ad 1709 ftrace_trace_userstack(buffer, flags, pc);
07edf712 1710}
0d5c6e1c 1711EXPORT_SYMBOL_GPL(trace_buffer_unlock_commit);
51a763dd 1712
2c4a33ab
SRRH
1713static struct ring_buffer *temp_buffer;
1714
ccb469a1
SR
1715struct ring_buffer_event *
1716trace_event_buffer_lock_reserve(struct ring_buffer **current_rb,
7f1d2f82 1717 struct trace_event_file *trace_file,
ccb469a1
SR
1718 int type, unsigned long len,
1719 unsigned long flags, int pc)
1720{
2c4a33ab
SRRH
1721 struct ring_buffer_event *entry;
1722
7f1d2f82 1723 *current_rb = trace_file->tr->trace_buffer.buffer;
2c4a33ab 1724 entry = trace_buffer_lock_reserve(*current_rb,
ccb469a1 1725 type, len, flags, pc);
2c4a33ab
SRRH
1726 /*
1727 * If tracing is off, but we have triggers enabled
1728 * we still need to look at the event data. Use the temp_buffer
1729 * to store the trace event for the tigger to use. It's recusive
1730 * safe and will not be recorded anywhere.
1731 */
5d6ad960 1732 if (!entry && trace_file->flags & EVENT_FILE_FL_TRIGGER_COND) {
2c4a33ab
SRRH
1733 *current_rb = temp_buffer;
1734 entry = trace_buffer_lock_reserve(*current_rb,
1735 type, len, flags, pc);
1736 }
1737 return entry;
ccb469a1
SR
1738}
1739EXPORT_SYMBOL_GPL(trace_event_buffer_lock_reserve);
1740
ef5580d0 1741struct ring_buffer_event *
e77405ad
SR
1742trace_current_buffer_lock_reserve(struct ring_buffer **current_rb,
1743 int type, unsigned long len,
ef5580d0
SR
1744 unsigned long flags, int pc)
1745{
12883efb 1746 *current_rb = global_trace.trace_buffer.buffer;
e77405ad 1747 return trace_buffer_lock_reserve(*current_rb,
ef5580d0
SR
1748 type, len, flags, pc);
1749}
94487d6d 1750EXPORT_SYMBOL_GPL(trace_current_buffer_lock_reserve);
ef5580d0 1751
b7f0c959
SRRH
/*
 * Variant of trace_buffer_unlock_commit() for callers that have @regs:
 * commit @event to @buffer, then let the kernel stack tracer work from
 * @regs (no frames skipped) and the user stack tracer run as usual.
 */
void trace_buffer_unlock_commit_regs(struct trace_array *tr,
				     struct ring_buffer *buffer,
				     struct ring_buffer_event *event,
				     unsigned long flags, int pc,
				     struct pt_regs *regs)
{
	__buffer_unlock_commit(buffer, event);

	ftrace_trace_stack(tr, buffer, flags, 0, pc, regs);
	ftrace_trace_userstack(buffer, flags, pc);
}
EXPORT_SYMBOL_GPL(trace_buffer_unlock_commit_regs);
1fd8df2c 1764
e77405ad
SR
/* Discard a reserved @event on @buffer instead of committing it. */
void trace_current_buffer_discard_commit(struct ring_buffer *buffer,
					 struct ring_buffer_event *event)
{
	ring_buffer_discard_commit(buffer, event);
}
EXPORT_SYMBOL_GPL(trace_current_buffer_discard_commit);
ef5580d0 1771
e309b41d 1772void
7be42151 1773trace_function(struct trace_array *tr,
38697053
SR
1774 unsigned long ip, unsigned long parent_ip, unsigned long flags,
1775 int pc)
bc0c38d1 1776{
2425bcb9 1777 struct trace_event_call *call = &event_function;
12883efb 1778 struct ring_buffer *buffer = tr->trace_buffer.buffer;
3928a8a2 1779 struct ring_buffer_event *event;
777e208d 1780 struct ftrace_entry *entry;
bc0c38d1 1781
e77405ad 1782 event = trace_buffer_lock_reserve(buffer, TRACE_FN, sizeof(*entry),
51a763dd 1783 flags, pc);
3928a8a2
SR
1784 if (!event)
1785 return;
1786 entry = ring_buffer_event_data(event);
777e208d
SR
1787 entry->ip = ip;
1788 entry->parent_ip = parent_ip;
e1112b4d 1789
f306cc82 1790 if (!call_filter_check_discard(call, entry, buffer, event))
7ffbd48d 1791 __buffer_unlock_commit(buffer, event);
bc0c38d1
SR
1792}
1793
c0a0d0d3 1794#ifdef CONFIG_STACKTRACE
4a9bd3f1
SR
1795
1796#define FTRACE_STACK_MAX_ENTRIES (PAGE_SIZE / sizeof(unsigned long))
1797struct ftrace_stack {
1798 unsigned long calls[FTRACE_STACK_MAX_ENTRIES];
1799};
1800
1801static DEFINE_PER_CPU(struct ftrace_stack, ftrace_stack);
1802static DEFINE_PER_CPU(int, ftrace_stack_reserve);
1803
e77405ad 1804static void __ftrace_trace_stack(struct ring_buffer *buffer,
53614991 1805 unsigned long flags,
1fd8df2c 1806 int skip, int pc, struct pt_regs *regs)
86387f7e 1807{
2425bcb9 1808 struct trace_event_call *call = &event_kernel_stack;
3928a8a2 1809 struct ring_buffer_event *event;
777e208d 1810 struct stack_entry *entry;
86387f7e 1811 struct stack_trace trace;
4a9bd3f1
SR
1812 int use_stack;
1813 int size = FTRACE_STACK_ENTRIES;
1814
1815 trace.nr_entries = 0;
1816 trace.skip = skip;
1817
1818 /*
1819 * Since events can happen in NMIs there's no safe way to
1820 * use the per cpu ftrace_stacks. We reserve it and if an interrupt
1821 * or NMI comes in, it will just have to use the default
1822 * FTRACE_STACK_SIZE.
1823 */
1824 preempt_disable_notrace();
1825
82146529 1826 use_stack = __this_cpu_inc_return(ftrace_stack_reserve);
4a9bd3f1
SR
1827 /*
1828 * We don't need any atomic variables, just a barrier.
1829 * If an interrupt comes in, we don't care, because it would
1830 * have exited and put the counter back to what we want.
1831 * We just need a barrier to keep gcc from moving things
1832 * around.
1833 */
1834 barrier();
1835 if (use_stack == 1) {
bdffd893 1836 trace.entries = this_cpu_ptr(ftrace_stack.calls);
4a9bd3f1
SR
1837 trace.max_entries = FTRACE_STACK_MAX_ENTRIES;
1838
1839 if (regs)
1840 save_stack_trace_regs(regs, &trace);
1841 else
1842 save_stack_trace(&trace);
1843
1844 if (trace.nr_entries > size)
1845 size = trace.nr_entries;
1846 } else
1847 /* From now on, use_stack is a boolean */
1848 use_stack = 0;
1849
1850 size *= sizeof(unsigned long);
86387f7e 1851
e77405ad 1852 event = trace_buffer_lock_reserve(buffer, TRACE_STACK,
4a9bd3f1 1853 sizeof(*entry) + size, flags, pc);
3928a8a2 1854 if (!event)
4a9bd3f1
SR
1855 goto out;
1856 entry = ring_buffer_event_data(event);
86387f7e 1857
4a9bd3f1
SR
1858 memset(&entry->caller, 0, size);
1859
1860 if (use_stack)
1861 memcpy(&entry->caller, trace.entries,
1862 trace.nr_entries * sizeof(unsigned long));
1863 else {
1864 trace.max_entries = FTRACE_STACK_ENTRIES;
1865 trace.entries = entry->caller;
1866 if (regs)
1867 save_stack_trace_regs(regs, &trace);
1868 else
1869 save_stack_trace(&trace);
1870 }
1871
1872 entry->size = trace.nr_entries;
86387f7e 1873
f306cc82 1874 if (!call_filter_check_discard(call, entry, buffer, event))
7ffbd48d 1875 __buffer_unlock_commit(buffer, event);
4a9bd3f1
SR
1876
1877 out:
1878 /* Again, don't let gcc optimize things here */
1879 barrier();
82146529 1880 __this_cpu_dec(ftrace_stack_reserve);
4a9bd3f1
SR
1881 preempt_enable_notrace();
1882
f0a920d5
IM
1883}
1884
2d34f489
SRRH
1885static inline void ftrace_trace_stack(struct trace_array *tr,
1886 struct ring_buffer *buffer,
73dddbb5
SRRH
1887 unsigned long flags,
1888 int skip, int pc, struct pt_regs *regs)
53614991 1889{
2d34f489 1890 if (!(tr->trace_flags & TRACE_ITER_STACKTRACE))
53614991
SR
1891 return;
1892
73dddbb5 1893 __ftrace_trace_stack(buffer, flags, skip, pc, regs);
53614991
SR
1894}
1895
c0a0d0d3
FW
1896void __trace_stack(struct trace_array *tr, unsigned long flags, int skip,
1897 int pc)
38697053 1898{
12883efb 1899 __ftrace_trace_stack(tr->trace_buffer.buffer, flags, skip, pc, NULL);
38697053
SR
1900}
1901
03889384
SR
1902/**
1903 * trace_dump_stack - record a stack back trace in the trace buffer
c142be8e 1904 * @skip: Number of functions to skip (helper handlers)
03889384 1905 */
c142be8e 1906void trace_dump_stack(int skip)
03889384
SR
1907{
1908 unsigned long flags;
1909
1910 if (tracing_disabled || tracing_selftest_running)
e36c5458 1911 return;
03889384
SR
1912
1913 local_save_flags(flags);
1914
c142be8e
SRRH
1915 /*
1916 * Skip 3 more, seems to get us at the caller of
1917 * this function.
1918 */
1919 skip += 3;
1920 __ftrace_trace_stack(global_trace.trace_buffer.buffer,
1921 flags, skip, preempt_count(), NULL);
03889384
SR
1922}
1923
91e86e56
SR
1924static DEFINE_PER_CPU(int, user_stack_count);
1925
e77405ad
SR
1926void
1927ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc)
02b67518 1928{
2425bcb9 1929 struct trace_event_call *call = &event_user_stack;
8d7c6a96 1930 struct ring_buffer_event *event;
02b67518
TE
1931 struct userstack_entry *entry;
1932 struct stack_trace trace;
02b67518 1933
983f938a 1934 if (!(global_trace.trace_flags & TRACE_ITER_USERSTACKTRACE))
02b67518
TE
1935 return;
1936
b6345879
SR
1937 /*
1938 * NMIs can not handle page faults, even with fix ups.
1939 * The save user stack can (and often does) fault.
1940 */
1941 if (unlikely(in_nmi()))
1942 return;
02b67518 1943
91e86e56
SR
1944 /*
1945 * prevent recursion, since the user stack tracing may
1946 * trigger other kernel events.
1947 */
1948 preempt_disable();
1949 if (__this_cpu_read(user_stack_count))
1950 goto out;
1951
1952 __this_cpu_inc(user_stack_count);
1953
e77405ad 1954 event = trace_buffer_lock_reserve(buffer, TRACE_USER_STACK,
51a763dd 1955 sizeof(*entry), flags, pc);
02b67518 1956 if (!event)
1dbd1951 1957 goto out_drop_count;
02b67518 1958 entry = ring_buffer_event_data(event);
02b67518 1959
48659d31 1960 entry->tgid = current->tgid;
02b67518
TE
1961 memset(&entry->caller, 0, sizeof(entry->caller));
1962
1963 trace.nr_entries = 0;
1964 trace.max_entries = FTRACE_STACK_ENTRIES;
1965 trace.skip = 0;
1966 trace.entries = entry->caller;
1967
1968 save_stack_trace_user(&trace);
f306cc82 1969 if (!call_filter_check_discard(call, entry, buffer, event))
7ffbd48d 1970 __buffer_unlock_commit(buffer, event);
91e86e56 1971
1dbd1951 1972 out_drop_count:
91e86e56 1973 __this_cpu_dec(user_stack_count);
91e86e56
SR
1974 out:
1975 preempt_enable();
02b67518
TE
1976}
1977
4fd27358
HE
#ifdef UNUSED
/*
 * Record the user-space stack of the current task in the trace buffer of
 * @tr. ftrace_trace_userstack() takes a ring buffer, not a trace array,
 * so hand it the array's trace buffer.
 */
static void __trace_userstack(struct trace_array *tr, unsigned long flags)
{
	ftrace_trace_userstack(tr->trace_buffer.buffer, flags, preempt_count());
}
#endif /* UNUSED */
02b67518 1984
c0a0d0d3
FW
1985#endif /* CONFIG_STACKTRACE */
1986
07d777fe
SR
1987/* created for use with alloc_percpu */
1988struct trace_buffer_struct {
1989 char buffer[TRACE_BUF_SIZE];
1990};
1991
1992static struct trace_buffer_struct *trace_percpu_buffer;
1993static struct trace_buffer_struct *trace_percpu_sirq_buffer;
1994static struct trace_buffer_struct *trace_percpu_irq_buffer;
1995static struct trace_buffer_struct *trace_percpu_nmi_buffer;
1996
1997/*
1998 * The buffer used is dependent on the context. There is a per cpu
1999 * buffer for normal context, softirq contex, hard irq context and
2000 * for NMI context. Thise allows for lockless recording.
2001 *
2002 * Note, if the buffers failed to be allocated, then this returns NULL
2003 */
2004static char *get_trace_buf(void)
2005{
2006 struct trace_buffer_struct *percpu_buffer;
07d777fe
SR
2007
2008 /*
2009 * If we have allocated per cpu buffers, then we do not
2010 * need to do any locking.
2011 */
2012 if (in_nmi())
2013 percpu_buffer = trace_percpu_nmi_buffer;
2014 else if (in_irq())
2015 percpu_buffer = trace_percpu_irq_buffer;
2016 else if (in_softirq())
2017 percpu_buffer = trace_percpu_sirq_buffer;
2018 else
2019 percpu_buffer = trace_percpu_buffer;
2020
2021 if (!percpu_buffer)
2022 return NULL;
2023
d8a0349c 2024 return this_cpu_ptr(&percpu_buffer->buffer[0]);
07d777fe
SR
2025}
2026
2027static int alloc_percpu_trace_buffer(void)
2028{
2029 struct trace_buffer_struct *buffers;
2030 struct trace_buffer_struct *sirq_buffers;
2031 struct trace_buffer_struct *irq_buffers;
2032 struct trace_buffer_struct *nmi_buffers;
2033
2034 buffers = alloc_percpu(struct trace_buffer_struct);
2035 if (!buffers)
2036 goto err_warn;
2037
2038 sirq_buffers = alloc_percpu(struct trace_buffer_struct);
2039 if (!sirq_buffers)
2040 goto err_sirq;
2041
2042 irq_buffers = alloc_percpu(struct trace_buffer_struct);
2043 if (!irq_buffers)
2044 goto err_irq;
2045
2046 nmi_buffers = alloc_percpu(struct trace_buffer_struct);
2047 if (!nmi_buffers)
2048 goto err_nmi;
2049
2050 trace_percpu_buffer = buffers;
2051 trace_percpu_sirq_buffer = sirq_buffers;
2052 trace_percpu_irq_buffer = irq_buffers;
2053 trace_percpu_nmi_buffer = nmi_buffers;
2054
2055 return 0;
2056
2057 err_nmi:
2058 free_percpu(irq_buffers);
2059 err_irq:
2060 free_percpu(sirq_buffers);
2061 err_sirq:
2062 free_percpu(buffers);
2063 err_warn:
2064 WARN(1, "Could not allocate percpu trace_printk buffer");
2065 return -ENOMEM;
2066}
2067
81698831
SR
2068static int buffers_allocated;
2069
07d777fe
SR
2070void trace_printk_init_buffers(void)
2071{
07d777fe
SR
2072 if (buffers_allocated)
2073 return;
2074
2075 if (alloc_percpu_trace_buffer())
2076 return;
2077
2184db46
SR
2078 /* trace_printk() is for debug use only. Don't use it in production. */
2079
a395d6a7
JP
2080 pr_warn("\n");
2081 pr_warn("**********************************************************\n");
2082 pr_warn("** NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE **\n");
2083 pr_warn("** **\n");
2084 pr_warn("** trace_printk() being used. Allocating extra memory. **\n");
2085 pr_warn("** **\n");
2086 pr_warn("** This means that this is a DEBUG kernel and it is **\n");
2087 pr_warn("** unsafe for production use. **\n");
2088 pr_warn("** **\n");
2089 pr_warn("** If you see this message and you are not debugging **\n");
2090 pr_warn("** the kernel, report this immediately to your vendor! **\n");
2091 pr_warn("** **\n");
2092 pr_warn("** NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE **\n");
2093 pr_warn("**********************************************************\n");
07d777fe 2094
b382ede6
SR
2095 /* Expand the buffers to set size */
2096 tracing_update_buffers();
2097
07d777fe 2098 buffers_allocated = 1;
81698831
SR
2099
2100 /*
2101 * trace_printk_init_buffers() can be called by modules.
2102 * If that happens, then we need to start cmdline recording
2103 * directly here. If the global_trace.buffer is already
2104 * allocated here, then this was called by module code.
2105 */
12883efb 2106 if (global_trace.trace_buffer.buffer)
81698831
SR
2107 tracing_start_cmdline_record();
2108}
2109
2110void trace_printk_start_comm(void)
2111{
2112 /* Start tracing comms if trace printk is set */
2113 if (!buffers_allocated)
2114 return;
2115 tracing_start_cmdline_record();
2116}
2117
2118static void trace_printk_start_stop_comm(int enabled)
2119{
2120 if (!buffers_allocated)
2121 return;
2122
2123 if (enabled)
2124 tracing_start_cmdline_record();
2125 else
2126 tracing_stop_cmdline_record();
07d777fe
SR
2127}
2128
769b0441 2129/**
48ead020 2130 * trace_vbprintk - write binary msg to tracing buffer
769b0441
FW
2131 *
2132 */
40ce74f1 2133int trace_vbprintk(unsigned long ip, const char *fmt, va_list args)
769b0441 2134{
2425bcb9 2135 struct trace_event_call *call = &event_bprint;
769b0441 2136 struct ring_buffer_event *event;
e77405ad 2137 struct ring_buffer *buffer;
769b0441 2138 struct trace_array *tr = &global_trace;
48ead020 2139 struct bprint_entry *entry;
769b0441 2140 unsigned long flags;
07d777fe
SR
2141 char *tbuffer;
2142 int len = 0, size, pc;
769b0441
FW
2143
2144 if (unlikely(tracing_selftest_running || tracing_disabled))
2145 return 0;
2146
2147 /* Don't pollute graph traces with trace_vprintk internals */
2148 pause_graph_tracing();
2149
2150 pc = preempt_count();
5168ae50 2151 preempt_disable_notrace();
769b0441 2152
07d777fe
SR
2153 tbuffer = get_trace_buf();
2154 if (!tbuffer) {
2155 len = 0;
769b0441 2156 goto out;
07d777fe 2157 }
769b0441 2158
07d777fe 2159 len = vbin_printf((u32 *)tbuffer, TRACE_BUF_SIZE/sizeof(int), fmt, args);
769b0441 2160
07d777fe
SR
2161 if (len > TRACE_BUF_SIZE/sizeof(int) || len < 0)
2162 goto out;
769b0441 2163
07d777fe 2164 local_save_flags(flags);
769b0441 2165 size = sizeof(*entry) + sizeof(u32) * len;
12883efb 2166 buffer = tr->trace_buffer.buffer;
e77405ad
SR
2167 event = trace_buffer_lock_reserve(buffer, TRACE_BPRINT, size,
2168 flags, pc);
769b0441 2169 if (!event)
07d777fe 2170 goto out;
769b0441
FW
2171 entry = ring_buffer_event_data(event);
2172 entry->ip = ip;
769b0441
FW
2173 entry->fmt = fmt;
2174
07d777fe 2175 memcpy(entry->buf, tbuffer, sizeof(u32) * len);
f306cc82 2176 if (!call_filter_check_discard(call, entry, buffer, event)) {
7ffbd48d 2177 __buffer_unlock_commit(buffer, event);
2d34f489 2178 ftrace_trace_stack(tr, buffer, flags, 6, pc, NULL);
d931369b 2179 }
769b0441 2180
769b0441 2181out:
5168ae50 2182 preempt_enable_notrace();
769b0441
FW
2183 unpause_graph_tracing();
2184
2185 return len;
2186}
48ead020
FW
2187EXPORT_SYMBOL_GPL(trace_vbprintk);
2188
12883efb
SRRH
2189static int
2190__trace_array_vprintk(struct ring_buffer *buffer,
2191 unsigned long ip, const char *fmt, va_list args)
48ead020 2192{
2425bcb9 2193 struct trace_event_call *call = &event_print;
48ead020 2194 struct ring_buffer_event *event;
07d777fe 2195 int len = 0, size, pc;
48ead020 2196 struct print_entry *entry;
07d777fe
SR
2197 unsigned long flags;
2198 char *tbuffer;
48ead020
FW
2199
2200 if (tracing_disabled || tracing_selftest_running)
2201 return 0;
2202
07d777fe
SR
2203 /* Don't pollute graph traces with trace_vprintk internals */
2204 pause_graph_tracing();
2205
48ead020
FW
2206 pc = preempt_count();
2207 preempt_disable_notrace();
48ead020 2208
07d777fe
SR
2209
2210 tbuffer = get_trace_buf();
2211 if (!tbuffer) {
2212 len = 0;
48ead020 2213 goto out;
07d777fe 2214 }
48ead020 2215
3558a5ac 2216 len = vscnprintf(tbuffer, TRACE_BUF_SIZE, fmt, args);
48ead020 2217
07d777fe 2218 local_save_flags(flags);
48ead020 2219 size = sizeof(*entry) + len + 1;
e77405ad 2220 event = trace_buffer_lock_reserve(buffer, TRACE_PRINT, size,
07d777fe 2221 flags, pc);
48ead020 2222 if (!event)
07d777fe 2223 goto out;
48ead020 2224 entry = ring_buffer_event_data(event);
c13d2f7c 2225 entry->ip = ip;
48ead020 2226
3558a5ac 2227 memcpy(&entry->buf, tbuffer, len + 1);
f306cc82 2228 if (!call_filter_check_discard(call, entry, buffer, event)) {
7ffbd48d 2229 __buffer_unlock_commit(buffer, event);
2d34f489 2230 ftrace_trace_stack(&global_trace, buffer, flags, 6, pc, NULL);
d931369b 2231 }
48ead020
FW
2232 out:
2233 preempt_enable_notrace();
07d777fe 2234 unpause_graph_tracing();
48ead020
FW
2235
2236 return len;
2237}
659372d3 2238
12883efb
SRRH
2239int trace_array_vprintk(struct trace_array *tr,
2240 unsigned long ip, const char *fmt, va_list args)
2241{
2242 return __trace_array_vprintk(tr->trace_buffer.buffer, ip, fmt, args);
2243}
2244
2245int trace_array_printk(struct trace_array *tr,
2246 unsigned long ip, const char *fmt, ...)
2247{
2248 int ret;
2249 va_list ap;
2250
983f938a 2251 if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
12883efb
SRRH
2252 return 0;
2253
2254 va_start(ap, fmt);
2255 ret = trace_array_vprintk(tr, ip, fmt, ap);
2256 va_end(ap);
2257 return ret;
2258}
2259
2260int trace_array_printk_buf(struct ring_buffer *buffer,
2261 unsigned long ip, const char *fmt, ...)
2262{
2263 int ret;
2264 va_list ap;
2265
983f938a 2266 if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
12883efb
SRRH
2267 return 0;
2268
2269 va_start(ap, fmt);
2270 ret = __trace_array_vprintk(buffer, ip, fmt, ap);
2271 va_end(ap);
2272 return ret;
2273}
2274
659372d3
SR
2275int trace_vprintk(unsigned long ip, const char *fmt, va_list args)
2276{
a813a159 2277 return trace_array_vprintk(&global_trace, ip, fmt, args);
659372d3 2278}
769b0441
FW
2279EXPORT_SYMBOL_GPL(trace_vprintk);
2280
e2ac8ef5 2281static void trace_iterator_increment(struct trace_iterator *iter)
5a90f577 2282{
6d158a81
SR
2283 struct ring_buffer_iter *buf_iter = trace_buffer_iter(iter, iter->cpu);
2284
5a90f577 2285 iter->idx++;
6d158a81
SR
2286 if (buf_iter)
2287 ring_buffer_read(buf_iter, NULL);
5a90f577
SR
2288}
2289
e309b41d 2290static struct trace_entry *
bc21b478
SR
2291peek_next_entry(struct trace_iterator *iter, int cpu, u64 *ts,
2292 unsigned long *lost_events)
dd0e545f 2293{
3928a8a2 2294 struct ring_buffer_event *event;
6d158a81 2295 struct ring_buffer_iter *buf_iter = trace_buffer_iter(iter, cpu);
dd0e545f 2296
d769041f
SR
2297 if (buf_iter)
2298 event = ring_buffer_iter_peek(buf_iter, ts);
2299 else
12883efb 2300 event = ring_buffer_peek(iter->trace_buffer->buffer, cpu, ts,
bc21b478 2301 lost_events);
d769041f 2302
4a9bd3f1
SR
2303 if (event) {
2304 iter->ent_size = ring_buffer_event_length(event);
2305 return ring_buffer_event_data(event);
2306 }
2307 iter->ent_size = 0;
2308 return NULL;
dd0e545f 2309}
d769041f 2310
dd0e545f 2311static struct trace_entry *
bc21b478
SR
2312__find_next_entry(struct trace_iterator *iter, int *ent_cpu,
2313 unsigned long *missing_events, u64 *ent_ts)
bc0c38d1 2314{
12883efb 2315 struct ring_buffer *buffer = iter->trace_buffer->buffer;
bc0c38d1 2316 struct trace_entry *ent, *next = NULL;
aa27497c 2317 unsigned long lost_events = 0, next_lost = 0;
b04cc6b1 2318 int cpu_file = iter->cpu_file;
3928a8a2 2319 u64 next_ts = 0, ts;
bc0c38d1 2320 int next_cpu = -1;
12b5da34 2321 int next_size = 0;
bc0c38d1
SR
2322 int cpu;
2323
b04cc6b1
FW
2324 /*
2325 * If we are in a per_cpu trace file, don't bother by iterating over
2326 * all cpu and peek directly.
2327 */
ae3b5093 2328 if (cpu_file > RING_BUFFER_ALL_CPUS) {
b04cc6b1
FW
2329 if (ring_buffer_empty_cpu(buffer, cpu_file))
2330 return NULL;
bc21b478 2331 ent = peek_next_entry(iter, cpu_file, ent_ts, missing_events);
b04cc6b1
FW
2332 if (ent_cpu)
2333 *ent_cpu = cpu_file;
2334
2335 return ent;
2336 }
2337
ab46428c 2338 for_each_tracing_cpu(cpu) {
dd0e545f 2339
3928a8a2
SR
2340 if (ring_buffer_empty_cpu(buffer, cpu))
2341 continue;
dd0e545f 2342
bc21b478 2343 ent = peek_next_entry(iter, cpu, &ts, &lost_events);
dd0e545f 2344
cdd31cd2
IM
2345 /*
2346 * Pick the entry with the smallest timestamp:
2347 */
3928a8a2 2348 if (ent && (!next || ts < next_ts)) {
bc0c38d1
SR
2349 next = ent;
2350 next_cpu = cpu;
3928a8a2 2351 next_ts = ts;
bc21b478 2352 next_lost = lost_events;
12b5da34 2353 next_size = iter->ent_size;
bc0c38d1
SR
2354 }
2355 }
2356
12b5da34
SR
2357 iter->ent_size = next_size;
2358
bc0c38d1
SR
2359 if (ent_cpu)
2360 *ent_cpu = next_cpu;
2361
3928a8a2
SR
2362 if (ent_ts)
2363 *ent_ts = next_ts;
2364
bc21b478
SR
2365 if (missing_events)
2366 *missing_events = next_lost;
2367
bc0c38d1
SR
2368 return next;
2369}
2370
dd0e545f 2371/* Find the next real entry, without updating the iterator itself */
c4a8e8be
FW
2372struct trace_entry *trace_find_next_entry(struct trace_iterator *iter,
2373 int *ent_cpu, u64 *ent_ts)
bc0c38d1 2374{
bc21b478 2375 return __find_next_entry(iter, ent_cpu, NULL, ent_ts);
dd0e545f
SR
2376}
2377
2378/* Find the next real entry, and increment the iterator to the next entry */
955b61e5 2379void *trace_find_next_entry_inc(struct trace_iterator *iter)
dd0e545f 2380{
bc21b478
SR
2381 iter->ent = __find_next_entry(iter, &iter->cpu,
2382 &iter->lost_events, &iter->ts);
dd0e545f 2383
3928a8a2 2384 if (iter->ent)
e2ac8ef5 2385 trace_iterator_increment(iter);
dd0e545f 2386
3928a8a2 2387 return iter->ent ? iter : NULL;
b3806b43 2388}
bc0c38d1 2389
e309b41d 2390static void trace_consume(struct trace_iterator *iter)
b3806b43 2391{
12883efb 2392 ring_buffer_consume(iter->trace_buffer->buffer, iter->cpu, &iter->ts,
bc21b478 2393 &iter->lost_events);
bc0c38d1
SR
2394}
2395
e309b41d 2396static void *s_next(struct seq_file *m, void *v, loff_t *pos)
bc0c38d1
SR
2397{
2398 struct trace_iterator *iter = m->private;
bc0c38d1 2399 int i = (int)*pos;
4e3c3333 2400 void *ent;
bc0c38d1 2401
a63ce5b3
SR
2402 WARN_ON_ONCE(iter->leftover);
2403
bc0c38d1
SR
2404 (*pos)++;
2405
2406 /* can't go backwards */
2407 if (iter->idx > i)
2408 return NULL;
2409
2410 if (iter->idx < 0)
955b61e5 2411 ent = trace_find_next_entry_inc(iter);
bc0c38d1
SR
2412 else
2413 ent = iter;
2414
2415 while (ent && iter->idx < i)
955b61e5 2416 ent = trace_find_next_entry_inc(iter);
bc0c38d1
SR
2417
2418 iter->pos = *pos;
2419
bc0c38d1
SR
2420 return ent;
2421}
2422
955b61e5 2423void tracing_iter_reset(struct trace_iterator *iter, int cpu)
2f26ebd5 2424{
2f26ebd5
SR
2425 struct ring_buffer_event *event;
2426 struct ring_buffer_iter *buf_iter;
2427 unsigned long entries = 0;
2428 u64 ts;
2429
12883efb 2430 per_cpu_ptr(iter->trace_buffer->data, cpu)->skipped_entries = 0;
2f26ebd5 2431
6d158a81
SR
2432 buf_iter = trace_buffer_iter(iter, cpu);
2433 if (!buf_iter)
2f26ebd5
SR
2434 return;
2435
2f26ebd5
SR
2436 ring_buffer_iter_reset(buf_iter);
2437
2438 /*
2439 * We could have the case with the max latency tracers
2440 * that a reset never took place on a cpu. This is evident
2441 * by the timestamp being before the start of the buffer.
2442 */
2443 while ((event = ring_buffer_iter_peek(buf_iter, &ts))) {
12883efb 2444 if (ts >= iter->trace_buffer->time_start)
2f26ebd5
SR
2445 break;
2446 entries++;
2447 ring_buffer_read(buf_iter, NULL);
2448 }
2449
12883efb 2450 per_cpu_ptr(iter->trace_buffer->data, cpu)->skipped_entries = entries;
2f26ebd5
SR
2451}
2452
d7350c3f 2453/*
d7350c3f
FW
2454 * The current tracer is copied to avoid a global locking
2455 * all around.
2456 */
bc0c38d1
SR
2457static void *s_start(struct seq_file *m, loff_t *pos)
2458{
2459 struct trace_iterator *iter = m->private;
2b6080f2 2460 struct trace_array *tr = iter->tr;
b04cc6b1 2461 int cpu_file = iter->cpu_file;
bc0c38d1
SR
2462 void *p = NULL;
2463 loff_t l = 0;
3928a8a2 2464 int cpu;
bc0c38d1 2465
2fd196ec
HT
2466 /*
2467 * copy the tracer to avoid using a global lock all around.
2468 * iter->trace is a copy of current_trace, the pointer to the
2469 * name may be used instead of a strcmp(), as iter->trace->name
2470 * will point to the same string as current_trace->name.
2471 */
bc0c38d1 2472 mutex_lock(&trace_types_lock);
2b6080f2
SR
2473 if (unlikely(tr->current_trace && iter->trace->name != tr->current_trace->name))
2474 *iter->trace = *tr->current_trace;
d7350c3f 2475 mutex_unlock(&trace_types_lock);
bc0c38d1 2476
12883efb 2477#ifdef CONFIG_TRACER_MAX_TRACE
debdd57f
HT
2478 if (iter->snapshot && iter->trace->use_max_tr)
2479 return ERR_PTR(-EBUSY);
12883efb 2480#endif
debdd57f
HT
2481
2482 if (!iter->snapshot)
2483 atomic_inc(&trace_record_cmdline_disabled);
bc0c38d1 2484
bc0c38d1
SR
2485 if (*pos != iter->pos) {
2486 iter->ent = NULL;
2487 iter->cpu = 0;
2488 iter->idx = -1;
2489
ae3b5093 2490 if (cpu_file == RING_BUFFER_ALL_CPUS) {
b04cc6b1 2491 for_each_tracing_cpu(cpu)
2f26ebd5 2492 tracing_iter_reset(iter, cpu);
b04cc6b1 2493 } else
2f26ebd5 2494 tracing_iter_reset(iter, cpu_file);
bc0c38d1 2495
ac91d854 2496 iter->leftover = 0;
bc0c38d1
SR
2497 for (p = iter; p && l < *pos; p = s_next(m, p, &l))
2498 ;
2499
2500 } else {
a63ce5b3
SR
2501 /*
2502 * If we overflowed the seq_file before, then we want
2503 * to just reuse the trace_seq buffer again.
2504 */
2505 if (iter->leftover)
2506 p = iter;
2507 else {
2508 l = *pos - 1;
2509 p = s_next(m, p, &l);
2510 }
bc0c38d1
SR
2511 }
2512
4f535968 2513 trace_event_read_lock();
7e53bd42 2514 trace_access_lock(cpu_file);
bc0c38d1
SR
2515 return p;
2516}
2517
2518static void s_stop(struct seq_file *m, void *p)
2519{
7e53bd42
LJ
2520 struct trace_iterator *iter = m->private;
2521
12883efb 2522#ifdef CONFIG_TRACER_MAX_TRACE
debdd57f
HT
2523 if (iter->snapshot && iter->trace->use_max_tr)
2524 return;
12883efb 2525#endif
debdd57f
HT
2526
2527 if (!iter->snapshot)
2528 atomic_dec(&trace_record_cmdline_disabled);
12883efb 2529
7e53bd42 2530 trace_access_unlock(iter->cpu_file);
4f535968 2531 trace_event_read_unlock();
bc0c38d1
SR
2532}
2533
39eaf7ef 2534static void
12883efb
SRRH
2535get_total_entries(struct trace_buffer *buf,
2536 unsigned long *total, unsigned long *entries)
39eaf7ef
SR
2537{
2538 unsigned long count;
2539 int cpu;
2540
2541 *total = 0;
2542 *entries = 0;
2543
2544 for_each_tracing_cpu(cpu) {
12883efb 2545 count = ring_buffer_entries_cpu(buf->buffer, cpu);
39eaf7ef
SR
2546 /*
2547 * If this buffer has skipped entries, then we hold all
2548 * entries for the trace and we need to ignore the
2549 * ones before the time stamp.
2550 */
12883efb
SRRH
2551 if (per_cpu_ptr(buf->data, cpu)->skipped_entries) {
2552 count -= per_cpu_ptr(buf->data, cpu)->skipped_entries;
39eaf7ef
SR
2553 /* total is the same as the entries */
2554 *total += count;
2555 } else
2556 *total += count +
12883efb 2557 ring_buffer_overrun_cpu(buf->buffer, cpu);
39eaf7ef
SR
2558 *entries += count;
2559 }
2560}
2561
/* Print the column legend used by the latency trace format. */
static void print_lat_help_header(struct seq_file *m)
{
	static const char legend[] =
		"# _------=> CPU# \n"
		"# / _-----=> irqs-off \n"
		"# | / _----=> need-resched \n"
		"# || / _---=> hardirq/softirq \n"
		"# ||| / _--=> preempt-depth \n"
		"# |||| / delay \n"
		"# cmd pid ||||| time | caller \n"
		"# \\ / ||||| \\ | / \n";

	seq_puts(m, legend);
}
2573
/*
 * Print the "entries-in-buffer/entries-written" summary line for @buf,
 * together with the number of online cpus.
 */
static void print_event_info(struct trace_buffer *buf, struct seq_file *m)
{
	unsigned long written;
	unsigned long in_buffer;

	get_total_entries(buf, &written, &in_buffer);

	seq_printf(m, "# entries-in-buffer/entries-written: %lu/%lu #P:%d\n",
		   in_buffer, written, num_online_cpus());
	seq_puts(m, "#\n");
}
2584
/* Print the event summary followed by the default column header. */
static void print_func_help_header(struct trace_buffer *buf, struct seq_file *m)
{
	static const char columns[] =
		"# TASK-PID CPU# TIMESTAMP FUNCTION\n"
		"# | | | | |\n";

	print_event_info(buf, m);
	seq_puts(m, columns);
}
2591
/*
 * Print the event summary followed by the column header that includes
 * the irq-info legend.
 */
static void print_func_help_header_irq(struct trace_buffer *buf, struct seq_file *m)
{
	static const char columns[] =
		"# _-----=> irqs-off\n"
		"# / _----=> need-resched\n"
		"# | / _---=> hardirq/softirq\n"
		"# || / _--=> preempt-depth\n"
		"# ||| / delay\n"
		"# TASK-PID CPU# |||| TIMESTAMP FUNCTION\n"
		"# | | | |||| | |\n";

	print_event_info(buf, m);
	seq_puts(m, columns);
}
bc0c38d1 2603
62b915f1 2604void
bc0c38d1
SR
2605print_trace_header(struct seq_file *m, struct trace_iterator *iter)
2606{
983f938a 2607 unsigned long sym_flags = (global_trace.trace_flags & TRACE_ITER_SYM_MASK);
12883efb
SRRH
2608 struct trace_buffer *buf = iter->trace_buffer;
2609 struct trace_array_cpu *data = per_cpu_ptr(buf->data, buf->cpu);
2b6080f2 2610 struct tracer *type = iter->trace;
39eaf7ef
SR
2611 unsigned long entries;
2612 unsigned long total;
bc0c38d1
SR
2613 const char *name = "preemption";
2614
d840f718 2615 name = type->name;
bc0c38d1 2616
12883efb 2617 get_total_entries(buf, &total, &entries);
bc0c38d1 2618
888b55dc 2619 seq_printf(m, "# %s latency trace v1.1.5 on %s\n",
bc0c38d1 2620 name, UTS_RELEASE);
888b55dc 2621 seq_puts(m, "# -----------------------------------"
bc0c38d1 2622 "---------------------------------\n");
888b55dc 2623 seq_printf(m, "# latency: %lu us, #%lu/%lu, CPU#%d |"
bc0c38d1 2624 " (M:%s VP:%d, KP:%d, SP:%d HP:%d",
57f50be1 2625 nsecs_to_usecs(data->saved_latency),
bc0c38d1 2626 entries,
4c11d7ae 2627 total,
12883efb 2628 buf->cpu,
bc0c38d1
SR
2629#if defined(CONFIG_PREEMPT_NONE)
2630 "server",
2631#elif defined(CONFIG_PREEMPT_VOLUNTARY)
2632 "desktop",
b5c21b45 2633#elif defined(CONFIG_PREEMPT)
bc0c38d1
SR
2634 "preempt",
2635#else
2636 "unknown",
2637#endif
2638 /* These are reserved for later use */
2639 0, 0, 0, 0);
2640#ifdef CONFIG_SMP
2641 seq_printf(m, " #P:%d)\n", num_online_cpus());
2642#else
2643 seq_puts(m, ")\n");
2644#endif
888b55dc
KM
2645 seq_puts(m, "# -----------------\n");
2646 seq_printf(m, "# | task: %.16s-%d "
bc0c38d1 2647 "(uid:%d nice:%ld policy:%ld rt_prio:%ld)\n",
d20b92ab
EB
2648 data->comm, data->pid,
2649 from_kuid_munged(seq_user_ns(m), data->uid), data->nice,
bc0c38d1 2650 data->policy, data->rt_priority);
888b55dc 2651 seq_puts(m, "# -----------------\n");
bc0c38d1
SR
2652
2653 if (data->critical_start) {
888b55dc 2654 seq_puts(m, "# => started at: ");
214023c3
SR
2655 seq_print_ip_sym(&iter->seq, data->critical_start, sym_flags);
2656 trace_print_seq(m, &iter->seq);
888b55dc 2657 seq_puts(m, "\n# => ended at: ");
214023c3
SR
2658 seq_print_ip_sym(&iter->seq, data->critical_end, sym_flags);
2659 trace_print_seq(m, &iter->seq);
8248ac05 2660 seq_puts(m, "\n#\n");
bc0c38d1
SR
2661 }
2662
888b55dc 2663 seq_puts(m, "#\n");
bc0c38d1
SR
2664}
2665
a309720c
SR
2666static void test_cpu_buff_start(struct trace_iterator *iter)
2667{
2668 struct trace_seq *s = &iter->seq;
983f938a 2669 struct trace_array *tr = iter->tr;
a309720c 2670
983f938a 2671 if (!(tr->trace_flags & TRACE_ITER_ANNOTATE))
12ef7d44
SR
2672 return;
2673
2674 if (!(iter->iter_flags & TRACE_FILE_ANNOTATE))
2675 return;
2676
919cd979 2677 if (iter->started && cpumask_test_cpu(iter->cpu, iter->started))
a309720c
SR
2678 return;
2679
12883efb 2680 if (per_cpu_ptr(iter->trace_buffer->data, iter->cpu)->skipped_entries)
2f26ebd5
SR
2681 return;
2682
919cd979
SL
2683 if (iter->started)
2684 cpumask_set_cpu(iter->cpu, iter->started);
b0dfa978
FW
2685
2686 /* Don't print started cpu buffer for the first entry of the trace */
2687 if (iter->idx > 1)
2688 trace_seq_printf(s, "##### CPU %u buffer started ####\n",
2689 iter->cpu);
a309720c
SR
2690}
2691
2c4f035f 2692static enum print_line_t print_trace_fmt(struct trace_iterator *iter)
bc0c38d1 2693{
983f938a 2694 struct trace_array *tr = iter->tr;
214023c3 2695 struct trace_seq *s = &iter->seq;
983f938a 2696 unsigned long sym_flags = (tr->trace_flags & TRACE_ITER_SYM_MASK);
4e3c3333 2697 struct trace_entry *entry;
f633cef0 2698 struct trace_event *event;
bc0c38d1 2699
4e3c3333 2700 entry = iter->ent;
dd0e545f 2701
a309720c
SR
2702 test_cpu_buff_start(iter);
2703
c4a8e8be 2704 event = ftrace_find_event(entry->type);
bc0c38d1 2705
983f938a 2706 if (tr->trace_flags & TRACE_ITER_CONTEXT_INFO) {
19a7fe20
SRRH
2707 if (iter->iter_flags & TRACE_FILE_LAT_FMT)
2708 trace_print_lat_context(iter);
2709 else
2710 trace_print_context(iter);
c4a8e8be 2711 }
bc0c38d1 2712
19a7fe20
SRRH
2713 if (trace_seq_has_overflowed(s))
2714 return TRACE_TYPE_PARTIAL_LINE;
2715
268ccda0 2716 if (event)
a9a57763 2717 return event->funcs->trace(iter, sym_flags, event);
d9793bd8 2718
19a7fe20 2719 trace_seq_printf(s, "Unknown type %d\n", entry->type);
02b67518 2720
19a7fe20 2721 return trace_handle_return(s);
bc0c38d1
SR
2722}
2723
2c4f035f 2724static enum print_line_t print_raw_fmt(struct trace_iterator *iter)
f9896bf3 2725{
983f938a 2726 struct trace_array *tr = iter->tr;
f9896bf3
IM
2727 struct trace_seq *s = &iter->seq;
2728 struct trace_entry *entry;
f633cef0 2729 struct trace_event *event;
f9896bf3
IM
2730
2731 entry = iter->ent;
dd0e545f 2732
983f938a 2733 if (tr->trace_flags & TRACE_ITER_CONTEXT_INFO)
19a7fe20
SRRH
2734 trace_seq_printf(s, "%d %d %llu ",
2735 entry->pid, iter->cpu, iter->ts);
2736
2737 if (trace_seq_has_overflowed(s))
2738 return TRACE_TYPE_PARTIAL_LINE;
f9896bf3 2739
f633cef0 2740 event = ftrace_find_event(entry->type);
268ccda0 2741 if (event)
a9a57763 2742 return event->funcs->raw(iter, 0, event);
d9793bd8 2743
19a7fe20 2744 trace_seq_printf(s, "%d ?\n", entry->type);
777e208d 2745
19a7fe20 2746 return trace_handle_return(s);
f9896bf3
IM
2747}
2748
2c4f035f 2749static enum print_line_t print_hex_fmt(struct trace_iterator *iter)
5e3ca0ec 2750{
983f938a 2751 struct trace_array *tr = iter->tr;
5e3ca0ec
IM
2752 struct trace_seq *s = &iter->seq;
2753 unsigned char newline = '\n';
2754 struct trace_entry *entry;
f633cef0 2755 struct trace_event *event;
5e3ca0ec
IM
2756
2757 entry = iter->ent;
dd0e545f 2758
983f938a 2759 if (tr->trace_flags & TRACE_ITER_CONTEXT_INFO) {
19a7fe20
SRRH
2760 SEQ_PUT_HEX_FIELD(s, entry->pid);
2761 SEQ_PUT_HEX_FIELD(s, iter->cpu);
2762 SEQ_PUT_HEX_FIELD(s, iter->ts);
2763 if (trace_seq_has_overflowed(s))
2764 return TRACE_TYPE_PARTIAL_LINE;
c4a8e8be 2765 }
5e3ca0ec 2766
f633cef0 2767 event = ftrace_find_event(entry->type);
268ccda0 2768 if (event) {
a9a57763 2769 enum print_line_t ret = event->funcs->hex(iter, 0, event);
d9793bd8
ACM
2770 if (ret != TRACE_TYPE_HANDLED)
2771 return ret;
2772 }
7104f300 2773
19a7fe20 2774 SEQ_PUT_FIELD(s, newline);
5e3ca0ec 2775
19a7fe20 2776 return trace_handle_return(s);
5e3ca0ec
IM
2777}
2778
2c4f035f 2779static enum print_line_t print_bin_fmt(struct trace_iterator *iter)
cb0f12aa 2780{
983f938a 2781 struct trace_array *tr = iter->tr;
cb0f12aa
IM
2782 struct trace_seq *s = &iter->seq;
2783 struct trace_entry *entry;
f633cef0 2784 struct trace_event *event;
cb0f12aa
IM
2785
2786 entry = iter->ent;
dd0e545f 2787
983f938a 2788 if (tr->trace_flags & TRACE_ITER_CONTEXT_INFO) {
19a7fe20
SRRH
2789 SEQ_PUT_FIELD(s, entry->pid);
2790 SEQ_PUT_FIELD(s, iter->cpu);
2791 SEQ_PUT_FIELD(s, iter->ts);
2792 if (trace_seq_has_overflowed(s))
2793 return TRACE_TYPE_PARTIAL_LINE;
c4a8e8be 2794 }
cb0f12aa 2795
f633cef0 2796 event = ftrace_find_event(entry->type);
a9a57763
SR
2797 return event ? event->funcs->binary(iter, 0, event) :
2798 TRACE_TYPE_HANDLED;
cb0f12aa
IM
2799}
2800
62b915f1 2801int trace_empty(struct trace_iterator *iter)
bc0c38d1 2802{
6d158a81 2803 struct ring_buffer_iter *buf_iter;
bc0c38d1
SR
2804 int cpu;
2805
9aba60fe 2806 /* If we are looking at one CPU buffer, only check that one */
ae3b5093 2807 if (iter->cpu_file != RING_BUFFER_ALL_CPUS) {
9aba60fe 2808 cpu = iter->cpu_file;
6d158a81
SR
2809 buf_iter = trace_buffer_iter(iter, cpu);
2810 if (buf_iter) {
2811 if (!ring_buffer_iter_empty(buf_iter))
9aba60fe
SR
2812 return 0;
2813 } else {
12883efb 2814 if (!ring_buffer_empty_cpu(iter->trace_buffer->buffer, cpu))
9aba60fe
SR
2815 return 0;
2816 }
2817 return 1;
2818 }
2819
ab46428c 2820 for_each_tracing_cpu(cpu) {
6d158a81
SR
2821 buf_iter = trace_buffer_iter(iter, cpu);
2822 if (buf_iter) {
2823 if (!ring_buffer_iter_empty(buf_iter))
d769041f
SR
2824 return 0;
2825 } else {
12883efb 2826 if (!ring_buffer_empty_cpu(iter->trace_buffer->buffer, cpu))
d769041f
SR
2827 return 0;
2828 }
bc0c38d1 2829 }
d769041f 2830
797d3712 2831 return 1;
bc0c38d1
SR
2832}
2833
4f535968 2834/* Called with trace_event_read_lock() held. */
955b61e5 2835enum print_line_t print_trace_line(struct trace_iterator *iter)
f9896bf3 2836{
983f938a
SRRH
2837 struct trace_array *tr = iter->tr;
2838 unsigned long trace_flags = tr->trace_flags;
2c4f035f
FW
2839 enum print_line_t ret;
2840
19a7fe20
SRRH
2841 if (iter->lost_events) {
2842 trace_seq_printf(&iter->seq, "CPU:%d [LOST %lu EVENTS]\n",
2843 iter->cpu, iter->lost_events);
2844 if (trace_seq_has_overflowed(&iter->seq))
2845 return TRACE_TYPE_PARTIAL_LINE;
2846 }
bc21b478 2847
2c4f035f
FW
2848 if (iter->trace && iter->trace->print_line) {
2849 ret = iter->trace->print_line(iter);
2850 if (ret != TRACE_TYPE_UNHANDLED)
2851 return ret;
2852 }
72829bc3 2853
09ae7234
SRRH
2854 if (iter->ent->type == TRACE_BPUTS &&
2855 trace_flags & TRACE_ITER_PRINTK &&
2856 trace_flags & TRACE_ITER_PRINTK_MSGONLY)
2857 return trace_print_bputs_msg_only(iter);
2858
48ead020
FW
2859 if (iter->ent->type == TRACE_BPRINT &&
2860 trace_flags & TRACE_ITER_PRINTK &&
2861 trace_flags & TRACE_ITER_PRINTK_MSGONLY)
5ef841f6 2862 return trace_print_bprintk_msg_only(iter);
48ead020 2863
66896a85
FW
2864 if (iter->ent->type == TRACE_PRINT &&
2865 trace_flags & TRACE_ITER_PRINTK &&
2866 trace_flags & TRACE_ITER_PRINTK_MSGONLY)
5ef841f6 2867 return trace_print_printk_msg_only(iter);
66896a85 2868
cb0f12aa
IM
2869 if (trace_flags & TRACE_ITER_BIN)
2870 return print_bin_fmt(iter);
2871
5e3ca0ec
IM
2872 if (trace_flags & TRACE_ITER_HEX)
2873 return print_hex_fmt(iter);
2874
f9896bf3
IM
2875 if (trace_flags & TRACE_ITER_RAW)
2876 return print_raw_fmt(iter);
2877
f9896bf3
IM
2878 return print_trace_fmt(iter);
2879}
2880
7e9a49ef
JO
2881void trace_latency_header(struct seq_file *m)
2882{
2883 struct trace_iterator *iter = m->private;
983f938a 2884 struct trace_array *tr = iter->tr;
7e9a49ef
JO
2885
2886 /* print nothing if the buffers are empty */
2887 if (trace_empty(iter))
2888 return;
2889
2890 if (iter->iter_flags & TRACE_FILE_LAT_FMT)
2891 print_trace_header(m, iter);
2892
983f938a 2893 if (!(tr->trace_flags & TRACE_ITER_VERBOSE))
7e9a49ef
JO
2894 print_lat_help_header(m);
2895}
2896
62b915f1
JO
2897void trace_default_header(struct seq_file *m)
2898{
2899 struct trace_iterator *iter = m->private;
983f938a
SRRH
2900 struct trace_array *tr = iter->tr;
2901 unsigned long trace_flags = tr->trace_flags;
62b915f1 2902
f56e7f8e
JO
2903 if (!(trace_flags & TRACE_ITER_CONTEXT_INFO))
2904 return;
2905
62b915f1
JO
2906 if (iter->iter_flags & TRACE_FILE_LAT_FMT) {
2907 /* print nothing if the buffers are empty */
2908 if (trace_empty(iter))
2909 return;
2910 print_trace_header(m, iter);
2911 if (!(trace_flags & TRACE_ITER_VERBOSE))
2912 print_lat_help_header(m);
2913 } else {
77271ce4
SR
2914 if (!(trace_flags & TRACE_ITER_VERBOSE)) {
2915 if (trace_flags & TRACE_ITER_IRQ_INFO)
12883efb 2916 print_func_help_header_irq(iter->trace_buffer, m);
77271ce4 2917 else
12883efb 2918 print_func_help_header(iter->trace_buffer, m);
77271ce4 2919 }
62b915f1
JO
2920 }
2921}
2922
e0a413f6
SR
/* Warn in the trace output when ftrace_is_dead() reports true. */
static void test_ftrace_alive(struct seq_file *m)
{
	static const char warning[] =
		"# WARNING: FUNCTION TRACING IS CORRUPTED\n"
		"# MAY BE MISSING FUNCTION EVENTS\n";

	if (ftrace_is_dead())
		seq_puts(m, warning);
}
2930
d8741e2e 2931#ifdef CONFIG_TRACER_MAX_TRACE
/* Print the usage text of the main (all cpus) snapshot file. */
static void show_snapshot_main_help(struct seq_file *m)
{
	static const char usage[] =
		"# echo 0 > snapshot : Clears and frees snapshot buffer\n"
		"# echo 1 > snapshot : Allocates snapshot buffer, if not already allocated.\n"
		"# Takes a snapshot of the main buffer.\n"
		"# echo 2 > snapshot : Clears snapshot buffer (but does not allocate or free)\n"
		"# (Doesn't have to be '2' works with any number that\n"
		"# is not a '0' or '1')\n";

	seq_puts(m, usage);
}
f1affcaa
SRRH
2941
/*
 * Print the usage text of a per_cpu snapshot file. The "echo 1" text
 * depends on whether CONFIG_RING_BUFFER_ALLOW_SWAP is enabled.
 */
static void show_snapshot_percpu_help(struct seq_file *m)
{
#ifdef CONFIG_RING_BUFFER_ALLOW_SWAP
	static const char take_snapshot[] =
		"# echo 1 > snapshot : Allocates snapshot buffer, if not already allocated.\n"
		"# Takes a snapshot of the main buffer for this cpu.\n";
#else
	static const char take_snapshot[] =
		"# echo 1 > snapshot : Not supported with this kernel.\n"
		"# Must use main snapshot file to allocate.\n";
#endif
	static const char clear_snapshot[] =
		"# echo 2 > snapshot : Clears this cpu's snapshot buffer (but does not allocate)\n"
		"# (Doesn't have to be '2' works with any number that\n"
		"# is not a '0' or '1')\n";

	seq_puts(m, "# echo 0 > snapshot : Invalid for per_cpu snapshot file.\n");
	seq_puts(m, take_snapshot);
	seq_puts(m, clear_snapshot);
}
2956
d8741e2e
SRRH
2957static void print_snapshot_help(struct seq_file *m, struct trace_iterator *iter)
2958{
45ad21ca 2959 if (iter->tr->allocated_snapshot)
fa6f0cc7 2960 seq_puts(m, "#\n# * Snapshot is allocated *\n#\n");
d8741e2e 2961 else
fa6f0cc7 2962 seq_puts(m, "#\n# * Snapshot is freed *\n#\n");
d8741e2e 2963
fa6f0cc7 2964 seq_puts(m, "# Snapshot commands:\n");
f1affcaa
SRRH
2965 if (iter->cpu_file == RING_BUFFER_ALL_CPUS)
2966 show_snapshot_main_help(m);
2967 else
2968 show_snapshot_percpu_help(m);
d8741e2e
SRRH
2969}
2970#else
/*
 * Empty stand-in used when CONFIG_TRACER_MAX_TRACE is not set.
 * Should never be called.
 */
static inline void
print_snapshot_help(struct seq_file *m, struct trace_iterator *iter)
{
}
2973#endif
2974
bc0c38d1
SR
2975static int s_show(struct seq_file *m, void *v)
2976{
2977 struct trace_iterator *iter = v;
a63ce5b3 2978 int ret;
bc0c38d1
SR
2979
2980 if (iter->ent == NULL) {
2981 if (iter->tr) {
2982 seq_printf(m, "# tracer: %s\n", iter->trace->name);
2983 seq_puts(m, "#\n");
e0a413f6 2984 test_ftrace_alive(m);
bc0c38d1 2985 }
d8741e2e
SRRH
2986 if (iter->snapshot && trace_empty(iter))
2987 print_snapshot_help(m, iter);
2988 else if (iter->trace && iter->trace->print_header)
8bba1bf5 2989 iter->trace->print_header(m);
62b915f1
JO
2990 else
2991 trace_default_header(m);
2992
a63ce5b3
SR
2993 } else if (iter->leftover) {
2994 /*
2995 * If we filled the seq_file buffer earlier, we
2996 * want to just show it now.
2997 */
2998 ret = trace_print_seq(m, &iter->seq);
2999
3000 /* ret should this time be zero, but you never know */
3001 iter->leftover = ret;
3002
bc0c38d1 3003 } else {
f9896bf3 3004 print_trace_line(iter);
a63ce5b3
SR
3005 ret = trace_print_seq(m, &iter->seq);
3006 /*
3007 * If we overflow the seq_file buffer, then it will
3008 * ask us for this data again at start up.
3009 * Use that instead.
3010 * ret is 0 if seq_file write succeeded.
3011 * -1 otherwise.
3012 */
3013 iter->leftover = ret;
bc0c38d1
SR
3014 }
3015
3016 return 0;
3017}
3018
649e9c70
ON
3019/*
3020 * Should be used after trace_array_get(), trace_types_lock
3021 * ensures that i_cdev was already initialized.
3022 */
3023static inline int tracing_get_cpu(struct inode *inode)
3024{
3025 if (inode->i_cdev) /* See trace_create_cpu_file() */
3026 return (long)inode->i_cdev - 1;
3027 return RING_BUFFER_ALL_CPUS;
3028}
3029
88e9d34c 3030static const struct seq_operations tracer_seq_ops = {
4bf39a94
IM
3031 .start = s_start,
3032 .next = s_next,
3033 .stop = s_stop,
3034 .show = s_show,
bc0c38d1
SR
3035};
3036
e309b41d 3037static struct trace_iterator *
6484c71c 3038__tracing_open(struct inode *inode, struct file *file, bool snapshot)
bc0c38d1 3039{
6484c71c 3040 struct trace_array *tr = inode->i_private;
bc0c38d1 3041 struct trace_iterator *iter;
50e18b94 3042 int cpu;
bc0c38d1 3043
85a2f9b4
SR
3044 if (tracing_disabled)
3045 return ERR_PTR(-ENODEV);
60a11774 3046
50e18b94 3047 iter = __seq_open_private(file, &tracer_seq_ops, sizeof(*iter));
85a2f9b4
SR
3048 if (!iter)
3049 return ERR_PTR(-ENOMEM);
bc0c38d1 3050
72917235 3051 iter->buffer_iter = kcalloc(nr_cpu_ids, sizeof(*iter->buffer_iter),
6d158a81 3052 GFP_KERNEL);
93574fcc
DC
3053 if (!iter->buffer_iter)
3054 goto release;
3055
d7350c3f
FW
3056 /*
3057 * We make a copy of the current tracer to avoid concurrent
3058 * changes on it while we are reading.
3059 */
bc0c38d1 3060 mutex_lock(&trace_types_lock);
d7350c3f 3061 iter->trace = kzalloc(sizeof(*iter->trace), GFP_KERNEL);
85a2f9b4 3062 if (!iter->trace)
d7350c3f 3063 goto fail;
85a2f9b4 3064
2b6080f2 3065 *iter->trace = *tr->current_trace;
d7350c3f 3066
79f55997 3067 if (!zalloc_cpumask_var(&iter->started, GFP_KERNEL))
b0dfa978
FW
3068 goto fail;
3069
12883efb
SRRH
3070 iter->tr = tr;
3071
3072#ifdef CONFIG_TRACER_MAX_TRACE
2b6080f2
SR
3073 /* Currently only the top directory has a snapshot */
3074 if (tr->current_trace->print_max || snapshot)
12883efb 3075 iter->trace_buffer = &tr->max_buffer;
bc0c38d1 3076 else
12883efb
SRRH
3077#endif
3078 iter->trace_buffer = &tr->trace_buffer;
debdd57f 3079 iter->snapshot = snapshot;
bc0c38d1 3080 iter->pos = -1;
6484c71c 3081 iter->cpu_file = tracing_get_cpu(inode);
d7350c3f 3082 mutex_init(&iter->mutex);
bc0c38d1 3083
8bba1bf5
MM
3084 /* Notify the tracer early; before we stop tracing. */
3085 if (iter->trace && iter->trace->open)
a93751ca 3086 iter->trace->open(iter);
8bba1bf5 3087
12ef7d44 3088 /* Annotate start of buffers if we had overruns */
12883efb 3089 if (ring_buffer_overruns(iter->trace_buffer->buffer))
12ef7d44
SR
3090 iter->iter_flags |= TRACE_FILE_ANNOTATE;
3091
8be0709f 3092 /* Output in nanoseconds only if we are using a clock in nanoseconds. */
58e8eedf 3093 if (trace_clocks[tr->clock_id].in_ns)
8be0709f
DS
3094 iter->iter_flags |= TRACE_FILE_TIME_IN_NS;
3095
debdd57f
HT
3096 /* stop the trace while dumping if we are not opening "snapshot" */
3097 if (!iter->snapshot)
2b6080f2 3098 tracing_stop_tr(tr);
2f26ebd5 3099
ae3b5093 3100 if (iter->cpu_file == RING_BUFFER_ALL_CPUS) {
b04cc6b1 3101 for_each_tracing_cpu(cpu) {
b04cc6b1 3102 iter->buffer_iter[cpu] =
12883efb 3103 ring_buffer_read_prepare(iter->trace_buffer->buffer, cpu);
72c9ddfd
DM
3104 }
3105 ring_buffer_read_prepare_sync();
3106 for_each_tracing_cpu(cpu) {
3107 ring_buffer_read_start(iter->buffer_iter[cpu]);
2f26ebd5 3108 tracing_iter_reset(iter, cpu);
b04cc6b1
FW
3109 }
3110 } else {
3111 cpu = iter->cpu_file;
3928a8a2 3112 iter->buffer_iter[cpu] =
12883efb 3113 ring_buffer_read_prepare(iter->trace_buffer->buffer, cpu);
72c9ddfd
DM
3114 ring_buffer_read_prepare_sync();
3115 ring_buffer_read_start(iter->buffer_iter[cpu]);
2f26ebd5 3116 tracing_iter_reset(iter, cpu);
3928a8a2
SR
3117 }
3118
bc0c38d1
SR
3119 mutex_unlock(&trace_types_lock);
3120
bc0c38d1 3121 return iter;
3928a8a2 3122
d7350c3f 3123 fail:
3928a8a2 3124 mutex_unlock(&trace_types_lock);
d7350c3f 3125 kfree(iter->trace);
6d158a81 3126 kfree(iter->buffer_iter);
93574fcc 3127release:
50e18b94
JO
3128 seq_release_private(inode, file);
3129 return ERR_PTR(-ENOMEM);
bc0c38d1
SR
3130}
3131
3132int tracing_open_generic(struct inode *inode, struct file *filp)
3133{
60a11774
SR
3134 if (tracing_disabled)
3135 return -ENODEV;
3136
bc0c38d1
SR
3137 filp->private_data = inode->i_private;
3138 return 0;
3139}
3140
2e86421d
GB
3141bool tracing_is_disabled(void)
3142{
3143 return (tracing_disabled) ? true: false;
3144}
3145
7b85af63
SRRH
3146/*
3147 * Open and update trace_array ref count.
3148 * Must have the current trace_array passed to it.
3149 */
dcc30223 3150static int tracing_open_generic_tr(struct inode *inode, struct file *filp)
7b85af63
SRRH
3151{
3152 struct trace_array *tr = inode->i_private;
3153
3154 if (tracing_disabled)
3155 return -ENODEV;
3156
3157 if (trace_array_get(tr) < 0)
3158 return -ENODEV;
3159
3160 filp->private_data = inode->i_private;
3161
3162 return 0;
7b85af63
SRRH
3163}
3164
4fd27358 3165static int tracing_release(struct inode *inode, struct file *file)
bc0c38d1 3166{
6484c71c 3167 struct trace_array *tr = inode->i_private;
907f2784 3168 struct seq_file *m = file->private_data;
4acd4d00 3169 struct trace_iterator *iter;
3928a8a2 3170 int cpu;
bc0c38d1 3171
ff451961 3172 if (!(file->f_mode & FMODE_READ)) {
6484c71c 3173 trace_array_put(tr);
4acd4d00 3174 return 0;
ff451961 3175 }
4acd4d00 3176
6484c71c 3177 /* Writes do not use seq_file */
4acd4d00 3178 iter = m->private;
bc0c38d1 3179 mutex_lock(&trace_types_lock);
a695cb58 3180
3928a8a2
SR
3181 for_each_tracing_cpu(cpu) {
3182 if (iter->buffer_iter[cpu])
3183 ring_buffer_read_finish(iter->buffer_iter[cpu]);
3184 }
3185
bc0c38d1
SR
3186 if (iter->trace && iter->trace->close)
3187 iter->trace->close(iter);
3188
debdd57f
HT
3189 if (!iter->snapshot)
3190 /* reenable tracing if it was previously enabled */
2b6080f2 3191 tracing_start_tr(tr);
f77d09a3
AL
3192
3193 __trace_array_put(tr);
3194
bc0c38d1
SR
3195 mutex_unlock(&trace_types_lock);
3196
d7350c3f 3197 mutex_destroy(&iter->mutex);
b0dfa978 3198 free_cpumask_var(iter->started);
d7350c3f 3199 kfree(iter->trace);
6d158a81 3200 kfree(iter->buffer_iter);
50e18b94 3201 seq_release_private(inode, file);
ff451961 3202
bc0c38d1
SR
3203 return 0;
3204}
3205
7b85af63
SRRH
3206static int tracing_release_generic_tr(struct inode *inode, struct file *file)
3207{
3208 struct trace_array *tr = inode->i_private;
3209
3210 trace_array_put(tr);
bc0c38d1
SR
3211 return 0;
3212}
3213
7b85af63
SRRH
3214static int tracing_single_release_tr(struct inode *inode, struct file *file)
3215{
3216 struct trace_array *tr = inode->i_private;
3217
3218 trace_array_put(tr);
3219
3220 return single_release(inode, file);
3221}
3222
bc0c38d1
SR
3223static int tracing_open(struct inode *inode, struct file *file)
3224{
6484c71c 3225 struct trace_array *tr = inode->i_private;
85a2f9b4
SR
3226 struct trace_iterator *iter;
3227 int ret = 0;
bc0c38d1 3228
ff451961
SRRH
3229 if (trace_array_get(tr) < 0)
3230 return -ENODEV;
3231
4acd4d00 3232 /* If this file was open for write, then erase contents */
6484c71c
ON
3233 if ((file->f_mode & FMODE_WRITE) && (file->f_flags & O_TRUNC)) {
3234 int cpu = tracing_get_cpu(inode);
3235
3236 if (cpu == RING_BUFFER_ALL_CPUS)
12883efb 3237 tracing_reset_online_cpus(&tr->trace_buffer);
4acd4d00 3238 else
6484c71c 3239 tracing_reset(&tr->trace_buffer, cpu);
4acd4d00 3240 }
bc0c38d1 3241
4acd4d00 3242 if (file->f_mode & FMODE_READ) {
6484c71c 3243 iter = __tracing_open(inode, file, false);
4acd4d00
SR
3244 if (IS_ERR(iter))
3245 ret = PTR_ERR(iter);
983f938a 3246 else if (tr->trace_flags & TRACE_ITER_LATENCY_FMT)
4acd4d00
SR
3247 iter->iter_flags |= TRACE_FILE_LAT_FMT;
3248 }
ff451961
SRRH
3249
3250 if (ret < 0)
3251 trace_array_put(tr);
3252
bc0c38d1
SR
3253 return ret;
3254}
3255
607e2ea1
SRRH
3256/*
3257 * Some tracers are not suitable for instance buffers.
3258 * A tracer is always available for the global array (toplevel)
3259 * or if it explicitly states that it is.
3260 */
3261static bool
3262trace_ok_for_array(struct tracer *t, struct trace_array *tr)
3263{
3264 return (tr->flags & TRACE_ARRAY_FL_GLOBAL) || t->allow_instances;
3265}
3266
3267/* Find the next tracer that this trace array may use */
3268static struct tracer *
3269get_tracer_for_array(struct trace_array *tr, struct tracer *t)
3270{
3271 while (t && !trace_ok_for_array(t, tr))
3272 t = t->next;
3273
3274 return t;
3275}
3276
e309b41d 3277static void *
bc0c38d1
SR
3278t_next(struct seq_file *m, void *v, loff_t *pos)
3279{
607e2ea1 3280 struct trace_array *tr = m->private;
f129e965 3281 struct tracer *t = v;
bc0c38d1
SR
3282
3283 (*pos)++;
3284
3285 if (t)
607e2ea1 3286 t = get_tracer_for_array(tr, t->next);
bc0c38d1 3287
bc0c38d1
SR
3288 return t;
3289}
3290
3291static void *t_start(struct seq_file *m, loff_t *pos)
3292{
607e2ea1 3293 struct trace_array *tr = m->private;
f129e965 3294 struct tracer *t;
bc0c38d1
SR
3295 loff_t l = 0;
3296
3297 mutex_lock(&trace_types_lock);
607e2ea1
SRRH
3298
3299 t = get_tracer_for_array(tr, trace_types);
3300 for (; t && l < *pos; t = t_next(m, t, &l))
3301 ;
bc0c38d1
SR
3302
3303 return t;
3304}
3305
3306static void t_stop(struct seq_file *m, void *p)
3307{
3308 mutex_unlock(&trace_types_lock);
3309}
3310
3311static int t_show(struct seq_file *m, void *v)
3312{
3313 struct tracer *t = v;
3314
3315 if (!t)
3316 return 0;
3317
fa6f0cc7 3318 seq_puts(m, t->name);
bc0c38d1
SR
3319 if (t->next)
3320 seq_putc(m, ' ');
3321 else
3322 seq_putc(m, '\n');
3323
3324 return 0;
3325}
3326
88e9d34c 3327static const struct seq_operations show_traces_seq_ops = {
4bf39a94
IM
3328 .start = t_start,
3329 .next = t_next,
3330 .stop = t_stop,
3331 .show = t_show,
bc0c38d1
SR
3332};
3333
3334static int show_traces_open(struct inode *inode, struct file *file)
3335{
607e2ea1
SRRH
3336 struct trace_array *tr = inode->i_private;
3337 struct seq_file *m;
3338 int ret;
3339
60a11774
SR
3340 if (tracing_disabled)
3341 return -ENODEV;
3342
607e2ea1
SRRH
3343 ret = seq_open(file, &show_traces_seq_ops);
3344 if (ret)
3345 return ret;
3346
3347 m = file->private_data;
3348 m->private = tr;
3349
3350 return 0;
bc0c38d1
SR
3351}
3352
4acd4d00
SR
3353static ssize_t
3354tracing_write_stub(struct file *filp, const char __user *ubuf,
3355 size_t count, loff_t *ppos)
3356{
3357 return count;
3358}
3359
098c879e 3360loff_t tracing_lseek(struct file *file, loff_t offset, int whence)
364829b1 3361{
098c879e
SRRH
3362 int ret;
3363
364829b1 3364 if (file->f_mode & FMODE_READ)
098c879e 3365 ret = seq_lseek(file, offset, whence);
364829b1 3366 else
098c879e
SRRH
3367 file->f_pos = ret = 0;
3368
3369 return ret;
364829b1
SP
3370}
3371
5e2336a0 3372static const struct file_operations tracing_fops = {
4bf39a94
IM
3373 .open = tracing_open,
3374 .read = seq_read,
4acd4d00 3375 .write = tracing_write_stub,
098c879e 3376 .llseek = tracing_lseek,
4bf39a94 3377 .release = tracing_release,
bc0c38d1
SR
3378};
3379
5e2336a0 3380static const struct file_operations show_traces_fops = {
c7078de1
IM
3381 .open = show_traces_open,
3382 .read = seq_read,
3383 .release = seq_release,
b444786f 3384 .llseek = seq_lseek,
c7078de1
IM
3385};
3386
36dfe925
IM
3387/*
3388 * The tracer itself will not take this lock, but still we want
3389 * to provide a consistent cpumask to user-space:
3390 */
3391static DEFINE_MUTEX(tracing_cpumask_update_lock);
3392
3393/*
3394 * Temporary storage for the character representation of the
3395 * CPU bitmask (and one more byte for the newline):
3396 */
3397static char mask_str[NR_CPUS + 1];
3398
c7078de1
IM
3399static ssize_t
3400tracing_cpumask_read(struct file *filp, char __user *ubuf,
3401 size_t count, loff_t *ppos)
3402{
ccfe9e42 3403 struct trace_array *tr = file_inode(filp)->i_private;
36dfe925 3404 int len;
c7078de1
IM
3405
3406 mutex_lock(&tracing_cpumask_update_lock);
36dfe925 3407
1a40243b
TH
3408 len = snprintf(mask_str, count, "%*pb\n",
3409 cpumask_pr_args(tr->tracing_cpumask));
3410 if (len >= count) {
36dfe925
IM
3411 count = -EINVAL;
3412 goto out_err;
3413 }
36dfe925
IM
3414 count = simple_read_from_buffer(ubuf, count, ppos, mask_str, NR_CPUS+1);
3415
3416out_err:
c7078de1
IM
3417 mutex_unlock(&tracing_cpumask_update_lock);
3418
3419 return count;
3420}
3421
3422static ssize_t
3423tracing_cpumask_write(struct file *filp, const char __user *ubuf,
3424 size_t count, loff_t *ppos)
3425{
ccfe9e42 3426 struct trace_array *tr = file_inode(filp)->i_private;
9e01c1b7 3427 cpumask_var_t tracing_cpumask_new;
2b6080f2 3428 int err, cpu;
9e01c1b7
RR
3429
3430 if (!alloc_cpumask_var(&tracing_cpumask_new, GFP_KERNEL))
3431 return -ENOMEM;
c7078de1 3432
9e01c1b7 3433 err = cpumask_parse_user(ubuf, count, tracing_cpumask_new);
c7078de1 3434 if (err)
36dfe925
IM
3435 goto err_unlock;
3436
215368e8
LZ
3437 mutex_lock(&tracing_cpumask_update_lock);
3438
a5e25883 3439 local_irq_disable();
0b9b12c1 3440 arch_spin_lock(&tr->max_lock);
ab46428c 3441 for_each_tracing_cpu(cpu) {
36dfe925
IM
3442 /*
3443 * Increase/decrease the disabled counter if we are
3444 * about to flip a bit in the cpumask:
3445 */
ccfe9e42 3446 if (cpumask_test_cpu(cpu, tr->tracing_cpumask) &&
9e01c1b7 3447 !cpumask_test_cpu(cpu, tracing_cpumask_new)) {
12883efb
SRRH
3448 atomic_inc(&per_cpu_ptr(tr->trace_buffer.data, cpu)->disabled);
3449 ring_buffer_record_disable_cpu(tr->trace_buffer.buffer, cpu);
36dfe925 3450 }
ccfe9e42 3451 if (!cpumask_test_cpu(cpu, tr->tracing_cpumask) &&
9e01c1b7 3452 cpumask_test_cpu(cpu, tracing_cpumask_new)) {
12883efb
SRRH
3453 atomic_dec(&per_cpu_ptr(tr->trace_buffer.data, cpu)->disabled);
3454 ring_buffer_record_enable_cpu(tr->trace_buffer.buffer, cpu);
36dfe925
IM
3455 }
3456 }
0b9b12c1 3457 arch_spin_unlock(&tr->max_lock);
a5e25883 3458 local_irq_enable();
36dfe925 3459
ccfe9e42 3460 cpumask_copy(tr->tracing_cpumask, tracing_cpumask_new);
36dfe925
IM
3461
3462 mutex_unlock(&tracing_cpumask_update_lock);
9e01c1b7 3463 free_cpumask_var(tracing_cpumask_new);
c7078de1
IM
3464
3465 return count;
36dfe925
IM
3466
3467err_unlock:
215368e8 3468 free_cpumask_var(tracing_cpumask_new);
36dfe925
IM
3469
3470 return err;
c7078de1
IM
3471}
3472
5e2336a0 3473static const struct file_operations tracing_cpumask_fops = {
ccfe9e42 3474 .open = tracing_open_generic_tr,
c7078de1
IM
3475 .read = tracing_cpumask_read,
3476 .write = tracing_cpumask_write,
ccfe9e42 3477 .release = tracing_release_generic_tr,
b444786f 3478 .llseek = generic_file_llseek,
bc0c38d1
SR
3479};
3480
fdb372ed 3481static int tracing_trace_options_show(struct seq_file *m, void *v)
bc0c38d1 3482{
d8e83d26 3483 struct tracer_opt *trace_opts;
2b6080f2 3484 struct trace_array *tr = m->private;
d8e83d26 3485 u32 tracer_flags;
d8e83d26 3486 int i;
adf9f195 3487
d8e83d26 3488 mutex_lock(&trace_types_lock);
2b6080f2
SR
3489 tracer_flags = tr->current_trace->flags->val;
3490 trace_opts = tr->current_trace->flags->opts;
d8e83d26 3491
bc0c38d1 3492 for (i = 0; trace_options[i]; i++) {
983f938a 3493 if (tr->trace_flags & (1 << i))
fdb372ed 3494 seq_printf(m, "%s\n", trace_options[i]);
bc0c38d1 3495 else
fdb372ed 3496 seq_printf(m, "no%s\n", trace_options[i]);
bc0c38d1
SR
3497 }
3498
adf9f195
FW
3499 for (i = 0; trace_opts[i].name; i++) {
3500 if (tracer_flags & trace_opts[i].bit)
fdb372ed 3501 seq_printf(m, "%s\n", trace_opts[i].name);
adf9f195 3502 else
fdb372ed 3503 seq_printf(m, "no%s\n", trace_opts[i].name);
adf9f195 3504 }
d8e83d26 3505 mutex_unlock(&trace_types_lock);
adf9f195 3506
fdb372ed 3507 return 0;
bc0c38d1 3508}
bc0c38d1 3509
8c1a49ae 3510static int __set_tracer_option(struct trace_array *tr,
8d18eaaf
LZ
3511 struct tracer_flags *tracer_flags,
3512 struct tracer_opt *opts, int neg)
3513{
d39cdd20 3514 struct tracer *trace = tracer_flags->trace;
8d18eaaf 3515 int ret;
bc0c38d1 3516
8c1a49ae 3517 ret = trace->set_flag(tr, tracer_flags->val, opts->bit, !neg);
8d18eaaf
LZ
3518 if (ret)
3519 return ret;
3520
3521 if (neg)
3522 tracer_flags->val &= ~opts->bit;
3523 else
3524 tracer_flags->val |= opts->bit;
3525 return 0;
bc0c38d1
SR
3526}
3527
adf9f195 3528/* Try to assign a tracer specific option */
8c1a49ae 3529static int set_tracer_option(struct trace_array *tr, char *cmp, int neg)
adf9f195 3530{
8c1a49ae 3531 struct tracer *trace = tr->current_trace;
7770841e 3532 struct tracer_flags *tracer_flags = trace->flags;
adf9f195 3533 struct tracer_opt *opts = NULL;
8d18eaaf 3534 int i;
adf9f195 3535
7770841e
Z
3536 for (i = 0; tracer_flags->opts[i].name; i++) {
3537 opts = &tracer_flags->opts[i];
adf9f195 3538
8d18eaaf 3539 if (strcmp(cmp, opts->name) == 0)
8c1a49ae 3540 return __set_tracer_option(tr, trace->flags, opts, neg);
adf9f195 3541 }
adf9f195 3542
8d18eaaf 3543 return -EINVAL;
adf9f195
FW
3544}
3545
613f04a0
SRRH
3546/* Some tracers require overwrite to stay enabled */
3547int trace_keep_overwrite(struct tracer *tracer, u32 mask, int set)
3548{
3549 if (tracer->enabled && (mask & TRACE_ITER_OVERWRITE) && !set)
3550 return -1;
3551
3552 return 0;
3553}
3554
2b6080f2 3555int set_tracer_flag(struct trace_array *tr, unsigned int mask, int enabled)
af4617bd
SR
3556{
3557 /* do nothing if flag is already set */
983f938a 3558 if (!!(tr->trace_flags & mask) == !!enabled)
613f04a0
SRRH
3559 return 0;
3560
3561 /* Give the tracer a chance to approve the change */
2b6080f2 3562 if (tr->current_trace->flag_changed)
bf6065b5 3563 if (tr->current_trace->flag_changed(tr, mask, !!enabled))
613f04a0 3564 return -EINVAL;
af4617bd
SR
3565
3566 if (enabled)
983f938a 3567 tr->trace_flags |= mask;
af4617bd 3568 else
983f938a 3569 tr->trace_flags &= ~mask;
e870e9a1
LZ
3570
3571 if (mask == TRACE_ITER_RECORD_CMD)
3572 trace_event_enable_cmd_record(enabled);
750912fa 3573
c37775d5
SR
3574 if (mask == TRACE_ITER_EVENT_FORK)
3575 trace_event_follow_fork(tr, enabled);
3576
80902822 3577 if (mask == TRACE_ITER_OVERWRITE) {
12883efb 3578 ring_buffer_change_overwrite(tr->trace_buffer.buffer, enabled);
80902822 3579#ifdef CONFIG_TRACER_MAX_TRACE
12883efb 3580 ring_buffer_change_overwrite(tr->max_buffer.buffer, enabled);
80902822
SRRH
3581#endif
3582 }
81698831 3583
b9f9108c 3584 if (mask == TRACE_ITER_PRINTK) {
81698831 3585 trace_printk_start_stop_comm(enabled);
b9f9108c
SRRH
3586 trace_printk_control(enabled);
3587 }
613f04a0
SRRH
3588
3589 return 0;
af4617bd
SR
3590}
3591
2b6080f2 3592static int trace_set_options(struct trace_array *tr, char *option)
bc0c38d1 3593{
8d18eaaf 3594 char *cmp;
bc0c38d1 3595 int neg = 0;
613f04a0 3596 int ret = -ENODEV;
bc0c38d1 3597 int i;
a4d1e688 3598 size_t orig_len = strlen(option);
bc0c38d1 3599
7bcfaf54 3600 cmp = strstrip(option);
bc0c38d1 3601
8d18eaaf 3602 if (strncmp(cmp, "no", 2) == 0) {
bc0c38d1
SR
3603 neg = 1;
3604 cmp += 2;
3605 }
3606
69d34da2
SRRH
3607 mutex_lock(&trace_types_lock);
3608
bc0c38d1 3609 for (i = 0; trace_options[i]; i++) {
8d18eaaf 3610 if (strcmp(cmp, trace_options[i]) == 0) {
2b6080f2 3611 ret = set_tracer_flag(tr, 1 << i, !neg);
bc0c38d1
SR
3612 break;
3613 }
3614 }
adf9f195
FW
3615
3616 /* If no option could be set, test the specific tracer options */
69d34da2 3617 if (!trace_options[i])
8c1a49ae 3618 ret = set_tracer_option(tr, cmp, neg);
69d34da2
SRRH
3619
3620 mutex_unlock(&trace_types_lock);
bc0c38d1 3621
a4d1e688
JW
3622 /*
3623 * If the first trailing whitespace is replaced with '\0' by strstrip,
3624 * turn it back into a space.
3625 */
3626 if (orig_len > strlen(option))
3627 option[strlen(option)] = ' ';
3628
7bcfaf54
SR
3629 return ret;
3630}
3631
a4d1e688
JW
3632static void __init apply_trace_boot_options(void)
3633{
3634 char *buf = trace_boot_options_buf;
3635 char *option;
3636
3637 while (true) {
3638 option = strsep(&buf, ",");
3639
3640 if (!option)
3641 break;
a4d1e688 3642
43ed3843
SRRH
3643 if (*option)
3644 trace_set_options(&global_trace, option);
a4d1e688
JW
3645
3646 /* Put back the comma to allow this to be called again */
3647 if (buf)
3648 *(buf - 1) = ',';
3649 }
3650}
3651
7bcfaf54
SR
3652static ssize_t
3653tracing_trace_options_write(struct file *filp, const char __user *ubuf,
3654 size_t cnt, loff_t *ppos)
3655{
2b6080f2
SR
3656 struct seq_file *m = filp->private_data;
3657 struct trace_array *tr = m->private;
7bcfaf54 3658 char buf[64];
613f04a0 3659 int ret;
7bcfaf54
SR
3660
3661 if (cnt >= sizeof(buf))
3662 return -EINVAL;
3663
3664 if (copy_from_user(&buf, ubuf, cnt))
3665 return -EFAULT;
3666
a8dd2176
SR
3667 buf[cnt] = 0;
3668
2b6080f2 3669 ret = trace_set_options(tr, buf);
613f04a0
SRRH
3670 if (ret < 0)
3671 return ret;
7bcfaf54 3672
cf8517cf 3673 *ppos += cnt;
bc0c38d1
SR
3674
3675 return cnt;
3676}
3677
fdb372ed
LZ
3678static int tracing_trace_options_open(struct inode *inode, struct file *file)
3679{
7b85af63 3680 struct trace_array *tr = inode->i_private;
f77d09a3 3681 int ret;
7b85af63 3682
fdb372ed
LZ
3683 if (tracing_disabled)
3684 return -ENODEV;
2b6080f2 3685
7b85af63
SRRH
3686 if (trace_array_get(tr) < 0)
3687 return -ENODEV;
3688
f77d09a3
AL
3689 ret = single_open(file, tracing_trace_options_show, inode->i_private);
3690 if (ret < 0)
3691 trace_array_put(tr);
3692
3693 return ret;
fdb372ed
LZ
3694}
3695
5e2336a0 3696static const struct file_operations tracing_iter_fops = {
fdb372ed
LZ
3697 .open = tracing_trace_options_open,
3698 .read = seq_read,
3699 .llseek = seq_lseek,
7b85af63 3700 .release = tracing_single_release_tr,
ee6bce52 3701 .write = tracing_trace_options_write,
bc0c38d1
SR
3702};
3703
7bd2f24c
IM
/*
 * Text returned by tracing_readme_read().  Sections are compiled in or
 * out to match the tracing features configured into the kernel.
 *
 * Text fixes relative to the previous version:
 *  - options are disabled with a 'no' prefix (trace_set_options()
 *    strips a leading "no"), not a suffix;
 *  - the "echo '!...'" removal examples close their single quote;
 *  - "do trap" is spelled as the function name do_trap.
 */
static const char readme_msg[] =
	"tracing mini-HOWTO:\n\n"
	"# echo 0 > tracing_on : quick way to disable tracing\n"
	"# echo 1 > tracing_on : quick way to re-enable tracing\n\n"
	" Important files:\n"
	" trace\t\t\t- The static contents of the buffer\n"
	"\t\t\t To clear the buffer write into this file: echo > trace\n"
	" trace_pipe\t\t- A consuming read to see the contents of the buffer\n"
	" current_tracer\t- function and latency tracers\n"
	" available_tracers\t- list of configured tracers for current_tracer\n"
	" buffer_size_kb\t- view and modify size of per cpu buffer\n"
	" buffer_total_size_kb - view total size of all cpu buffers\n\n"
	" trace_clock\t\t-change the clock used to order events\n"
	" local: Per cpu clock but may not be synced across CPUs\n"
	" global: Synced across CPUs but slows tracing down.\n"
	" counter: Not a clock, but just an increment\n"
	" uptime: Jiffy counter from time of boot\n"
	" perf: Same clock that perf events use\n"
#ifdef CONFIG_X86_64
	" x86-tsc: TSC cycle counter\n"
#endif
	"\n trace_marker\t\t- Writes into this file writes into the kernel buffer\n"
	" tracing_cpumask\t- Limit which CPUs to trace\n"
	" instances\t\t- Make sub-buffers with: mkdir instances/foo\n"
	"\t\t\t Remove sub-buffer with rmdir\n"
	" trace_options\t\t- Set format or modify how tracing happens\n"
	"\t\t\t Disable an option by adding a prefix 'no' to the\n"
	"\t\t\t option name\n"
	" saved_cmdlines_size\t- echo command number in here to store comm-pid list\n"
#ifdef CONFIG_DYNAMIC_FTRACE
	"\n available_filter_functions - list of functions that can be filtered on\n"
	" set_ftrace_filter\t- echo function name in here to only trace these\n"
	"\t\t\t functions\n"
	"\t accepts: func_full_name, *func_end, func_begin*, *func_middle*\n"
	"\t modules: Can select a group via module\n"
	"\t Format: :mod:<module-name>\n"
	"\t example: echo :mod:ext3 > set_ftrace_filter\n"
	"\t triggers: a command to perform when function is hit\n"
	"\t Format: <function>:<trigger>[:count]\n"
	"\t trigger: traceon, traceoff\n"
	"\t\t enable_event:<system>:<event>\n"
	"\t\t disable_event:<system>:<event>\n"
#ifdef CONFIG_STACKTRACE
	"\t\t stacktrace\n"
#endif
#ifdef CONFIG_TRACER_SNAPSHOT
	"\t\t snapshot\n"
#endif
	"\t\t dump\n"
	"\t\t cpudump\n"
	"\t example: echo do_fault:traceoff > set_ftrace_filter\n"
	"\t echo do_trap:traceoff:3 > set_ftrace_filter\n"
	"\t The first one will disable tracing every time do_fault is hit\n"
	"\t The second will disable tracing at most 3 times when do_trap is hit\n"
	"\t The first time do_trap is hit and it disables tracing, the\n"
	"\t counter will decrement to 2. If tracing is already disabled,\n"
	"\t the counter will not decrement. It only decrements when the\n"
	"\t trigger did work\n"
	"\t To remove trigger without count:\n"
	"\t echo '!<function>:<trigger>' > set_ftrace_filter\n"
	"\t To remove trigger with a count:\n"
	"\t echo '!<function>:<trigger>:0' > set_ftrace_filter\n"
	" set_ftrace_notrace\t- echo function name in here to never trace.\n"
	"\t accepts: func_full_name, *func_end, func_begin*, *func_middle*\n"
	"\t modules: Can select a group via module command :mod:\n"
	"\t Does not accept triggers\n"
#endif /* CONFIG_DYNAMIC_FTRACE */
#ifdef CONFIG_FUNCTION_TRACER
	" set_ftrace_pid\t- Write pid(s) to only function trace those pids\n"
	"\t\t (function)\n"
#endif
#ifdef CONFIG_FUNCTION_GRAPH_TRACER
	" set_graph_function\t- Trace the nested calls of a function (function_graph)\n"
	" set_graph_notrace\t- Do not trace the nested calls of a function (function_graph)\n"
	" max_graph_depth\t- Trace a limited depth of nested calls (0 is unlimited)\n"
#endif
#ifdef CONFIG_TRACER_SNAPSHOT
	"\n snapshot\t\t- Like 'trace' but shows the content of the static\n"
	"\t\t\t snapshot buffer. Read the contents for more\n"
	"\t\t\t information\n"
#endif
#ifdef CONFIG_STACK_TRACER
	" stack_trace\t\t- Shows the max stack trace when active\n"
	" stack_max_size\t- Shows current max stack size that was traced\n"
	"\t\t\t Write into this file to reset the max size (trigger a\n"
	"\t\t\t new trace)\n"
#ifdef CONFIG_DYNAMIC_FTRACE
	" stack_trace_filter\t- Like set_ftrace_filter but limits what stack_trace\n"
	"\t\t\t traces\n"
#endif
#endif /* CONFIG_STACK_TRACER */
	" events/\t\t- Directory containing all trace event subsystems:\n"
	" enable\t\t- Write 0/1 to enable/disable tracing of all events\n"
	" events/<system>/\t- Directory containing all trace events for <system>:\n"
	" enable\t\t- Write 0/1 to enable/disable tracing of all <system>\n"
	"\t\t\t events\n"
	" filter\t\t- If set, only events passing filter are traced\n"
	" events/<system>/<event>/\t- Directory containing control files for\n"
	"\t\t\t <event>:\n"
	" enable\t\t- Write 0/1 to enable/disable tracing of <event>\n"
	" filter\t\t- If set, only events passing filter are traced\n"
	" trigger\t\t- If set, a command to perform when event is hit\n"
	"\t Format: <trigger>[:count][if <filter>]\n"
	"\t trigger: traceon, traceoff\n"
	"\t enable_event:<system>:<event>\n"
	"\t disable_event:<system>:<event>\n"
#ifdef CONFIG_STACKTRACE
	"\t\t stacktrace\n"
#endif
#ifdef CONFIG_TRACER_SNAPSHOT
	"\t\t snapshot\n"
#endif
#ifdef CONFIG_HIST_TRIGGERS
	"\t\t hist (see below)\n"
#endif
	"\t example: echo traceoff > events/block/block_unplug/trigger\n"
	"\t echo traceoff:3 > events/block/block_unplug/trigger\n"
	"\t echo 'enable_event:kmem:kmalloc:3 if nr_rq > 1' > \\\n"
	"\t events/block/block_unplug/trigger\n"
	"\t The first disables tracing every time block_unplug is hit.\n"
	"\t The second disables tracing the first 3 times block_unplug is hit.\n"
	"\t The third enables the kmalloc event the first 3 times block_unplug\n"
	"\t is hit and has value of greater than 1 for the 'nr_rq' event field.\n"
	"\t Like function triggers, the counter is only decremented if it\n"
	"\t enabled or disabled tracing.\n"
	"\t To remove a trigger without a count:\n"
	"\t echo '!<trigger>' > <system>/<event>/trigger\n"
	"\t To remove a trigger with a count:\n"
	"\t echo '!<trigger>:0' > <system>/<event>/trigger\n"
	"\t Filters can be ignored when removing a trigger.\n"
#ifdef CONFIG_HIST_TRIGGERS
	" hist trigger\t- If set, event hits are aggregated into a hash table\n"
	"\t Format: hist:keys=<field1[,field2,...]>\n"
	"\t [:values=<field1[,field2,...]>]\n"
	"\t [:sort=<field1[,field2,...]>]\n"
	"\t [:size=#entries]\n"
	"\t [:pause][:continue][:clear]\n"
	"\t [if <filter>]\n\n"
	"\t When a matching event is hit, an entry is added to a hash\n"
	"\t table using the key(s) and value(s) named, and the value of a\n"
	"\t sum called 'hitcount' is incremented. Keys and values\n"
	"\t correspond to fields in the event's format description. Keys\n"
	"\t can be any field. Compound keys consisting of up to two\n"
	"\t fields can be specified by the 'keys' keyword. Values must\n"
	"\t correspond to numeric fields. Sort keys consisting of up to\n"
	"\t two fields can be specified using the 'sort' keyword. The\n"
	"\t sort direction can be modified by appending '.descending' or\n"
	"\t '.ascending' to a sort field. The 'size' parameter can be\n"
	"\t used to specify more or fewer than the default 2048 entries\n"
	"\t for the hashtable size.\n\n"
	"\t Reading the 'hist' file for the event will dump the hash\n"
	"\t table in its entirety to stdout. The default format used to\n"
	"\t display a given field can be modified by appending any of the\n"
	"\t following modifiers to the field name, as applicable:\n\n"
	"\t .hex display a number as a hex value\n"
	"\t .sym display an address as a symbol\n"
	"\t .sym-offset display an address as a symbol and offset\n"
	"\t .execname display a common_pid as a program name\n\n"
	"\t The 'pause' parameter can be used to pause an existing hist\n"
	"\t trigger or to start a hist trigger but not log any events\n"
	"\t until told to do so. 'continue' can be used to start or\n"
	"\t restart a paused hist trigger.\n\n"
	"\t The 'clear' parameter will clear the contents of a running\n"
	"\t hist trigger and leave its current paused/active state\n"
	"\t unchanged.\n\n"
#endif
;
3871
3872static ssize_t
3873tracing_readme_read(struct file *filp, char __user *ubuf,
3874 size_t cnt, loff_t *ppos)
3875{
3876 return simple_read_from_buffer(ubuf, cnt, ppos,
3877 readme_msg, strlen(readme_msg));
3878}
3879
5e2336a0 3880static const struct file_operations tracing_readme_fops = {
c7078de1
IM
3881 .open = tracing_open_generic,
3882 .read = tracing_readme_read,
b444786f 3883 .llseek = generic_file_llseek,
7bd2f24c
IM
3884};
3885
42584c81
YY
3886static void *saved_cmdlines_next(struct seq_file *m, void *v, loff_t *pos)
3887{
3888 unsigned int *ptr = v;
69abe6a5 3889
42584c81
YY
3890 if (*pos || m->count)
3891 ptr++;
69abe6a5 3892
42584c81 3893 (*pos)++;
69abe6a5 3894
939c7a4f
YY
3895 for (; ptr < &savedcmd->map_cmdline_to_pid[savedcmd->cmdline_num];
3896 ptr++) {
42584c81
YY
3897 if (*ptr == -1 || *ptr == NO_CMDLINE_MAP)
3898 continue;
69abe6a5 3899
42584c81
YY
3900 return ptr;
3901 }
69abe6a5 3902
42584c81
YY
3903 return NULL;
3904}
3905
3906static void *saved_cmdlines_start(struct seq_file *m, loff_t *pos)
3907{
3908 void *v;
3909 loff_t l = 0;
69abe6a5 3910
4c27e756
SRRH
3911 preempt_disable();
3912 arch_spin_lock(&trace_cmdline_lock);
3913
939c7a4f 3914 v = &savedcmd->map_cmdline_to_pid[0];
42584c81
YY
3915 while (l <= *pos) {
3916 v = saved_cmdlines_next(m, v, &l);
3917 if (!v)
3918 return NULL;
69abe6a5
AP
3919 }
3920
42584c81
YY
3921 return v;
3922}
3923
3924static void saved_cmdlines_stop(struct seq_file *m, void *v)
3925{
4c27e756
SRRH
3926 arch_spin_unlock(&trace_cmdline_lock);
3927 preempt_enable();
42584c81 3928}
69abe6a5 3929
42584c81
YY
3930static int saved_cmdlines_show(struct seq_file *m, void *v)
3931{
3932 char buf[TASK_COMM_LEN];
3933 unsigned int *pid = v;
69abe6a5 3934
4c27e756 3935 __trace_find_cmdline(*pid, buf);
42584c81
YY
3936 seq_printf(m, "%d %s\n", *pid, buf);
3937 return 0;
3938}
3939
3940static const struct seq_operations tracing_saved_cmdlines_seq_ops = {
3941 .start = saved_cmdlines_start,
3942 .next = saved_cmdlines_next,
3943 .stop = saved_cmdlines_stop,
3944 .show = saved_cmdlines_show,
3945};
3946
3947static int tracing_saved_cmdlines_open(struct inode *inode, struct file *filp)
3948{
3949 if (tracing_disabled)
3950 return -ENODEV;
3951
3952 return seq_open(filp, &tracing_saved_cmdlines_seq_ops);
69abe6a5
AP
3953}
3954
3955static const struct file_operations tracing_saved_cmdlines_fops = {
42584c81
YY
3956 .open = tracing_saved_cmdlines_open,
3957 .read = seq_read,
3958 .llseek = seq_lseek,
3959 .release = seq_release,
69abe6a5
AP
3960};
3961
939c7a4f
YY
3962static ssize_t
3963tracing_saved_cmdlines_size_read(struct file *filp, char __user *ubuf,
3964 size_t cnt, loff_t *ppos)
3965{
3966 char buf[64];
3967 int r;
3968
3969 arch_spin_lock(&trace_cmdline_lock);
a6af8fbf 3970 r = scnprintf(buf, sizeof(buf), "%u\n", savedcmd->cmdline_num);
939c7a4f
YY
3971 arch_spin_unlock(&trace_cmdline_lock);
3972
3973 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
3974}
3975
3976static void free_saved_cmdlines_buffer(struct saved_cmdlines_buffer *s)
3977{
3978 kfree(s->saved_cmdlines);
3979 kfree(s->map_cmdline_to_pid);
3980 kfree(s);
3981}
3982
3983static int tracing_resize_saved_cmdlines(unsigned int val)
3984{
3985 struct saved_cmdlines_buffer *s, *savedcmd_temp;
3986
a6af8fbf 3987 s = kmalloc(sizeof(*s), GFP_KERNEL);
939c7a4f
YY
3988 if (!s)
3989 return -ENOMEM;
3990
3991 if (allocate_cmdlines_buffer(val, s) < 0) {
3992 kfree(s);
3993 return -ENOMEM;
3994 }
3995
3996 arch_spin_lock(&trace_cmdline_lock);
3997 savedcmd_temp = savedcmd;
3998 savedcmd = s;
3999 arch_spin_unlock(&trace_cmdline_lock);
4000 free_saved_cmdlines_buffer(savedcmd_temp);
4001
4002 return 0;
4003}
4004
4005static ssize_t
4006tracing_saved_cmdlines_size_write(struct file *filp, const char __user *ubuf,
4007 size_t cnt, loff_t *ppos)
4008{
4009 unsigned long val;
4010 int ret;
4011
4012 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
4013 if (ret)
4014 return ret;
4015
4016 /* must have at least 1 entry or less than PID_MAX_DEFAULT */
4017 if (!val || val > PID_MAX_DEFAULT)
4018 return -EINVAL;
4019
4020 ret = tracing_resize_saved_cmdlines((unsigned int)val);
4021 if (ret < 0)
4022 return ret;
4023
4024 *ppos += cnt;
4025
4026 return cnt;
4027}
4028
4029static const struct file_operations tracing_saved_cmdlines_size_fops = {
4030 .open = tracing_open_generic,
4031 .read = tracing_saved_cmdlines_size_read,
4032 .write = tracing_saved_cmdlines_size_write,
4033};
4034
9828413d
SRRH
4035#ifdef CONFIG_TRACE_ENUM_MAP_FILE
4036static union trace_enum_map_item *
4037update_enum_map(union trace_enum_map_item *ptr)
4038{
4039 if (!ptr->map.enum_string) {
4040 if (ptr->tail.next) {
4041 ptr = ptr->tail.next;
4042 /* Set ptr to the next real item (skip head) */
4043 ptr++;
4044 } else
4045 return NULL;
4046 }
4047 return ptr;
4048}
4049
4050static void *enum_map_next(struct seq_file *m, void *v, loff_t *pos)
4051{
4052 union trace_enum_map_item *ptr = v;
4053
4054 /*
4055 * Paranoid! If ptr points to end, we don't want to increment past it.
4056 * This really should never happen.
4057 */
4058 ptr = update_enum_map(ptr);
4059 if (WARN_ON_ONCE(!ptr))
4060 return NULL;
4061
4062 ptr++;
4063
4064 (*pos)++;
4065
4066 ptr = update_enum_map(ptr);
4067
4068 return ptr;
4069}
4070
4071static void *enum_map_start(struct seq_file *m, loff_t *pos)
4072{
4073 union trace_enum_map_item *v;
4074 loff_t l = 0;
4075
4076 mutex_lock(&trace_enum_mutex);
4077
4078 v = trace_enum_maps;
4079 if (v)
4080 v++;
4081
4082 while (v && l < *pos) {
4083 v = enum_map_next(m, v, &l);
4084 }
4085
4086 return v;
4087}
4088
4089static void enum_map_stop(struct seq_file *m, void *v)
4090{
4091 mutex_unlock(&trace_enum_mutex);
4092}
4093
4094static int enum_map_show(struct seq_file *m, void *v)
4095{
4096 union trace_enum_map_item *ptr = v;
4097
4098 seq_printf(m, "%s %ld (%s)\n",
4099 ptr->map.enum_string, ptr->map.enum_value,
4100 ptr->map.system);
4101
4102 return 0;
4103}
4104
4105static const struct seq_operations tracing_enum_map_seq_ops = {
4106 .start = enum_map_start,
4107 .next = enum_map_next,
4108 .stop = enum_map_stop,
4109 .show = enum_map_show,
4110};
4111
4112static int tracing_enum_map_open(struct inode *inode, struct file *filp)
4113{
4114 if (tracing_disabled)
4115 return -ENODEV;
4116
4117 return seq_open(filp, &tracing_enum_map_seq_ops);
4118}
4119
4120static const struct file_operations tracing_enum_map_fops = {
4121 .open = tracing_enum_map_open,
4122 .read = seq_read,
4123 .llseek = seq_lseek,
4124 .release = seq_release,
4125};
4126
4127static inline union trace_enum_map_item *
4128trace_enum_jmp_to_tail(union trace_enum_map_item *ptr)
4129{
4130 /* Return tail of array given the head */
4131 return ptr + ptr->head.length + 1;
4132}
4133
4134static void
4135trace_insert_enum_map_file(struct module *mod, struct trace_enum_map **start,
4136 int len)
4137{
4138 struct trace_enum_map **stop;
4139 struct trace_enum_map **map;
4140 union trace_enum_map_item *map_array;
4141 union trace_enum_map_item *ptr;
4142
4143 stop = start + len;
4144
4145 /*
4146 * The trace_enum_maps contains the map plus a head and tail item,
4147 * where the head holds the module and length of array, and the
4148 * tail holds a pointer to the next list.
4149 */
4150 map_array = kmalloc(sizeof(*map_array) * (len + 2), GFP_KERNEL);
4151 if (!map_array) {
a395d6a7 4152 pr_warn("Unable to allocate trace enum mapping\n");
9828413d
SRRH
4153 return;
4154 }
4155
4156 mutex_lock(&trace_enum_mutex);
4157
4158 if (!trace_enum_maps)
4159 trace_enum_maps = map_array;
4160 else {
4161 ptr = trace_enum_maps;
4162 for (;;) {
4163 ptr = trace_enum_jmp_to_tail(ptr);
4164 if (!ptr->tail.next)
4165 break;
4166 ptr = ptr->tail.next;
4167
4168 }
4169 ptr->tail.next = map_array;
4170 }
4171 map_array->head.mod = mod;
4172 map_array->head.length = len;
4173 map_array++;
4174
4175 for (map = start; (unsigned long)map < (unsigned long)stop; map++) {
4176 map_array->map = **map;
4177 map_array++;
4178 }
4179 memset(map_array, 0, sizeof(*map_array));
4180
4181 mutex_unlock(&trace_enum_mutex);
4182}
4183
4184static void trace_create_enum_file(struct dentry *d_tracer)
4185{
4186 trace_create_file("enum_map", 0444, d_tracer,
4187 NULL, &tracing_enum_map_fops);
4188}
4189
4190#else /* CONFIG_TRACE_ENUM_MAP_FILE */
/* No-op stubs used when the enum_map file support is compiled out. */
static inline void trace_create_enum_file(struct dentry *d_tracer)
{
}

static inline void trace_insert_enum_map_file(struct module *mod,
					      struct trace_enum_map **start,
					      int len)
{
}
4194#endif /* !CONFIG_TRACE_ENUM_MAP_FILE */
4195
/*
 * Register @len enum maps starting at @start: update the trace events
 * with them and add them to the enum_map file. Does nothing when @len
 * is not positive.
 */
static void trace_insert_enum_map(struct module *mod,
				  struct trace_enum_map **start, int len)
{
	if (len <= 0)
		return;

	trace_event_enum_update(start, len);
	trace_insert_enum_map_file(mod, start, len);
}
4210
bc0c38d1
SR
4211static ssize_t
4212tracing_set_trace_read(struct file *filp, char __user *ubuf,
4213 size_t cnt, loff_t *ppos)
4214{
2b6080f2 4215 struct trace_array *tr = filp->private_data;
ee6c2c1b 4216 char buf[MAX_TRACER_SIZE+2];
bc0c38d1
SR
4217 int r;
4218
4219 mutex_lock(&trace_types_lock);
2b6080f2 4220 r = sprintf(buf, "%s\n", tr->current_trace->name);
bc0c38d1
SR
4221 mutex_unlock(&trace_types_lock);
4222
4bf39a94 4223 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
bc0c38d1
SR
4224}
4225
b6f11df2
ACM
4226int tracer_init(struct tracer *t, struct trace_array *tr)
4227{
12883efb 4228 tracing_reset_online_cpus(&tr->trace_buffer);
b6f11df2
ACM
4229 return t->init(tr);
4230}
4231
12883efb 4232static void set_buffer_entries(struct trace_buffer *buf, unsigned long val)
438ced17
VN
4233{
4234 int cpu;
737223fb 4235
438ced17 4236 for_each_tracing_cpu(cpu)
12883efb 4237 per_cpu_ptr(buf->data, cpu)->entries = val;
438ced17
VN
4238}
4239
12883efb 4240#ifdef CONFIG_TRACER_MAX_TRACE
d60da506 4241/* resize @tr's buffer to the size of @size_tr's entries */
12883efb
SRRH
4242static int resize_buffer_duplicate_size(struct trace_buffer *trace_buf,
4243 struct trace_buffer *size_buf, int cpu_id)
d60da506
HT
4244{
4245 int cpu, ret = 0;
4246
4247 if (cpu_id == RING_BUFFER_ALL_CPUS) {
4248 for_each_tracing_cpu(cpu) {
12883efb
SRRH
4249 ret = ring_buffer_resize(trace_buf->buffer,
4250 per_cpu_ptr(size_buf->data, cpu)->entries, cpu);
d60da506
HT
4251 if (ret < 0)
4252 break;
12883efb
SRRH
4253 per_cpu_ptr(trace_buf->data, cpu)->entries =
4254 per_cpu_ptr(size_buf->data, cpu)->entries;
d60da506
HT
4255 }
4256 } else {
12883efb
SRRH
4257 ret = ring_buffer_resize(trace_buf->buffer,
4258 per_cpu_ptr(size_buf->data, cpu_id)->entries, cpu_id);
d60da506 4259 if (ret == 0)
12883efb
SRRH
4260 per_cpu_ptr(trace_buf->data, cpu_id)->entries =
4261 per_cpu_ptr(size_buf->data, cpu_id)->entries;
d60da506
HT
4262 }
4263
4264 return ret;
4265}
12883efb 4266#endif /* CONFIG_TRACER_MAX_TRACE */
d60da506 4267
2b6080f2
SR
4268static int __tracing_resize_ring_buffer(struct trace_array *tr,
4269 unsigned long size, int cpu)
73c5162a
SR
4270{
4271 int ret;
4272
4273 /*
4274 * If kernel or user changes the size of the ring buffer
a123c52b
SR
4275 * we use the size that was given, and we can forget about
4276 * expanding it later.
73c5162a 4277 */
55034cd6 4278 ring_buffer_expanded = true;
73c5162a 4279
b382ede6 4280 /* May be called before buffers are initialized */
12883efb 4281 if (!tr->trace_buffer.buffer)
b382ede6
SR
4282 return 0;
4283
12883efb 4284 ret = ring_buffer_resize(tr->trace_buffer.buffer, size, cpu);
73c5162a
SR
4285 if (ret < 0)
4286 return ret;
4287
12883efb 4288#ifdef CONFIG_TRACER_MAX_TRACE
2b6080f2
SR
4289 if (!(tr->flags & TRACE_ARRAY_FL_GLOBAL) ||
4290 !tr->current_trace->use_max_tr)
ef710e10
KM
4291 goto out;
4292
12883efb 4293 ret = ring_buffer_resize(tr->max_buffer.buffer, size, cpu);
73c5162a 4294 if (ret < 0) {
12883efb
SRRH
4295 int r = resize_buffer_duplicate_size(&tr->trace_buffer,
4296 &tr->trace_buffer, cpu);
73c5162a 4297 if (r < 0) {
a123c52b
SR
4298 /*
4299 * AARGH! We are left with different
4300 * size max buffer!!!!
4301 * The max buffer is our "snapshot" buffer.
4302 * When a tracer needs a snapshot (one of the
4303 * latency tracers), it swaps the max buffer
4304 * with the saved snap shot. We succeeded to
4305 * update the size of the main buffer, but failed to
4306 * update the size of the max buffer. But when we tried
4307 * to reset the main buffer to the original size, we
4308 * failed there too. This is very unlikely to
4309 * happen, but if it does, warn and kill all
4310 * tracing.
4311 */
73c5162a
SR
4312 WARN_ON(1);
4313 tracing_disabled = 1;
4314 }
4315 return ret;
4316 }
4317
438ced17 4318 if (cpu == RING_BUFFER_ALL_CPUS)
12883efb 4319 set_buffer_entries(&tr->max_buffer, size);
438ced17 4320 else
12883efb 4321 per_cpu_ptr(tr->max_buffer.data, cpu)->entries = size;
438ced17 4322
ef710e10 4323 out:
12883efb
SRRH
4324#endif /* CONFIG_TRACER_MAX_TRACE */
4325
438ced17 4326 if (cpu == RING_BUFFER_ALL_CPUS)
12883efb 4327 set_buffer_entries(&tr->trace_buffer, size);
438ced17 4328 else
12883efb 4329 per_cpu_ptr(tr->trace_buffer.data, cpu)->entries = size;
73c5162a
SR
4330
4331 return ret;
4332}
4333
2b6080f2
SR
4334static ssize_t tracing_resize_ring_buffer(struct trace_array *tr,
4335 unsigned long size, int cpu_id)
4f271a2a 4336{
83f40318 4337 int ret = size;
4f271a2a
VN
4338
4339 mutex_lock(&trace_types_lock);
4340
438ced17
VN
4341 if (cpu_id != RING_BUFFER_ALL_CPUS) {
4342 /* make sure, this cpu is enabled in the mask */
4343 if (!cpumask_test_cpu(cpu_id, tracing_buffer_mask)) {
4344 ret = -EINVAL;
4345 goto out;
4346 }
4347 }
4f271a2a 4348
2b6080f2 4349 ret = __tracing_resize_ring_buffer(tr, size, cpu_id);
4f271a2a
VN
4350 if (ret < 0)
4351 ret = -ENOMEM;
4352
438ced17 4353out:
4f271a2a
VN
4354 mutex_unlock(&trace_types_lock);
4355
4356 return ret;
4357}
4358
ef710e10 4359
1852fcce
SR
4360/**
4361 * tracing_update_buffers - used by tracing facility to expand ring buffers
4362 *
4363 * To save on memory when the tracing is never used on a system with it
4364 * configured in. The ring buffers are set to a minimum size. But once
4365 * a user starts to use the tracing facility, then they need to grow
4366 * to their default size.
4367 *
4368 * This function is to be called when a tracer is about to be used.
4369 */
4370int tracing_update_buffers(void)
4371{
4372 int ret = 0;
4373
1027fcb2 4374 mutex_lock(&trace_types_lock);
1852fcce 4375 if (!ring_buffer_expanded)
2b6080f2 4376 ret = __tracing_resize_ring_buffer(&global_trace, trace_buf_size,
438ced17 4377 RING_BUFFER_ALL_CPUS);
1027fcb2 4378 mutex_unlock(&trace_types_lock);
1852fcce
SR
4379
4380 return ret;
4381}
4382
577b785f
SR
4383struct trace_option_dentry;
4384
37aea98b 4385static void
2b6080f2 4386create_trace_option_files(struct trace_array *tr, struct tracer *tracer);
577b785f 4387
6b450d25
SRRH
4388/*
4389 * Used to clear out the tracer before deletion of an instance.
4390 * Must have trace_types_lock held.
4391 */
4392static void tracing_set_nop(struct trace_array *tr)
4393{
4394 if (tr->current_trace == &nop_trace)
4395 return;
4396
50512ab5 4397 tr->current_trace->enabled--;
6b450d25
SRRH
4398
4399 if (tr->current_trace->reset)
4400 tr->current_trace->reset(tr);
4401
4402 tr->current_trace = &nop_trace;
4403}
4404
41d9c0be 4405static void add_tracer_options(struct trace_array *tr, struct tracer *t)
bc0c38d1 4406{
09d23a1d
SRRH
4407 /* Only enable if the directory has been created already. */
4408 if (!tr->dir)
4409 return;
4410
37aea98b 4411 create_trace_option_files(tr, t);
09d23a1d
SRRH
4412}
4413
4414static int tracing_set_tracer(struct trace_array *tr, const char *buf)
4415{
bc0c38d1 4416 struct tracer *t;
12883efb 4417#ifdef CONFIG_TRACER_MAX_TRACE
34600f0e 4418 bool had_max_tr;
12883efb 4419#endif
d9e54076 4420 int ret = 0;
bc0c38d1 4421
1027fcb2
SR
4422 mutex_lock(&trace_types_lock);
4423
73c5162a 4424 if (!ring_buffer_expanded) {
2b6080f2 4425 ret = __tracing_resize_ring_buffer(tr, trace_buf_size,
438ced17 4426 RING_BUFFER_ALL_CPUS);
73c5162a 4427 if (ret < 0)
59f586db 4428 goto out;
73c5162a
SR
4429 ret = 0;
4430 }
4431
bc0c38d1
SR
4432 for (t = trace_types; t; t = t->next) {
4433 if (strcmp(t->name, buf) == 0)
4434 break;
4435 }
c2931e05
FW
4436 if (!t) {
4437 ret = -EINVAL;
4438 goto out;
4439 }
2b6080f2 4440 if (t == tr->current_trace)
bc0c38d1
SR
4441 goto out;
4442
607e2ea1
SRRH
4443 /* Some tracers are only allowed for the top level buffer */
4444 if (!trace_ok_for_array(t, tr)) {
4445 ret = -EINVAL;
4446 goto out;
4447 }
4448
cf6ab6d9
SRRH
4449 /* If trace pipe files are being read, we can't change the tracer */
4450 if (tr->current_trace->ref) {
4451 ret = -EBUSY;
4452 goto out;
4453 }
4454
9f029e83 4455 trace_branch_disable();
613f04a0 4456
50512ab5 4457 tr->current_trace->enabled--;
613f04a0 4458
2b6080f2
SR
4459 if (tr->current_trace->reset)
4460 tr->current_trace->reset(tr);
34600f0e 4461
12883efb 4462 /* Current trace needs to be nop_trace before synchronize_sched */
2b6080f2 4463 tr->current_trace = &nop_trace;
34600f0e 4464
45ad21ca
SRRH
4465#ifdef CONFIG_TRACER_MAX_TRACE
4466 had_max_tr = tr->allocated_snapshot;
34600f0e
SR
4467
4468 if (had_max_tr && !t->use_max_tr) {
4469 /*
4470 * We need to make sure that the update_max_tr sees that
4471 * current_trace changed to nop_trace to keep it from
4472 * swapping the buffers after we resize it.
4473 * The update_max_tr is called from interrupts disabled
4474 * so a synchronized_sched() is sufficient.
4475 */
4476 synchronize_sched();
3209cff4 4477 free_snapshot(tr);
ef710e10 4478 }
12883efb 4479#endif
12883efb
SRRH
4480
4481#ifdef CONFIG_TRACER_MAX_TRACE
34600f0e 4482 if (t->use_max_tr && !had_max_tr) {
3209cff4 4483 ret = alloc_snapshot(tr);
d60da506
HT
4484 if (ret < 0)
4485 goto out;
ef710e10 4486 }
12883efb 4487#endif
577b785f 4488
1c80025a 4489 if (t->init) {
b6f11df2 4490 ret = tracer_init(t, tr);
1c80025a
FW
4491 if (ret)
4492 goto out;
4493 }
bc0c38d1 4494
2b6080f2 4495 tr->current_trace = t;
50512ab5 4496 tr->current_trace->enabled++;
9f029e83 4497 trace_branch_enable(tr);
bc0c38d1
SR
4498 out:
4499 mutex_unlock(&trace_types_lock);
4500
d9e54076
PZ
4501 return ret;
4502}
4503
4504static ssize_t
4505tracing_set_trace_write(struct file *filp, const char __user *ubuf,
4506 size_t cnt, loff_t *ppos)
4507{
607e2ea1 4508 struct trace_array *tr = filp->private_data;
ee6c2c1b 4509 char buf[MAX_TRACER_SIZE+1];
d9e54076
PZ
4510 int i;
4511 size_t ret;
e6e7a65a
FW
4512 int err;
4513
4514 ret = cnt;
d9e54076 4515
ee6c2c1b
LZ
4516 if (cnt > MAX_TRACER_SIZE)
4517 cnt = MAX_TRACER_SIZE;
d9e54076
PZ
4518
4519 if (copy_from_user(&buf, ubuf, cnt))
4520 return -EFAULT;
4521
4522 buf[cnt] = 0;
4523
4524 /* strip ending whitespace. */
4525 for (i = cnt - 1; i > 0 && isspace(buf[i]); i--)
4526 buf[i] = 0;
4527
607e2ea1 4528 err = tracing_set_tracer(tr, buf);
e6e7a65a
FW
4529 if (err)
4530 return err;
d9e54076 4531
cf8517cf 4532 *ppos += ret;
bc0c38d1 4533
c2931e05 4534 return ret;
bc0c38d1
SR
4535}
4536
4537static ssize_t
6508fa76
SF
4538tracing_nsecs_read(unsigned long *ptr, char __user *ubuf,
4539 size_t cnt, loff_t *ppos)
bc0c38d1 4540{
bc0c38d1
SR
4541 char buf[64];
4542 int r;
4543
cffae437 4544 r = snprintf(buf, sizeof(buf), "%ld\n",
bc0c38d1 4545 *ptr == (unsigned long)-1 ? -1 : nsecs_to_usecs(*ptr));
cffae437
SR
4546 if (r > sizeof(buf))
4547 r = sizeof(buf);
4bf39a94 4548 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
bc0c38d1
SR
4549}
4550
4551static ssize_t
6508fa76
SF
4552tracing_nsecs_write(unsigned long *ptr, const char __user *ubuf,
4553 size_t cnt, loff_t *ppos)
bc0c38d1 4554{
5e39841c 4555 unsigned long val;
c6caeeb1 4556 int ret;
bc0c38d1 4557
22fe9b54
PH
4558 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
4559 if (ret)
c6caeeb1 4560 return ret;
bc0c38d1
SR
4561
4562 *ptr = val * 1000;
4563
4564 return cnt;
4565}
4566
6508fa76
SF
4567static ssize_t
4568tracing_thresh_read(struct file *filp, char __user *ubuf,
4569 size_t cnt, loff_t *ppos)
4570{
4571 return tracing_nsecs_read(&tracing_thresh, ubuf, cnt, ppos);
4572}
4573
4574static ssize_t
4575tracing_thresh_write(struct file *filp, const char __user *ubuf,
4576 size_t cnt, loff_t *ppos)
4577{
4578 struct trace_array *tr = filp->private_data;
4579 int ret;
4580
4581 mutex_lock(&trace_types_lock);
4582 ret = tracing_nsecs_write(&tracing_thresh, ubuf, cnt, ppos);
4583 if (ret < 0)
4584 goto out;
4585
4586 if (tr->current_trace->update_thresh) {
4587 ret = tr->current_trace->update_thresh(tr);
4588 if (ret < 0)
4589 goto out;
4590 }
4591
4592 ret = cnt;
4593out:
4594 mutex_unlock(&trace_types_lock);
4595
4596 return ret;
4597}
4598
e428abbb
CG
4599#ifdef CONFIG_TRACER_MAX_TRACE
4600
6508fa76
SF
4601static ssize_t
4602tracing_max_lat_read(struct file *filp, char __user *ubuf,
4603 size_t cnt, loff_t *ppos)
4604{
4605 return tracing_nsecs_read(filp->private_data, ubuf, cnt, ppos);
4606}
4607
4608static ssize_t
4609tracing_max_lat_write(struct file *filp, const char __user *ubuf,
4610 size_t cnt, loff_t *ppos)
4611{
4612 return tracing_nsecs_write(filp->private_data, ubuf, cnt, ppos);
4613}
4614
e428abbb
CG
4615#endif
4616
b3806b43
SR
4617static int tracing_open_pipe(struct inode *inode, struct file *filp)
4618{
15544209 4619 struct trace_array *tr = inode->i_private;
b3806b43 4620 struct trace_iterator *iter;
b04cc6b1 4621 int ret = 0;
b3806b43
SR
4622
4623 if (tracing_disabled)
4624 return -ENODEV;
4625
7b85af63
SRRH
4626 if (trace_array_get(tr) < 0)
4627 return -ENODEV;
4628
b04cc6b1
FW
4629 mutex_lock(&trace_types_lock);
4630
b3806b43
SR
4631 /* create a buffer to store the information to pass to userspace */
4632 iter = kzalloc(sizeof(*iter), GFP_KERNEL);
b04cc6b1
FW
4633 if (!iter) {
4634 ret = -ENOMEM;
f77d09a3 4635 __trace_array_put(tr);
b04cc6b1
FW
4636 goto out;
4637 }
b3806b43 4638
3a161d99 4639 trace_seq_init(&iter->seq);
d716ff71 4640 iter->trace = tr->current_trace;
d7350c3f 4641
4462344e 4642 if (!alloc_cpumask_var(&iter->started, GFP_KERNEL)) {
b04cc6b1 4643 ret = -ENOMEM;
d7350c3f 4644 goto fail;
4462344e
RR
4645 }
4646
a309720c 4647 /* trace pipe does not show start of buffer */
4462344e 4648 cpumask_setall(iter->started);
a309720c 4649
983f938a 4650 if (tr->trace_flags & TRACE_ITER_LATENCY_FMT)
112f38a7
SR
4651 iter->iter_flags |= TRACE_FILE_LAT_FMT;
4652
8be0709f 4653 /* Output in nanoseconds only if we are using a clock in nanoseconds. */
58e8eedf 4654 if (trace_clocks[tr->clock_id].in_ns)
8be0709f
DS
4655 iter->iter_flags |= TRACE_FILE_TIME_IN_NS;
4656
15544209
ON
4657 iter->tr = tr;
4658 iter->trace_buffer = &tr->trace_buffer;
4659 iter->cpu_file = tracing_get_cpu(inode);
d7350c3f 4660 mutex_init(&iter->mutex);
b3806b43
SR
4661 filp->private_data = iter;
4662
107bad8b
SR
4663 if (iter->trace->pipe_open)
4664 iter->trace->pipe_open(iter);
107bad8b 4665
b444786f 4666 nonseekable_open(inode, filp);
cf6ab6d9
SRRH
4667
4668 tr->current_trace->ref++;
b04cc6b1
FW
4669out:
4670 mutex_unlock(&trace_types_lock);
4671 return ret;
d7350c3f
FW
4672
4673fail:
4674 kfree(iter->trace);
4675 kfree(iter);
7b85af63 4676 __trace_array_put(tr);
d7350c3f
FW
4677 mutex_unlock(&trace_types_lock);
4678 return ret;
b3806b43
SR
4679}
4680
4681static int tracing_release_pipe(struct inode *inode, struct file *file)
4682{
4683 struct trace_iterator *iter = file->private_data;
15544209 4684 struct trace_array *tr = inode->i_private;
b3806b43 4685
b04cc6b1
FW
4686 mutex_lock(&trace_types_lock);
4687
cf6ab6d9
SRRH
4688 tr->current_trace->ref--;
4689
29bf4a5e 4690 if (iter->trace->pipe_close)
c521efd1
SR
4691 iter->trace->pipe_close(iter);
4692
b04cc6b1
FW
4693 mutex_unlock(&trace_types_lock);
4694
4462344e 4695 free_cpumask_var(iter->started);
d7350c3f 4696 mutex_destroy(&iter->mutex);
b3806b43 4697 kfree(iter);
b3806b43 4698
7b85af63
SRRH
4699 trace_array_put(tr);
4700
b3806b43
SR
4701 return 0;
4702}
4703
2a2cc8f7 4704static unsigned int
cc60cdc9 4705trace_poll(struct trace_iterator *iter, struct file *filp, poll_table *poll_table)
2a2cc8f7 4706{
983f938a
SRRH
4707 struct trace_array *tr = iter->tr;
4708
15693458
SRRH
4709 /* Iterators are static, they should be filled or empty */
4710 if (trace_buffer_iter(iter, iter->cpu_file))
4711 return POLLIN | POLLRDNORM;
2a2cc8f7 4712
983f938a 4713 if (tr->trace_flags & TRACE_ITER_BLOCK)
2a2cc8f7
SSP
4714 /*
4715 * Always select as readable when in blocking mode
4716 */
4717 return POLLIN | POLLRDNORM;
15693458 4718 else
12883efb 4719 return ring_buffer_poll_wait(iter->trace_buffer->buffer, iter->cpu_file,
15693458 4720 filp, poll_table);
2a2cc8f7 4721}
2a2cc8f7 4722
cc60cdc9
SR
4723static unsigned int
4724tracing_poll_pipe(struct file *filp, poll_table *poll_table)
4725{
4726 struct trace_iterator *iter = filp->private_data;
4727
4728 return trace_poll(iter, filp, poll_table);
2a2cc8f7
SSP
4729}
4730
d716ff71 4731/* Must be called with iter->mutex held. */
ff98781b 4732static int tracing_wait_pipe(struct file *filp)
b3806b43
SR
4733{
4734 struct trace_iterator *iter = filp->private_data;
8b8b3683 4735 int ret;
b3806b43 4736
b3806b43 4737 while (trace_empty(iter)) {
2dc8f095 4738
107bad8b 4739 if ((filp->f_flags & O_NONBLOCK)) {
ff98781b 4740 return -EAGAIN;
107bad8b 4741 }
2dc8f095 4742
b3806b43 4743 /*
250bfd3d 4744 * We block until we read something and tracing is disabled.
b3806b43
SR
4745 * We still block if tracing is disabled, but we have never
4746 * read anything. This allows a user to cat this file, and
4747 * then enable tracing. But after we have read something,
4748 * we give an EOF when tracing is again disabled.
4749 *
4750 * iter->pos will be 0 if we haven't read anything.
4751 */
10246fa3 4752 if (!tracing_is_on() && iter->pos)
b3806b43 4753 break;
f4874261
SRRH
4754
4755 mutex_unlock(&iter->mutex);
4756
e30f53aa 4757 ret = wait_on_pipe(iter, false);
f4874261
SRRH
4758
4759 mutex_lock(&iter->mutex);
4760
8b8b3683
SRRH
4761 if (ret)
4762 return ret;
b3806b43
SR
4763 }
4764
ff98781b
EGM
4765 return 1;
4766}
4767
4768/*
4769 * Consumer reader.
4770 */
4771static ssize_t
4772tracing_read_pipe(struct file *filp, char __user *ubuf,
4773 size_t cnt, loff_t *ppos)
4774{
4775 struct trace_iterator *iter = filp->private_data;
4776 ssize_t sret;
4777
4778 /* return any leftover data */
4779 sret = trace_seq_to_user(&iter->seq, ubuf, cnt);
4780 if (sret != -EBUSY)
4781 return sret;
4782
f9520750 4783 trace_seq_init(&iter->seq);
ff98781b 4784
d7350c3f
FW
4785 /*
4786 * Avoid more than one consumer on a single file descriptor
4787 * This is just a matter of traces coherency, the ring buffer itself
4788 * is protected.
4789 */
4790 mutex_lock(&iter->mutex);
ff98781b
EGM
4791 if (iter->trace->read) {
4792 sret = iter->trace->read(iter, filp, ubuf, cnt, ppos);
4793 if (sret)
4794 goto out;
4795 }
4796
4797waitagain:
4798 sret = tracing_wait_pipe(filp);
4799 if (sret <= 0)
4800 goto out;
4801
b3806b43 4802 /* stop when tracing is finished */
ff98781b
EGM
4803 if (trace_empty(iter)) {
4804 sret = 0;
107bad8b 4805 goto out;
ff98781b 4806 }
b3806b43
SR
4807
4808 if (cnt >= PAGE_SIZE)
4809 cnt = PAGE_SIZE - 1;
4810
53d0aa77 4811 /* reset all but tr, trace, and overruns */
53d0aa77
SR
4812 memset(&iter->seq, 0,
4813 sizeof(struct trace_iterator) -
4814 offsetof(struct trace_iterator, seq));
ed5467da 4815 cpumask_clear(iter->started);
4823ed7e 4816 iter->pos = -1;
b3806b43 4817
4f535968 4818 trace_event_read_lock();
7e53bd42 4819 trace_access_lock(iter->cpu_file);
955b61e5 4820 while (trace_find_next_entry_inc(iter) != NULL) {
2c4f035f 4821 enum print_line_t ret;
5ac48378 4822 int save_len = iter->seq.seq.len;
088b1e42 4823
f9896bf3 4824 ret = print_trace_line(iter);
2c4f035f 4825 if (ret == TRACE_TYPE_PARTIAL_LINE) {
088b1e42 4826 /* don't print partial lines */
5ac48378 4827 iter->seq.seq.len = save_len;
b3806b43 4828 break;
088b1e42 4829 }
b91facc3
FW
4830 if (ret != TRACE_TYPE_NO_CONSUME)
4831 trace_consume(iter);
b3806b43 4832
5ac48378 4833 if (trace_seq_used(&iter->seq) >= cnt)
b3806b43 4834 break;
ee5e51f5
JO
4835
4836 /*
4837 * Setting the full flag means we reached the trace_seq buffer
4838 * size and we should leave by partial output condition above.
4839 * One of the trace_seq_* functions is not used properly.
4840 */
4841 WARN_ONCE(iter->seq.full, "full flag set for trace type %d",
4842 iter->ent->type);
b3806b43 4843 }
7e53bd42 4844 trace_access_unlock(iter->cpu_file);
4f535968 4845 trace_event_read_unlock();
b3806b43 4846
b3806b43 4847 /* Now copy what we have to the user */
6c6c2796 4848 sret = trace_seq_to_user(&iter->seq, ubuf, cnt);
5ac48378 4849 if (iter->seq.seq.readpos >= trace_seq_used(&iter->seq))
f9520750 4850 trace_seq_init(&iter->seq);
9ff4b974
PP
4851
4852 /*
25985edc 4853 * If there was nothing to send to user, in spite of consuming trace
9ff4b974
PP
4854 * entries, go back to wait for more entries.
4855 */
6c6c2796 4856 if (sret == -EBUSY)
9ff4b974 4857 goto waitagain;
b3806b43 4858
107bad8b 4859out:
d7350c3f 4860 mutex_unlock(&iter->mutex);
107bad8b 4861
6c6c2796 4862 return sret;
b3806b43
SR
4863}
4864
3c56819b
EGM
4865static void tracing_spd_release_pipe(struct splice_pipe_desc *spd,
4866 unsigned int idx)
4867{
4868 __free_page(spd->pages[idx]);
4869}
4870
28dfef8f 4871static const struct pipe_buf_operations tracing_pipe_buf_ops = {
34cd4998 4872 .can_merge = 0,
34cd4998 4873 .confirm = generic_pipe_buf_confirm,
92fdd98c 4874 .release = generic_pipe_buf_release,
34cd4998
SR
4875 .steal = generic_pipe_buf_steal,
4876 .get = generic_pipe_buf_get,
3c56819b
EGM
4877};
4878
34cd4998 4879static size_t
fa7c7f6e 4880tracing_fill_pipe_page(size_t rem, struct trace_iterator *iter)
34cd4998
SR
4881{
4882 size_t count;
74f06bb7 4883 int save_len;
34cd4998
SR
4884 int ret;
4885
4886 /* Seq buffer is page-sized, exactly what we need. */
4887 for (;;) {
74f06bb7 4888 save_len = iter->seq.seq.len;
34cd4998 4889 ret = print_trace_line(iter);
74f06bb7
SRRH
4890
4891 if (trace_seq_has_overflowed(&iter->seq)) {
4892 iter->seq.seq.len = save_len;
34cd4998
SR
4893 break;
4894 }
74f06bb7
SRRH
4895
4896 /*
4897 * This should not be hit, because it should only
4898 * be set if the iter->seq overflowed. But check it
4899 * anyway to be safe.
4900 */
34cd4998 4901 if (ret == TRACE_TYPE_PARTIAL_LINE) {
74f06bb7
SRRH
4902 iter->seq.seq.len = save_len;
4903 break;
4904 }
4905
5ac48378 4906 count = trace_seq_used(&iter->seq) - save_len;
74f06bb7
SRRH
4907 if (rem < count) {
4908 rem = 0;
4909 iter->seq.seq.len = save_len;
34cd4998
SR
4910 break;
4911 }
4912
74e7ff8c
LJ
4913 if (ret != TRACE_TYPE_NO_CONSUME)
4914 trace_consume(iter);
34cd4998 4915 rem -= count;
955b61e5 4916 if (!trace_find_next_entry_inc(iter)) {
34cd4998
SR
4917 rem = 0;
4918 iter->ent = NULL;
4919 break;
4920 }
4921 }
4922
4923 return rem;
4924}
4925
3c56819b
EGM
4926static ssize_t tracing_splice_read_pipe(struct file *filp,
4927 loff_t *ppos,
4928 struct pipe_inode_info *pipe,
4929 size_t len,
4930 unsigned int flags)
4931{
35f3d14d
JA
4932 struct page *pages_def[PIPE_DEF_BUFFERS];
4933 struct partial_page partial_def[PIPE_DEF_BUFFERS];
3c56819b
EGM
4934 struct trace_iterator *iter = filp->private_data;
4935 struct splice_pipe_desc spd = {
35f3d14d
JA
4936 .pages = pages_def,
4937 .partial = partial_def,
34cd4998 4938 .nr_pages = 0, /* This gets updated below. */
047fe360 4939 .nr_pages_max = PIPE_DEF_BUFFERS,
34cd4998
SR
4940 .flags = flags,
4941 .ops = &tracing_pipe_buf_ops,
4942 .spd_release = tracing_spd_release_pipe,
3c56819b
EGM
4943 };
4944 ssize_t ret;
34cd4998 4945 size_t rem;
3c56819b
EGM
4946 unsigned int i;
4947
35f3d14d
JA
4948 if (splice_grow_spd(pipe, &spd))
4949 return -ENOMEM;
4950
d7350c3f 4951 mutex_lock(&iter->mutex);
3c56819b
EGM
4952
4953 if (iter->trace->splice_read) {
4954 ret = iter->trace->splice_read(iter, filp,
4955 ppos, pipe, len, flags);
4956 if (ret)
34cd4998 4957 goto out_err;
3c56819b
EGM
4958 }
4959
4960 ret = tracing_wait_pipe(filp);
4961 if (ret <= 0)
34cd4998 4962 goto out_err;
3c56819b 4963
955b61e5 4964 if (!iter->ent && !trace_find_next_entry_inc(iter)) {
3c56819b 4965 ret = -EFAULT;
34cd4998 4966 goto out_err;
3c56819b
EGM
4967 }
4968
4f535968 4969 trace_event_read_lock();
7e53bd42 4970 trace_access_lock(iter->cpu_file);
4f535968 4971
3c56819b 4972 /* Fill as many pages as possible. */
a786c06d 4973 for (i = 0, rem = len; i < spd.nr_pages_max && rem; i++) {
35f3d14d
JA
4974 spd.pages[i] = alloc_page(GFP_KERNEL);
4975 if (!spd.pages[i])
34cd4998 4976 break;
3c56819b 4977
fa7c7f6e 4978 rem = tracing_fill_pipe_page(rem, iter);
3c56819b
EGM
4979
4980 /* Copy the data into the page, so we can start over. */
4981 ret = trace_seq_to_buffer(&iter->seq,
35f3d14d 4982 page_address(spd.pages[i]),
5ac48378 4983 trace_seq_used(&iter->seq));
3c56819b 4984 if (ret < 0) {
35f3d14d 4985 __free_page(spd.pages[i]);
3c56819b
EGM
4986 break;
4987 }
35f3d14d 4988 spd.partial[i].offset = 0;
5ac48378 4989 spd.partial[i].len = trace_seq_used(&iter->seq);
3c56819b 4990
f9520750 4991 trace_seq_init(&iter->seq);
3c56819b
EGM
4992 }
4993
7e53bd42 4994 trace_access_unlock(iter->cpu_file);
4f535968 4995 trace_event_read_unlock();
d7350c3f 4996 mutex_unlock(&iter->mutex);
3c56819b
EGM
4997
4998 spd.nr_pages = i;
4999
a29054d9
SRRH
5000 if (i)
5001 ret = splice_to_pipe(pipe, &spd);
5002 else
5003 ret = 0;
35f3d14d 5004out:
047fe360 5005 splice_shrink_spd(&spd);
35f3d14d 5006 return ret;
3c56819b 5007
34cd4998 5008out_err:
d7350c3f 5009 mutex_unlock(&iter->mutex);
35f3d14d 5010 goto out;
3c56819b
EGM
5011}
5012
a98a3c3f
SR
5013static ssize_t
5014tracing_entries_read(struct file *filp, char __user *ubuf,
5015 size_t cnt, loff_t *ppos)
5016{
0bc392ee
ON
5017 struct inode *inode = file_inode(filp);
5018 struct trace_array *tr = inode->i_private;
5019 int cpu = tracing_get_cpu(inode);
438ced17
VN
5020 char buf[64];
5021 int r = 0;
5022 ssize_t ret;
a98a3c3f 5023
db526ca3 5024 mutex_lock(&trace_types_lock);
438ced17 5025
0bc392ee 5026 if (cpu == RING_BUFFER_ALL_CPUS) {
438ced17
VN
5027 int cpu, buf_size_same;
5028 unsigned long size;
5029
5030 size = 0;
5031 buf_size_same = 1;
5032 /* check if all cpu sizes are same */
5033 for_each_tracing_cpu(cpu) {
5034 /* fill in the size from first enabled cpu */
5035 if (size == 0)
12883efb
SRRH
5036 size = per_cpu_ptr(tr->trace_buffer.data, cpu)->entries;
5037 if (size != per_cpu_ptr(tr->trace_buffer.data, cpu)->entries) {
438ced17
VN
5038 buf_size_same = 0;
5039 break;
5040 }
5041 }
5042
5043 if (buf_size_same) {
5044 if (!ring_buffer_expanded)
5045 r = sprintf(buf, "%lu (expanded: %lu)\n",
5046 size >> 10,
5047 trace_buf_size >> 10);
5048 else
5049 r = sprintf(buf, "%lu\n", size >> 10);
5050 } else
5051 r = sprintf(buf, "X\n");
5052 } else
0bc392ee 5053 r = sprintf(buf, "%lu\n", per_cpu_ptr(tr->trace_buffer.data, cpu)->entries >> 10);
438ced17 5054
db526ca3
SR
5055 mutex_unlock(&trace_types_lock);
5056
438ced17
VN
5057 ret = simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
5058 return ret;
a98a3c3f
SR
5059}
5060
5061static ssize_t
5062tracing_entries_write(struct file *filp, const char __user *ubuf,
5063 size_t cnt, loff_t *ppos)
5064{
0bc392ee
ON
5065 struct inode *inode = file_inode(filp);
5066 struct trace_array *tr = inode->i_private;
a98a3c3f 5067 unsigned long val;
4f271a2a 5068 int ret;
a98a3c3f 5069
22fe9b54
PH
5070 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
5071 if (ret)
c6caeeb1 5072 return ret;
a98a3c3f
SR
5073
5074 /* must have at least 1 entry */
5075 if (!val)
5076 return -EINVAL;
5077
1696b2b0
SR
5078 /* value is in KB */
5079 val <<= 10;
0bc392ee 5080 ret = tracing_resize_ring_buffer(tr, val, tracing_get_cpu(inode));
4f271a2a
VN
5081 if (ret < 0)
5082 return ret;
a98a3c3f 5083
cf8517cf 5084 *ppos += cnt;
a98a3c3f 5085
4f271a2a
VN
5086 return cnt;
5087}
bf5e6519 5088
f81ab074
VN
5089static ssize_t
5090tracing_total_entries_read(struct file *filp, char __user *ubuf,
5091 size_t cnt, loff_t *ppos)
5092{
5093 struct trace_array *tr = filp->private_data;
5094 char buf[64];
5095 int r, cpu;
5096 unsigned long size = 0, expanded_size = 0;
5097
5098 mutex_lock(&trace_types_lock);
5099 for_each_tracing_cpu(cpu) {
12883efb 5100 size += per_cpu_ptr(tr->trace_buffer.data, cpu)->entries >> 10;
f81ab074
VN
5101 if (!ring_buffer_expanded)
5102 expanded_size += trace_buf_size >> 10;
5103 }
5104 if (ring_buffer_expanded)
5105 r = sprintf(buf, "%lu\n", size);
5106 else
5107 r = sprintf(buf, "%lu (expanded: %lu)\n", size, expanded_size);
5108 mutex_unlock(&trace_types_lock);
5109
5110 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
5111}
5112
4f271a2a
VN
5113static ssize_t
5114tracing_free_buffer_write(struct file *filp, const char __user *ubuf,
5115 size_t cnt, loff_t *ppos)
5116{
5117 /*
5118 * There is no need to read what the user has written, this function
5119 * is just to make sure that there is no error when "echo" is used
5120 */
5121
5122 *ppos += cnt;
a98a3c3f
SR
5123
5124 return cnt;
5125}
5126
4f271a2a
VN
5127static int
5128tracing_free_buffer_release(struct inode *inode, struct file *filp)
5129{
2b6080f2
SR
5130 struct trace_array *tr = inode->i_private;
5131
cf30cf67 5132 /* disable tracing ? */
983f938a 5133 if (tr->trace_flags & TRACE_ITER_STOP_ON_FREE)
711e1243 5134 tracer_tracing_off(tr);
4f271a2a 5135 /* resize the ring buffer to 0 */
2b6080f2 5136 tracing_resize_ring_buffer(tr, 0, RING_BUFFER_ALL_CPUS);
4f271a2a 5137
7b85af63
SRRH
5138 trace_array_put(tr);
5139
4f271a2a
VN
5140 return 0;
5141}
5142
5bf9a1ee
PP
5143static ssize_t
5144tracing_mark_write(struct file *filp, const char __user *ubuf,
5145 size_t cnt, loff_t *fpos)
5146{
d696b58c 5147 unsigned long addr = (unsigned long)ubuf;
2d71619c 5148 struct trace_array *tr = filp->private_data;
d696b58c
SR
5149 struct ring_buffer_event *event;
5150 struct ring_buffer *buffer;
5151 struct print_entry *entry;
5152 unsigned long irq_flags;
5153 struct page *pages[2];
6edb2a8a 5154 void *map_page[2];
d696b58c
SR
5155 int nr_pages = 1;
5156 ssize_t written;
d696b58c
SR
5157 int offset;
5158 int size;
5159 int len;
5160 int ret;
6edb2a8a 5161 int i;
5bf9a1ee 5162
c76f0694 5163 if (tracing_disabled)
5bf9a1ee
PP
5164 return -EINVAL;
5165
983f938a 5166 if (!(tr->trace_flags & TRACE_ITER_MARKERS))
5224c3a3
MSB
5167 return -EINVAL;
5168
5bf9a1ee
PP
5169 if (cnt > TRACE_BUF_SIZE)
5170 cnt = TRACE_BUF_SIZE;
5171
d696b58c
SR
5172 /*
5173 * Userspace is injecting traces into the kernel trace buffer.
5174 * We want to be as non intrusive as possible.
5175 * To do so, we do not want to allocate any special buffers
5176 * or take any locks, but instead write the userspace data
5177 * straight into the ring buffer.
5178 *
5179 * First we need to pin the userspace buffer into memory,
5180 * which, most likely it is, because it just referenced it.
5181 * But there's no guarantee that it is. By using get_user_pages_fast()
5182 * and kmap_atomic/kunmap_atomic() we can get access to the
5183 * pages directly. We then write the data directly into the
5184 * ring buffer.
5185 */
5186 BUILD_BUG_ON(TRACE_BUF_SIZE >= PAGE_SIZE);
5bf9a1ee 5187
d696b58c
SR
5188 /* check if we cross pages */
5189 if ((addr & PAGE_MASK) != ((addr + cnt) & PAGE_MASK))
5190 nr_pages = 2;
5191
5192 offset = addr & (PAGE_SIZE - 1);
5193 addr &= PAGE_MASK;
5194
5195 ret = get_user_pages_fast(addr, nr_pages, 0, pages);
5196 if (ret < nr_pages) {
5197 while (--ret >= 0)
5198 put_page(pages[ret]);
5199 written = -EFAULT;
5200 goto out;
5bf9a1ee 5201 }
d696b58c 5202
6edb2a8a
SR
5203 for (i = 0; i < nr_pages; i++)
5204 map_page[i] = kmap_atomic(pages[i]);
d696b58c
SR
5205
5206 local_save_flags(irq_flags);
5207 size = sizeof(*entry) + cnt + 2; /* possible \n added */
2d71619c 5208 buffer = tr->trace_buffer.buffer;
d696b58c
SR
5209 event = trace_buffer_lock_reserve(buffer, TRACE_PRINT, size,
5210 irq_flags, preempt_count());
5211 if (!event) {
5212 /* Ring buffer disabled, return as if not open for write */
5213 written = -EBADF;
5214 goto out_unlock;
5bf9a1ee 5215 }
d696b58c
SR
5216
5217 entry = ring_buffer_event_data(event);
5218 entry->ip = _THIS_IP_;
5219
5220 if (nr_pages == 2) {
5221 len = PAGE_SIZE - offset;
6edb2a8a
SR
5222 memcpy(&entry->buf, map_page[0] + offset, len);
5223 memcpy(&entry->buf[len], map_page[1], cnt - len);
c13d2f7c 5224 } else
6edb2a8a 5225 memcpy(&entry->buf, map_page[0] + offset, cnt);
5bf9a1ee 5226
d696b58c
SR
5227 if (entry->buf[cnt - 1] != '\n') {
5228 entry->buf[cnt] = '\n';
5229 entry->buf[cnt + 1] = '\0';
5230 } else
5231 entry->buf[cnt] = '\0';
5232
7ffbd48d 5233 __buffer_unlock_commit(buffer, event);
5bf9a1ee 5234
d696b58c 5235 written = cnt;
5bf9a1ee 5236
d696b58c 5237 *fpos += written;
1aa54bca 5238
d696b58c 5239 out_unlock:
7215853e 5240 for (i = nr_pages - 1; i >= 0; i--) {
6edb2a8a
SR
5241 kunmap_atomic(map_page[i]);
5242 put_page(pages[i]);
5243 }
d696b58c 5244 out:
1aa54bca 5245 return written;
5bf9a1ee
PP
5246}
5247
13f16d20 5248static int tracing_clock_show(struct seq_file *m, void *v)
5079f326 5249{
2b6080f2 5250 struct trace_array *tr = m->private;
5079f326
Z
5251 int i;
5252
5253 for (i = 0; i < ARRAY_SIZE(trace_clocks); i++)
13f16d20 5254 seq_printf(m,
5079f326 5255 "%s%s%s%s", i ? " " : "",
2b6080f2
SR
5256 i == tr->clock_id ? "[" : "", trace_clocks[i].name,
5257 i == tr->clock_id ? "]" : "");
13f16d20 5258 seq_putc(m, '\n');
5079f326 5259
13f16d20 5260 return 0;
5079f326
Z
5261}
5262
e1e232ca 5263static int tracing_set_clock(struct trace_array *tr, const char *clockstr)
5079f326 5264{
5079f326
Z
5265 int i;
5266
5079f326
Z
5267 for (i = 0; i < ARRAY_SIZE(trace_clocks); i++) {
5268 if (strcmp(trace_clocks[i].name, clockstr) == 0)
5269 break;
5270 }
5271 if (i == ARRAY_SIZE(trace_clocks))
5272 return -EINVAL;
5273
5079f326
Z
5274 mutex_lock(&trace_types_lock);
5275
2b6080f2
SR
5276 tr->clock_id = i;
5277
12883efb 5278 ring_buffer_set_clock(tr->trace_buffer.buffer, trace_clocks[i].func);
5079f326 5279
60303ed3
DS
5280 /*
5281 * New clock may not be consistent with the previous clock.
5282 * Reset the buffer so that it doesn't have incomparable timestamps.
5283 */
9457158b 5284 tracing_reset_online_cpus(&tr->trace_buffer);
12883efb
SRRH
5285
5286#ifdef CONFIG_TRACER_MAX_TRACE
5287 if (tr->flags & TRACE_ARRAY_FL_GLOBAL && tr->max_buffer.buffer)
5288 ring_buffer_set_clock(tr->max_buffer.buffer, trace_clocks[i].func);
9457158b 5289 tracing_reset_online_cpus(&tr->max_buffer);
12883efb 5290#endif
60303ed3 5291
5079f326
Z
5292 mutex_unlock(&trace_types_lock);
5293
e1e232ca
SR
5294 return 0;
5295}
5296
5297static ssize_t tracing_clock_write(struct file *filp, const char __user *ubuf,
5298 size_t cnt, loff_t *fpos)
5299{
5300 struct seq_file *m = filp->private_data;
5301 struct trace_array *tr = m->private;
5302 char buf[64];
5303 const char *clockstr;
5304 int ret;
5305
5306 if (cnt >= sizeof(buf))
5307 return -EINVAL;
5308
5309 if (copy_from_user(&buf, ubuf, cnt))
5310 return -EFAULT;
5311
5312 buf[cnt] = 0;
5313
5314 clockstr = strstrip(buf);
5315
5316 ret = tracing_set_clock(tr, clockstr);
5317 if (ret)
5318 return ret;
5319
5079f326
Z
5320 *fpos += cnt;
5321
5322 return cnt;
5323}
5324
13f16d20
LZ
5325static int tracing_clock_open(struct inode *inode, struct file *file)
5326{
7b85af63
SRRH
5327 struct trace_array *tr = inode->i_private;
5328 int ret;
5329
13f16d20
LZ
5330 if (tracing_disabled)
5331 return -ENODEV;
2b6080f2 5332
7b85af63
SRRH
5333 if (trace_array_get(tr))
5334 return -ENODEV;
5335
5336 ret = single_open(file, tracing_clock_show, inode->i_private);
5337 if (ret < 0)
5338 trace_array_put(tr);
5339
5340 return ret;
13f16d20
LZ
5341}
5342
6de58e62
SRRH
5343struct ftrace_buffer_info {
5344 struct trace_iterator iter;
5345 void *spare;
5346 unsigned int read;
5347};
5348
debdd57f
HT
5349#ifdef CONFIG_TRACER_SNAPSHOT
5350static int tracing_snapshot_open(struct inode *inode, struct file *file)
5351{
6484c71c 5352 struct trace_array *tr = inode->i_private;
debdd57f 5353 struct trace_iterator *iter;
2b6080f2 5354 struct seq_file *m;
debdd57f
HT
5355 int ret = 0;
5356
ff451961
SRRH
5357 if (trace_array_get(tr) < 0)
5358 return -ENODEV;
5359
debdd57f 5360 if (file->f_mode & FMODE_READ) {
6484c71c 5361 iter = __tracing_open(inode, file, true);
debdd57f
HT
5362 if (IS_ERR(iter))
5363 ret = PTR_ERR(iter);
2b6080f2
SR
5364 } else {
5365 /* Writes still need the seq_file to hold the private data */
f77d09a3 5366 ret = -ENOMEM;
2b6080f2
SR
5367 m = kzalloc(sizeof(*m), GFP_KERNEL);
5368 if (!m)
f77d09a3 5369 goto out;
2b6080f2
SR
5370 iter = kzalloc(sizeof(*iter), GFP_KERNEL);
5371 if (!iter) {
5372 kfree(m);
f77d09a3 5373 goto out;
2b6080f2 5374 }
f77d09a3
AL
5375 ret = 0;
5376
ff451961 5377 iter->tr = tr;
6484c71c
ON
5378 iter->trace_buffer = &tr->max_buffer;
5379 iter->cpu_file = tracing_get_cpu(inode);
2b6080f2
SR
5380 m->private = iter;
5381 file->private_data = m;
debdd57f 5382 }
f77d09a3 5383out:
ff451961
SRRH
5384 if (ret < 0)
5385 trace_array_put(tr);
5386
debdd57f
HT
5387 return ret;
5388}
5389
5390static ssize_t
5391tracing_snapshot_write(struct file *filp, const char __user *ubuf, size_t cnt,
5392 loff_t *ppos)
5393{
2b6080f2
SR
5394 struct seq_file *m = filp->private_data;
5395 struct trace_iterator *iter = m->private;
5396 struct trace_array *tr = iter->tr;
debdd57f
HT
5397 unsigned long val;
5398 int ret;
5399
5400 ret = tracing_update_buffers();
5401 if (ret < 0)
5402 return ret;
5403
5404 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
5405 if (ret)
5406 return ret;
5407
5408 mutex_lock(&trace_types_lock);
5409
2b6080f2 5410 if (tr->current_trace->use_max_tr) {
debdd57f
HT
5411 ret = -EBUSY;
5412 goto out;
5413 }
5414
5415 switch (val) {
5416 case 0:
f1affcaa
SRRH
5417 if (iter->cpu_file != RING_BUFFER_ALL_CPUS) {
5418 ret = -EINVAL;
5419 break;
debdd57f 5420 }
3209cff4
SRRH
5421 if (tr->allocated_snapshot)
5422 free_snapshot(tr);
debdd57f
HT
5423 break;
5424 case 1:
f1affcaa
SRRH
5425/* Only allow per-cpu swap if the ring buffer supports it */
5426#ifndef CONFIG_RING_BUFFER_ALLOW_SWAP
5427 if (iter->cpu_file != RING_BUFFER_ALL_CPUS) {
5428 ret = -EINVAL;
5429 break;
5430 }
5431#endif
45ad21ca 5432 if (!tr->allocated_snapshot) {
3209cff4 5433 ret = alloc_snapshot(tr);
debdd57f
HT
5434 if (ret < 0)
5435 break;
debdd57f 5436 }
debdd57f
HT
5437 local_irq_disable();
5438 /* Now, we're going to swap */
f1affcaa 5439 if (iter->cpu_file == RING_BUFFER_ALL_CPUS)
ce9bae55 5440 update_max_tr(tr, current, smp_processor_id());
f1affcaa 5441 else
ce9bae55 5442 update_max_tr_single(tr, current, iter->cpu_file);
debdd57f
HT
5443 local_irq_enable();
5444 break;
5445 default:
45ad21ca 5446 if (tr->allocated_snapshot) {
f1affcaa
SRRH
5447 if (iter->cpu_file == RING_BUFFER_ALL_CPUS)
5448 tracing_reset_online_cpus(&tr->max_buffer);
5449 else
5450 tracing_reset(&tr->max_buffer, iter->cpu_file);
5451 }
debdd57f
HT
5452 break;
5453 }
5454
5455 if (ret >= 0) {
5456 *ppos += cnt;
5457 ret = cnt;
5458 }
5459out:
5460 mutex_unlock(&trace_types_lock);
5461 return ret;
5462}
2b6080f2
SR
5463
5464static int tracing_snapshot_release(struct inode *inode, struct file *file)
5465{
5466 struct seq_file *m = file->private_data;
ff451961
SRRH
5467 int ret;
5468
5469 ret = tracing_release(inode, file);
2b6080f2
SR
5470
5471 if (file->f_mode & FMODE_READ)
ff451961 5472 return ret;
2b6080f2
SR
5473
5474 /* If write only, the seq_file is just a stub */
5475 if (m)
5476 kfree(m->private);
5477 kfree(m);
5478
5479 return 0;
5480}
5481
6de58e62
SRRH
5482static int tracing_buffers_open(struct inode *inode, struct file *filp);
5483static ssize_t tracing_buffers_read(struct file *filp, char __user *ubuf,
5484 size_t count, loff_t *ppos);
5485static int tracing_buffers_release(struct inode *inode, struct file *file);
5486static ssize_t tracing_buffers_splice_read(struct file *file, loff_t *ppos,
5487 struct pipe_inode_info *pipe, size_t len, unsigned int flags);
5488
5489static int snapshot_raw_open(struct inode *inode, struct file *filp)
5490{
5491 struct ftrace_buffer_info *info;
5492 int ret;
5493
5494 ret = tracing_buffers_open(inode, filp);
5495 if (ret < 0)
5496 return ret;
5497
5498 info = filp->private_data;
5499
5500 if (info->iter.trace->use_max_tr) {
5501 tracing_buffers_release(inode, filp);
5502 return -EBUSY;
5503 }
5504
5505 info->iter.snapshot = true;
5506 info->iter.trace_buffer = &info->iter.tr->max_buffer;
5507
5508 return ret;
5509}
5510
debdd57f
HT
5511#endif /* CONFIG_TRACER_SNAPSHOT */
5512
5513
6508fa76
SF
5514static const struct file_operations tracing_thresh_fops = {
5515 .open = tracing_open_generic,
5516 .read = tracing_thresh_read,
5517 .write = tracing_thresh_write,
5518 .llseek = generic_file_llseek,
5519};
5520
e428abbb 5521#ifdef CONFIG_TRACER_MAX_TRACE
5e2336a0 5522static const struct file_operations tracing_max_lat_fops = {
4bf39a94
IM
5523 .open = tracing_open_generic,
5524 .read = tracing_max_lat_read,
5525 .write = tracing_max_lat_write,
b444786f 5526 .llseek = generic_file_llseek,
bc0c38d1 5527};
e428abbb 5528#endif
bc0c38d1 5529
5e2336a0 5530static const struct file_operations set_tracer_fops = {
4bf39a94
IM
5531 .open = tracing_open_generic,
5532 .read = tracing_set_trace_read,
5533 .write = tracing_set_trace_write,
b444786f 5534 .llseek = generic_file_llseek,
bc0c38d1
SR
5535};
5536
5e2336a0 5537static const struct file_operations tracing_pipe_fops = {
4bf39a94 5538 .open = tracing_open_pipe,
2a2cc8f7 5539 .poll = tracing_poll_pipe,
4bf39a94 5540 .read = tracing_read_pipe,
3c56819b 5541 .splice_read = tracing_splice_read_pipe,
4bf39a94 5542 .release = tracing_release_pipe,
b444786f 5543 .llseek = no_llseek,
b3806b43
SR
5544};
5545
5e2336a0 5546static const struct file_operations tracing_entries_fops = {
0bc392ee 5547 .open = tracing_open_generic_tr,
a98a3c3f
SR
5548 .read = tracing_entries_read,
5549 .write = tracing_entries_write,
b444786f 5550 .llseek = generic_file_llseek,
0bc392ee 5551 .release = tracing_release_generic_tr,
a98a3c3f
SR
5552};
5553
f81ab074 5554static const struct file_operations tracing_total_entries_fops = {
7b85af63 5555 .open = tracing_open_generic_tr,
f81ab074
VN
5556 .read = tracing_total_entries_read,
5557 .llseek = generic_file_llseek,
7b85af63 5558 .release = tracing_release_generic_tr,
f81ab074
VN
5559};
5560
4f271a2a 5561static const struct file_operations tracing_free_buffer_fops = {
7b85af63 5562 .open = tracing_open_generic_tr,
4f271a2a
VN
5563 .write = tracing_free_buffer_write,
5564 .release = tracing_free_buffer_release,
5565};
5566
5e2336a0 5567static const struct file_operations tracing_mark_fops = {
7b85af63 5568 .open = tracing_open_generic_tr,
5bf9a1ee 5569 .write = tracing_mark_write,
b444786f 5570 .llseek = generic_file_llseek,
7b85af63 5571 .release = tracing_release_generic_tr,
5bf9a1ee
PP
5572};
5573
5079f326 5574static const struct file_operations trace_clock_fops = {
13f16d20
LZ
5575 .open = tracing_clock_open,
5576 .read = seq_read,
5577 .llseek = seq_lseek,
7b85af63 5578 .release = tracing_single_release_tr,
5079f326
Z
5579 .write = tracing_clock_write,
5580};
5581
debdd57f
HT
5582#ifdef CONFIG_TRACER_SNAPSHOT
5583static const struct file_operations snapshot_fops = {
5584 .open = tracing_snapshot_open,
5585 .read = seq_read,
5586 .write = tracing_snapshot_write,
098c879e 5587 .llseek = tracing_lseek,
2b6080f2 5588 .release = tracing_snapshot_release,
debdd57f 5589};
debdd57f 5590
6de58e62
SRRH
5591static const struct file_operations snapshot_raw_fops = {
5592 .open = snapshot_raw_open,
5593 .read = tracing_buffers_read,
5594 .release = tracing_buffers_release,
5595 .splice_read = tracing_buffers_splice_read,
5596 .llseek = no_llseek,
2cadf913
SR
5597};
5598
6de58e62
SRRH
5599#endif /* CONFIG_TRACER_SNAPSHOT */
5600
2cadf913
SR
5601static int tracing_buffers_open(struct inode *inode, struct file *filp)
5602{
46ef2be0 5603 struct trace_array *tr = inode->i_private;
2cadf913 5604 struct ftrace_buffer_info *info;
7b85af63 5605 int ret;
2cadf913
SR
5606
5607 if (tracing_disabled)
5608 return -ENODEV;
5609
7b85af63
SRRH
5610 if (trace_array_get(tr) < 0)
5611 return -ENODEV;
5612
2cadf913 5613 info = kzalloc(sizeof(*info), GFP_KERNEL);
7b85af63
SRRH
5614 if (!info) {
5615 trace_array_put(tr);
2cadf913 5616 return -ENOMEM;
7b85af63 5617 }
2cadf913 5618
a695cb58
SRRH
5619 mutex_lock(&trace_types_lock);
5620
cc60cdc9 5621 info->iter.tr = tr;
46ef2be0 5622 info->iter.cpu_file = tracing_get_cpu(inode);
b627344f 5623 info->iter.trace = tr->current_trace;
12883efb 5624 info->iter.trace_buffer = &tr->trace_buffer;
cc60cdc9 5625 info->spare = NULL;
2cadf913 5626 /* Force reading ring buffer for first read */
cc60cdc9 5627 info->read = (unsigned int)-1;
2cadf913
SR
5628
5629 filp->private_data = info;
5630
cf6ab6d9
SRRH
5631 tr->current_trace->ref++;
5632
a695cb58
SRRH
5633 mutex_unlock(&trace_types_lock);
5634
7b85af63
SRRH
5635 ret = nonseekable_open(inode, filp);
5636 if (ret < 0)
5637 trace_array_put(tr);
5638
5639 return ret;
2cadf913
SR
5640}
5641
cc60cdc9
SR
5642static unsigned int
5643tracing_buffers_poll(struct file *filp, poll_table *poll_table)
5644{
5645 struct ftrace_buffer_info *info = filp->private_data;
5646 struct trace_iterator *iter = &info->iter;
5647
5648 return trace_poll(iter, filp, poll_table);
5649}
5650
2cadf913
SR
5651static ssize_t
5652tracing_buffers_read(struct file *filp, char __user *ubuf,
5653 size_t count, loff_t *ppos)
5654{
5655 struct ftrace_buffer_info *info = filp->private_data;
cc60cdc9 5656 struct trace_iterator *iter = &info->iter;
2cadf913 5657 ssize_t ret;
6de58e62 5658 ssize_t size;
2cadf913 5659
2dc5d12b
SR
5660 if (!count)
5661 return 0;
5662
6de58e62 5663#ifdef CONFIG_TRACER_MAX_TRACE
d716ff71
SRRH
5664 if (iter->snapshot && iter->tr->current_trace->use_max_tr)
5665 return -EBUSY;
6de58e62
SRRH
5666#endif
5667
ddd538f3 5668 if (!info->spare)
12883efb
SRRH
5669 info->spare = ring_buffer_alloc_read_page(iter->trace_buffer->buffer,
5670 iter->cpu_file);
ddd538f3 5671 if (!info->spare)
d716ff71 5672 return -ENOMEM;
ddd538f3 5673
2cadf913
SR
5674 /* Do we have previous read data to read? */
5675 if (info->read < PAGE_SIZE)
5676 goto read;
5677
b627344f 5678 again:
cc60cdc9 5679 trace_access_lock(iter->cpu_file);
12883efb 5680 ret = ring_buffer_read_page(iter->trace_buffer->buffer,
2cadf913
SR
5681 &info->spare,
5682 count,
cc60cdc9
SR
5683 iter->cpu_file, 0);
5684 trace_access_unlock(iter->cpu_file);
2cadf913 5685
b627344f
SR
5686 if (ret < 0) {
5687 if (trace_empty(iter)) {
d716ff71
SRRH
5688 if ((filp->f_flags & O_NONBLOCK))
5689 return -EAGAIN;
5690
e30f53aa 5691 ret = wait_on_pipe(iter, false);
d716ff71
SRRH
5692 if (ret)
5693 return ret;
5694
b627344f
SR
5695 goto again;
5696 }
d716ff71 5697 return 0;
b627344f 5698 }
436fc280 5699
436fc280 5700 info->read = 0;
b627344f 5701 read:
2cadf913
SR
5702 size = PAGE_SIZE - info->read;
5703 if (size > count)
5704 size = count;
5705
5706 ret = copy_to_user(ubuf, info->spare + info->read, size);
d716ff71
SRRH
5707 if (ret == size)
5708 return -EFAULT;
5709
2dc5d12b
SR
5710 size -= ret;
5711
2cadf913
SR
5712 *ppos += size;
5713 info->read += size;
5714
5715 return size;
5716}
5717
5718static int tracing_buffers_release(struct inode *inode, struct file *file)
5719{
5720 struct ftrace_buffer_info *info = file->private_data;
cc60cdc9 5721 struct trace_iterator *iter = &info->iter;
2cadf913 5722
a695cb58
SRRH
5723 mutex_lock(&trace_types_lock);
5724
cf6ab6d9
SRRH
5725 iter->tr->current_trace->ref--;
5726
ff451961 5727 __trace_array_put(iter->tr);
2cadf913 5728
ddd538f3 5729 if (info->spare)
12883efb 5730 ring_buffer_free_read_page(iter->trace_buffer->buffer, info->spare);
2cadf913
SR
5731 kfree(info);
5732
a695cb58
SRRH
5733 mutex_unlock(&trace_types_lock);
5734
2cadf913
SR
5735 return 0;
5736}
5737
/* Reference counted handle for one ring buffer read page put in a pipe. */
struct buffer_ref {
	struct ring_buffer	*buffer;	/* ring buffer @page came from */
	void			*page;		/* page to give back on last put */
	int			ref;		/* number of holders of this page */
};
5743
5744static void buffer_pipe_buf_release(struct pipe_inode_info *pipe,
5745 struct pipe_buffer *buf)
5746{
5747 struct buffer_ref *ref = (struct buffer_ref *)buf->private;
5748
5749 if (--ref->ref)
5750 return;
5751
5752 ring_buffer_free_read_page(ref->buffer, ref->page);
5753 kfree(ref);
5754 buf->private = 0;
5755}
5756
2cadf913
SR
5757static void buffer_pipe_buf_get(struct pipe_inode_info *pipe,
5758 struct pipe_buffer *buf)
5759{
5760 struct buffer_ref *ref = (struct buffer_ref *)buf->private;
5761
5762 ref->ref++;
5763}
5764
5765/* Pipe buffer operations for a buffer. */
28dfef8f 5766static const struct pipe_buf_operations buffer_pipe_buf_ops = {
2cadf913 5767 .can_merge = 0,
2cadf913
SR
5768 .confirm = generic_pipe_buf_confirm,
5769 .release = buffer_pipe_buf_release,
d55cb6cf 5770 .steal = generic_pipe_buf_steal,
2cadf913
SR
5771 .get = buffer_pipe_buf_get,
5772};
5773
5774/*
5775 * Callback from splice_to_pipe(), if we need to release some pages
5776 * at the end of the spd in case we error'ed out in filling the pipe.
5777 */
5778static void buffer_spd_release(struct splice_pipe_desc *spd, unsigned int i)
5779{
5780 struct buffer_ref *ref =
5781 (struct buffer_ref *)spd->partial[i].private;
5782
5783 if (--ref->ref)
5784 return;
5785
5786 ring_buffer_free_read_page(ref->buffer, ref->page);
5787 kfree(ref);
5788 spd->partial[i].private = 0;
5789}
5790
5791static ssize_t
5792tracing_buffers_splice_read(struct file *file, loff_t *ppos,
5793 struct pipe_inode_info *pipe, size_t len,
5794 unsigned int flags)
5795{
5796 struct ftrace_buffer_info *info = file->private_data;
cc60cdc9 5797 struct trace_iterator *iter = &info->iter;
35f3d14d
JA
5798 struct partial_page partial_def[PIPE_DEF_BUFFERS];
5799 struct page *pages_def[PIPE_DEF_BUFFERS];
2cadf913 5800 struct splice_pipe_desc spd = {
35f3d14d
JA
5801 .pages = pages_def,
5802 .partial = partial_def,
047fe360 5803 .nr_pages_max = PIPE_DEF_BUFFERS,
2cadf913
SR
5804 .flags = flags,
5805 .ops = &buffer_pipe_buf_ops,
5806 .spd_release = buffer_spd_release,
5807 };
5808 struct buffer_ref *ref;
93459c6c 5809 int entries, size, i;
07906da7 5810 ssize_t ret = 0;
2cadf913 5811
6de58e62 5812#ifdef CONFIG_TRACER_MAX_TRACE
d716ff71
SRRH
5813 if (iter->snapshot && iter->tr->current_trace->use_max_tr)
5814 return -EBUSY;
6de58e62
SRRH
5815#endif
5816
d716ff71
SRRH
5817 if (splice_grow_spd(pipe, &spd))
5818 return -ENOMEM;
35f3d14d 5819
d716ff71
SRRH
5820 if (*ppos & (PAGE_SIZE - 1))
5821 return -EINVAL;
93cfb3c9
LJ
5822
5823 if (len & (PAGE_SIZE - 1)) {
d716ff71
SRRH
5824 if (len < PAGE_SIZE)
5825 return -EINVAL;
93cfb3c9
LJ
5826 len &= PAGE_MASK;
5827 }
5828
cc60cdc9
SR
5829 again:
5830 trace_access_lock(iter->cpu_file);
12883efb 5831 entries = ring_buffer_entries_cpu(iter->trace_buffer->buffer, iter->cpu_file);
93459c6c 5832
a786c06d 5833 for (i = 0; i < spd.nr_pages_max && len && entries; i++, len -= PAGE_SIZE) {
2cadf913
SR
5834 struct page *page;
5835 int r;
5836
5837 ref = kzalloc(sizeof(*ref), GFP_KERNEL);
07906da7
RV
5838 if (!ref) {
5839 ret = -ENOMEM;
2cadf913 5840 break;
07906da7 5841 }
2cadf913 5842
7267fa68 5843 ref->ref = 1;
12883efb 5844 ref->buffer = iter->trace_buffer->buffer;
cc60cdc9 5845 ref->page = ring_buffer_alloc_read_page(ref->buffer, iter->cpu_file);
2cadf913 5846 if (!ref->page) {
07906da7 5847 ret = -ENOMEM;
2cadf913
SR
5848 kfree(ref);
5849 break;
5850 }
5851
5852 r = ring_buffer_read_page(ref->buffer, &ref->page,
cc60cdc9 5853 len, iter->cpu_file, 1);
2cadf913 5854 if (r < 0) {
7ea59064 5855 ring_buffer_free_read_page(ref->buffer, ref->page);
2cadf913
SR
5856 kfree(ref);
5857 break;
5858 }
5859
5860 /*
5861 * zero out any left over data, this is going to
5862 * user land.
5863 */
5864 size = ring_buffer_page_len(ref->page);
5865 if (size < PAGE_SIZE)
5866 memset(ref->page + size, 0, PAGE_SIZE - size);
5867
5868 page = virt_to_page(ref->page);
5869
5870 spd.pages[i] = page;
5871 spd.partial[i].len = PAGE_SIZE;
5872 spd.partial[i].offset = 0;
5873 spd.partial[i].private = (unsigned long)ref;
5874 spd.nr_pages++;
93cfb3c9 5875 *ppos += PAGE_SIZE;
93459c6c 5876
12883efb 5877 entries = ring_buffer_entries_cpu(iter->trace_buffer->buffer, iter->cpu_file);
2cadf913
SR
5878 }
5879
cc60cdc9 5880 trace_access_unlock(iter->cpu_file);
2cadf913
SR
5881 spd.nr_pages = i;
5882
5883 /* did we read anything? */
5884 if (!spd.nr_pages) {
07906da7 5885 if (ret)
d716ff71
SRRH
5886 return ret;
5887
5888 if ((file->f_flags & O_NONBLOCK) || (flags & SPLICE_F_NONBLOCK))
5889 return -EAGAIN;
07906da7 5890
e30f53aa 5891 ret = wait_on_pipe(iter, true);
8b8b3683 5892 if (ret)
d716ff71 5893 return ret;
e30f53aa 5894
cc60cdc9 5895 goto again;
2cadf913
SR
5896 }
5897
5898 ret = splice_to_pipe(pipe, &spd);
047fe360 5899 splice_shrink_spd(&spd);
6de58e62 5900
2cadf913
SR
5901 return ret;
5902}
5903
5904static const struct file_operations tracing_buffers_fops = {
5905 .open = tracing_buffers_open,
5906 .read = tracing_buffers_read,
cc60cdc9 5907 .poll = tracing_buffers_poll,
2cadf913
SR
5908 .release = tracing_buffers_release,
5909 .splice_read = tracing_buffers_splice_read,
5910 .llseek = no_llseek,
5911};
5912
c8d77183
SR
5913static ssize_t
5914tracing_stats_read(struct file *filp, char __user *ubuf,
5915 size_t count, loff_t *ppos)
5916{
4d3435b8
ON
5917 struct inode *inode = file_inode(filp);
5918 struct trace_array *tr = inode->i_private;
12883efb 5919 struct trace_buffer *trace_buf = &tr->trace_buffer;
4d3435b8 5920 int cpu = tracing_get_cpu(inode);
c8d77183
SR
5921 struct trace_seq *s;
5922 unsigned long cnt;
c64e148a
VN
5923 unsigned long long t;
5924 unsigned long usec_rem;
c8d77183 5925
e4f2d10f 5926 s = kmalloc(sizeof(*s), GFP_KERNEL);
c8d77183 5927 if (!s)
a646365c 5928 return -ENOMEM;
c8d77183
SR
5929
5930 trace_seq_init(s);
5931
12883efb 5932 cnt = ring_buffer_entries_cpu(trace_buf->buffer, cpu);
c8d77183
SR
5933 trace_seq_printf(s, "entries: %ld\n", cnt);
5934
12883efb 5935 cnt = ring_buffer_overrun_cpu(trace_buf->buffer, cpu);
c8d77183
SR
5936 trace_seq_printf(s, "overrun: %ld\n", cnt);
5937
12883efb 5938 cnt = ring_buffer_commit_overrun_cpu(trace_buf->buffer, cpu);
c8d77183
SR
5939 trace_seq_printf(s, "commit overrun: %ld\n", cnt);
5940
12883efb 5941 cnt = ring_buffer_bytes_cpu(trace_buf->buffer, cpu);
c64e148a
VN
5942 trace_seq_printf(s, "bytes: %ld\n", cnt);
5943
58e8eedf 5944 if (trace_clocks[tr->clock_id].in_ns) {
11043d8b 5945 /* local or global for trace_clock */
12883efb 5946 t = ns2usecs(ring_buffer_oldest_event_ts(trace_buf->buffer, cpu));
11043d8b
YY
5947 usec_rem = do_div(t, USEC_PER_SEC);
5948 trace_seq_printf(s, "oldest event ts: %5llu.%06lu\n",
5949 t, usec_rem);
5950
12883efb 5951 t = ns2usecs(ring_buffer_time_stamp(trace_buf->buffer, cpu));
11043d8b
YY
5952 usec_rem = do_div(t, USEC_PER_SEC);
5953 trace_seq_printf(s, "now ts: %5llu.%06lu\n", t, usec_rem);
5954 } else {
5955 /* counter or tsc mode for trace_clock */
5956 trace_seq_printf(s, "oldest event ts: %llu\n",
12883efb 5957 ring_buffer_oldest_event_ts(trace_buf->buffer, cpu));
c64e148a 5958
11043d8b 5959 trace_seq_printf(s, "now ts: %llu\n",
12883efb 5960 ring_buffer_time_stamp(trace_buf->buffer, cpu));
11043d8b 5961 }
c64e148a 5962
12883efb 5963 cnt = ring_buffer_dropped_events_cpu(trace_buf->buffer, cpu);
884bfe89
SP
5964 trace_seq_printf(s, "dropped events: %ld\n", cnt);
5965
12883efb 5966 cnt = ring_buffer_read_events_cpu(trace_buf->buffer, cpu);
ad964704
SRRH
5967 trace_seq_printf(s, "read events: %ld\n", cnt);
5968
5ac48378
SRRH
5969 count = simple_read_from_buffer(ubuf, count, ppos,
5970 s->buffer, trace_seq_used(s));
c8d77183
SR
5971
5972 kfree(s);
5973
5974 return count;
5975}
5976
5977static const struct file_operations tracing_stats_fops = {
4d3435b8 5978 .open = tracing_open_generic_tr,
c8d77183 5979 .read = tracing_stats_read,
b444786f 5980 .llseek = generic_file_llseek,
4d3435b8 5981 .release = tracing_release_generic_tr,
c8d77183
SR
5982};
5983
bc0c38d1
SR
5984#ifdef CONFIG_DYNAMIC_FTRACE
5985
b807c3d0
SR
5986int __weak ftrace_arch_read_dyn_info(char *buf, int size)
5987{
5988 return 0;
5989}
5990
bc0c38d1 5991static ssize_t
b807c3d0 5992tracing_read_dyn_info(struct file *filp, char __user *ubuf,
bc0c38d1
SR
5993 size_t cnt, loff_t *ppos)
5994{
a26a2a27
SR
5995 static char ftrace_dyn_info_buffer[1024];
5996 static DEFINE_MUTEX(dyn_info_mutex);
bc0c38d1 5997 unsigned long *p = filp->private_data;
b807c3d0 5998 char *buf = ftrace_dyn_info_buffer;
a26a2a27 5999 int size = ARRAY_SIZE(ftrace_dyn_info_buffer);
bc0c38d1
SR
6000 int r;
6001
b807c3d0
SR
6002 mutex_lock(&dyn_info_mutex);
6003 r = sprintf(buf, "%ld ", *p);
4bf39a94 6004
a26a2a27 6005 r += ftrace_arch_read_dyn_info(buf+r, (size-1)-r);
b807c3d0
SR
6006 buf[r++] = '\n';
6007
6008 r = simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
6009
6010 mutex_unlock(&dyn_info_mutex);
6011
6012 return r;
bc0c38d1
SR
6013}
6014
5e2336a0 6015static const struct file_operations tracing_dyn_info_fops = {
4bf39a94 6016 .open = tracing_open_generic,
b807c3d0 6017 .read = tracing_read_dyn_info,
b444786f 6018 .llseek = generic_file_llseek,
bc0c38d1 6019};
77fd5c15 6020#endif /* CONFIG_DYNAMIC_FTRACE */
bc0c38d1 6021
77fd5c15
SRRH
6022#if defined(CONFIG_TRACER_SNAPSHOT) && defined(CONFIG_DYNAMIC_FTRACE)
/* Probe callback without a counter: take a snapshot on every hit. */
static void
ftrace_snapshot(unsigned long ip, unsigned long parent_ip, void **data)
{
	tracing_snapshot();
}
bc0c38d1 6028
77fd5c15
SRRH
/*
 * Probe callback with a counter. The probe's data slot itself is used as
 * the counter: 0 means the budget is used up, -1 means "unlimited" (it is
 * never decremented), anything else is decremented once per snapshot.
 */
static void
ftrace_count_snapshot(unsigned long ip, unsigned long parent_ip, void **data)
{
	unsigned long *remaining = (unsigned long *)data;

	if (*remaining == 0)
		return;

	if (*remaining != -1UL)
		(*remaining)--;

	tracing_snapshot();
}
6042
/*
 * Print one registered snapshot probe as "<symbol>:snapshot:<limit>",
 * where <limit> is either "unlimited" (data == -1) or "count=<n>".
 * Always returns 0.
 */
static int
ftrace_snapshot_print(struct seq_file *m, unsigned long ip,
		      struct ftrace_probe_ops *ops, void *data)
{
	long remaining = (long)data;

	seq_printf(m, "%ps:", (void *)ip);
	seq_puts(m, "snapshot");

	if (remaining != -1)
		seq_printf(m, ":count=%ld\n", remaining);
	else
		seq_puts(m, ":unlimited\n");

	return 0;
}
6060
6061static struct ftrace_probe_ops snapshot_probe_ops = {
6062 .func = ftrace_snapshot,
6063 .print = ftrace_snapshot_print,
6064};
6065
6066static struct ftrace_probe_ops snapshot_count_probe_ops = {
6067 .func = ftrace_count_snapshot,
6068 .print = ftrace_snapshot_print,
6069};
6070
6071static int
6072ftrace_trace_snapshot_callback(struct ftrace_hash *hash,
6073 char *glob, char *cmd, char *param, int enable)
6074{
6075 struct ftrace_probe_ops *ops;
6076 void *count = (void *)-1;
6077 char *number;
6078 int ret;
6079
6080 /* hash funcs only work with set_ftrace_filter */
6081 if (!enable)
6082 return -EINVAL;
6083
6084 ops = param ? &snapshot_count_probe_ops : &snapshot_probe_ops;
6085
6086 if (glob[0] == '!') {
6087 unregister_ftrace_function_probe_func(glob+1, ops);
6088 return 0;
6089 }
6090
6091 if (!param)
6092 goto out_reg;
6093
6094 number = strsep(&param, ":");
6095
6096 if (!strlen(number))
6097 goto out_reg;
6098
6099 /*
6100 * We use the callback data field (which is a pointer)
6101 * as our counter.
6102 */
6103 ret = kstrtoul(number, 0, (unsigned long *)&count);
6104 if (ret)
6105 return ret;
6106
6107 out_reg:
6108 ret = register_ftrace_function_probe(glob, ops, count);
6109
6110 if (ret >= 0)
6111 alloc_snapshot(&global_trace);
6112
6113 return ret < 0 ? ret : 0;
6114}
6115
6116static struct ftrace_func_command ftrace_snapshot_cmd = {
6117 .name = "snapshot",
6118 .func = ftrace_trace_snapshot_callback,
6119};
6120
38de93ab 6121static __init int register_snapshot_cmd(void)
77fd5c15
SRRH
6122{
6123 return register_ftrace_command(&ftrace_snapshot_cmd);
6124}
6125#else
38de93ab 6126static inline __init int register_snapshot_cmd(void) { return 0; }
77fd5c15 6127#endif /* defined(CONFIG_TRACER_SNAPSHOT) && defined(CONFIG_DYNAMIC_FTRACE) */
bc0c38d1 6128
7eeafbca 6129static struct dentry *tracing_get_dentry(struct trace_array *tr)
bc0c38d1 6130{
8434dc93
SRRH
6131 if (WARN_ON(!tr->dir))
6132 return ERR_PTR(-ENODEV);
6133
6134 /* Top directory uses NULL as the parent */
6135 if (tr->flags & TRACE_ARRAY_FL_GLOBAL)
6136 return NULL;
6137
6138 /* All sub buffers have a descriptor */
2b6080f2 6139 return tr->dir;
bc0c38d1
SR
6140}
6141
2b6080f2 6142static struct dentry *tracing_dentry_percpu(struct trace_array *tr, int cpu)
b04cc6b1 6143{
b04cc6b1
FW
6144 struct dentry *d_tracer;
6145
2b6080f2
SR
6146 if (tr->percpu_dir)
6147 return tr->percpu_dir;
b04cc6b1 6148
7eeafbca 6149 d_tracer = tracing_get_dentry(tr);
14a5ae40 6150 if (IS_ERR(d_tracer))
b04cc6b1
FW
6151 return NULL;
6152
8434dc93 6153 tr->percpu_dir = tracefs_create_dir("per_cpu", d_tracer);
b04cc6b1 6154
2b6080f2 6155 WARN_ONCE(!tr->percpu_dir,
8434dc93 6156 "Could not create tracefs directory 'per_cpu/%d'\n", cpu);
b04cc6b1 6157
2b6080f2 6158 return tr->percpu_dir;
b04cc6b1
FW
6159}
6160
649e9c70
ON
6161static struct dentry *
6162trace_create_cpu_file(const char *name, umode_t mode, struct dentry *parent,
6163 void *data, long cpu, const struct file_operations *fops)
6164{
6165 struct dentry *ret = trace_create_file(name, mode, parent, data, fops);
6166
6167 if (ret) /* See tracing_get_cpu() */
7682c918 6168 d_inode(ret)->i_cdev = (void *)(cpu + 1);
649e9c70
ON
6169 return ret;
6170}
6171
2b6080f2 6172static void
8434dc93 6173tracing_init_tracefs_percpu(struct trace_array *tr, long cpu)
b04cc6b1 6174{
2b6080f2 6175 struct dentry *d_percpu = tracing_dentry_percpu(tr, cpu);
5452af66 6176 struct dentry *d_cpu;
dd49a38c 6177 char cpu_dir[30]; /* 30 characters should be more than enough */
b04cc6b1 6178
0a3d7ce7
NK
6179 if (!d_percpu)
6180 return;
6181
dd49a38c 6182 snprintf(cpu_dir, 30, "cpu%ld", cpu);
8434dc93 6183 d_cpu = tracefs_create_dir(cpu_dir, d_percpu);
8656e7a2 6184 if (!d_cpu) {
a395d6a7 6185 pr_warn("Could not create tracefs '%s' entry\n", cpu_dir);
8656e7a2
FW
6186 return;
6187 }
b04cc6b1 6188
8656e7a2 6189 /* per cpu trace_pipe */
649e9c70 6190 trace_create_cpu_file("trace_pipe", 0444, d_cpu,
15544209 6191 tr, cpu, &tracing_pipe_fops);
b04cc6b1
FW
6192
6193 /* per cpu trace */
649e9c70 6194 trace_create_cpu_file("trace", 0644, d_cpu,
6484c71c 6195 tr, cpu, &tracing_fops);
7f96f93f 6196
649e9c70 6197 trace_create_cpu_file("trace_pipe_raw", 0444, d_cpu,
46ef2be0 6198 tr, cpu, &tracing_buffers_fops);
7f96f93f 6199
649e9c70 6200 trace_create_cpu_file("stats", 0444, d_cpu,
4d3435b8 6201 tr, cpu, &tracing_stats_fops);
438ced17 6202
649e9c70 6203 trace_create_cpu_file("buffer_size_kb", 0444, d_cpu,
0bc392ee 6204 tr, cpu, &tracing_entries_fops);
f1affcaa
SRRH
6205
6206#ifdef CONFIG_TRACER_SNAPSHOT
649e9c70 6207 trace_create_cpu_file("snapshot", 0644, d_cpu,
6484c71c 6208 tr, cpu, &snapshot_fops);
6de58e62 6209
649e9c70 6210 trace_create_cpu_file("snapshot_raw", 0444, d_cpu,
46ef2be0 6211 tr, cpu, &snapshot_raw_fops);
f1affcaa 6212#endif
b04cc6b1
FW
6213}
6214
60a11774
SR
6215#ifdef CONFIG_FTRACE_SELFTEST
6216/* Let selftest have access to static functions in this file */
6217#include "trace_selftest.c"
6218#endif
6219
577b785f
SR
6220static ssize_t
6221trace_options_read(struct file *filp, char __user *ubuf, size_t cnt,
6222 loff_t *ppos)
6223{
6224 struct trace_option_dentry *topt = filp->private_data;
6225 char *buf;
6226
6227 if (topt->flags->val & topt->opt->bit)
6228 buf = "1\n";
6229 else
6230 buf = "0\n";
6231
6232 return simple_read_from_buffer(ubuf, cnt, ppos, buf, 2);
6233}
6234
6235static ssize_t
6236trace_options_write(struct file *filp, const char __user *ubuf, size_t cnt,
6237 loff_t *ppos)
6238{
6239 struct trace_option_dentry *topt = filp->private_data;
6240 unsigned long val;
577b785f
SR
6241 int ret;
6242
22fe9b54
PH
6243 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
6244 if (ret)
577b785f
SR
6245 return ret;
6246
8d18eaaf
LZ
6247 if (val != 0 && val != 1)
6248 return -EINVAL;
577b785f 6249
8d18eaaf 6250 if (!!(topt->flags->val & topt->opt->bit) != val) {
577b785f 6251 mutex_lock(&trace_types_lock);
8c1a49ae 6252 ret = __set_tracer_option(topt->tr, topt->flags,
c757bea9 6253 topt->opt, !val);
577b785f
SR
6254 mutex_unlock(&trace_types_lock);
6255 if (ret)
6256 return ret;
577b785f
SR
6257 }
6258
6259 *ppos += cnt;
6260
6261 return cnt;
6262}
6263
6264
6265static const struct file_operations trace_options_fops = {
6266 .open = tracing_open_generic,
6267 .read = trace_options_read,
6268 .write = trace_options_write,
b444786f 6269 .llseek = generic_file_llseek,
577b785f
SR
6270};
6271
9a38a885
SRRH
6272/*
6273 * In order to pass in both the trace_array descriptor as well as the index
6274 * to the flag that the trace option file represents, the trace_array
6275 * has a character array of trace_flags_index[], which holds the index
6276 * of the bit for the flag it represents. index[0] == 0, index[1] == 1, etc.
6277 * The address of this character array is passed to the flag option file
6278 * read/write callbacks.
6279 *
6280 * In order to extract both the index and the trace_array descriptor,
6281 * get_tr_index() uses the following algorithm.
6282 *
6283 * idx = *ptr;
6284 *
6285 * As the pointer itself contains the address of the index (remember
6286 * index[1] == 1).
6287 *
6288 * Then to get the trace_array descriptor, by subtracting that index
6289 * from the ptr, we get to the start of the index itself.
6290 *
6291 * ptr - idx == &index[0]
6292 *
6293 * Then a simple container_of() from that pointer gets us to the
6294 * trace_array descriptor.
6295 */
6296static void get_tr_index(void *data, struct trace_array **ptr,
6297 unsigned int *pindex)
6298{
6299 *pindex = *(unsigned char *)data;
6300
6301 *ptr = container_of(data - *pindex, struct trace_array,
6302 trace_flags_index);
6303}
6304
a8259075
SR
6305static ssize_t
6306trace_options_core_read(struct file *filp, char __user *ubuf, size_t cnt,
6307 loff_t *ppos)
6308{
9a38a885
SRRH
6309 void *tr_index = filp->private_data;
6310 struct trace_array *tr;
6311 unsigned int index;
a8259075
SR
6312 char *buf;
6313
9a38a885
SRRH
6314 get_tr_index(tr_index, &tr, &index);
6315
6316 if (tr->trace_flags & (1 << index))
a8259075
SR
6317 buf = "1\n";
6318 else
6319 buf = "0\n";
6320
6321 return simple_read_from_buffer(ubuf, cnt, ppos, buf, 2);
6322}
6323
6324static ssize_t
6325trace_options_core_write(struct file *filp, const char __user *ubuf, size_t cnt,
6326 loff_t *ppos)
6327{
9a38a885
SRRH
6328 void *tr_index = filp->private_data;
6329 struct trace_array *tr;
6330 unsigned int index;
a8259075
SR
6331 unsigned long val;
6332 int ret;
6333
9a38a885
SRRH
6334 get_tr_index(tr_index, &tr, &index);
6335
22fe9b54
PH
6336 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
6337 if (ret)
a8259075
SR
6338 return ret;
6339
f2d84b65 6340 if (val != 0 && val != 1)
a8259075 6341 return -EINVAL;
69d34da2
SRRH
6342
6343 mutex_lock(&trace_types_lock);
2b6080f2 6344 ret = set_tracer_flag(tr, 1 << index, val);
69d34da2 6345 mutex_unlock(&trace_types_lock);
a8259075 6346
613f04a0
SRRH
6347 if (ret < 0)
6348 return ret;
6349
a8259075
SR
6350 *ppos += cnt;
6351
6352 return cnt;
6353}
6354
a8259075
SR
6355static const struct file_operations trace_options_core_fops = {
6356 .open = tracing_open_generic,
6357 .read = trace_options_core_read,
6358 .write = trace_options_core_write,
b444786f 6359 .llseek = generic_file_llseek,
a8259075
SR
6360};
6361
5452af66 6362struct dentry *trace_create_file(const char *name,
f4ae40a6 6363 umode_t mode,
5452af66
FW
6364 struct dentry *parent,
6365 void *data,
6366 const struct file_operations *fops)
6367{
6368 struct dentry *ret;
6369
8434dc93 6370 ret = tracefs_create_file(name, mode, parent, data, fops);
5452af66 6371 if (!ret)
a395d6a7 6372 pr_warn("Could not create tracefs '%s' entry\n", name);
5452af66
FW
6373
6374 return ret;
6375}
6376
6377
2b6080f2 6378static struct dentry *trace_options_init_dentry(struct trace_array *tr)
a8259075
SR
6379{
6380 struct dentry *d_tracer;
a8259075 6381
2b6080f2
SR
6382 if (tr->options)
6383 return tr->options;
a8259075 6384
7eeafbca 6385 d_tracer = tracing_get_dentry(tr);
14a5ae40 6386 if (IS_ERR(d_tracer))
a8259075
SR
6387 return NULL;
6388
8434dc93 6389 tr->options = tracefs_create_dir("options", d_tracer);
2b6080f2 6390 if (!tr->options) {
a395d6a7 6391 pr_warn("Could not create tracefs directory 'options'\n");
a8259075
SR
6392 return NULL;
6393 }
6394
2b6080f2 6395 return tr->options;
a8259075
SR
6396}
6397
577b785f 6398static void
2b6080f2
SR
6399create_trace_option_file(struct trace_array *tr,
6400 struct trace_option_dentry *topt,
577b785f
SR
6401 struct tracer_flags *flags,
6402 struct tracer_opt *opt)
6403{
6404 struct dentry *t_options;
577b785f 6405
2b6080f2 6406 t_options = trace_options_init_dentry(tr);
577b785f
SR
6407 if (!t_options)
6408 return;
6409
6410 topt->flags = flags;
6411 topt->opt = opt;
2b6080f2 6412 topt->tr = tr;
577b785f 6413
5452af66 6414 topt->entry = trace_create_file(opt->name, 0644, t_options, topt,
577b785f
SR
6415 &trace_options_fops);
6416
577b785f
SR
6417}
6418
37aea98b 6419static void
2b6080f2 6420create_trace_option_files(struct trace_array *tr, struct tracer *tracer)
577b785f
SR
6421{
6422 struct trace_option_dentry *topts;
37aea98b 6423 struct trace_options *tr_topts;
577b785f
SR
6424 struct tracer_flags *flags;
6425 struct tracer_opt *opts;
6426 int cnt;
37aea98b 6427 int i;
577b785f
SR
6428
6429 if (!tracer)
37aea98b 6430 return;
577b785f
SR
6431
6432 flags = tracer->flags;
6433
6434 if (!flags || !flags->opts)
37aea98b
SRRH
6435 return;
6436
6437 /*
6438 * If this is an instance, only create flags for tracers
6439 * the instance may have.
6440 */
6441 if (!trace_ok_for_array(tracer, tr))
6442 return;
6443
6444 for (i = 0; i < tr->nr_topts; i++) {
d39cdd20
CH
6445 /* Make sure there's no duplicate flags. */
6446 if (WARN_ON_ONCE(tr->topts[i].tracer->flags == tracer->flags))
37aea98b
SRRH
6447 return;
6448 }
577b785f
SR
6449
6450 opts = flags->opts;
6451
6452 for (cnt = 0; opts[cnt].name; cnt++)
6453 ;
6454
0cfe8245 6455 topts = kcalloc(cnt + 1, sizeof(*topts), GFP_KERNEL);
577b785f 6456 if (!topts)
37aea98b
SRRH
6457 return;
6458
6459 tr_topts = krealloc(tr->topts, sizeof(*tr->topts) * (tr->nr_topts + 1),
6460 GFP_KERNEL);
6461 if (!tr_topts) {
6462 kfree(topts);
6463 return;
6464 }
6465
6466 tr->topts = tr_topts;
6467 tr->topts[tr->nr_topts].tracer = tracer;
6468 tr->topts[tr->nr_topts].topts = topts;
6469 tr->nr_topts++;
577b785f 6470
41d9c0be 6471 for (cnt = 0; opts[cnt].name; cnt++) {
2b6080f2 6472 create_trace_option_file(tr, &topts[cnt], flags,
577b785f 6473 &opts[cnt]);
41d9c0be
SRRH
6474 WARN_ONCE(topts[cnt].entry == NULL,
6475 "Failed to create trace option: %s",
6476 opts[cnt].name);
6477 }
577b785f
SR
6478}
6479
a8259075 6480static struct dentry *
2b6080f2
SR
6481create_trace_option_core_file(struct trace_array *tr,
6482 const char *option, long index)
a8259075
SR
6483{
6484 struct dentry *t_options;
a8259075 6485
2b6080f2 6486 t_options = trace_options_init_dentry(tr);
a8259075
SR
6487 if (!t_options)
6488 return NULL;
6489
9a38a885
SRRH
6490 return trace_create_file(option, 0644, t_options,
6491 (void *)&tr->trace_flags_index[index],
6492 &trace_options_core_fops);
a8259075
SR
6493}
6494
16270145 6495static void create_trace_options_dir(struct trace_array *tr)
a8259075
SR
6496{
6497 struct dentry *t_options;
16270145 6498 bool top_level = tr == &global_trace;
a8259075
SR
6499 int i;
6500
2b6080f2 6501 t_options = trace_options_init_dentry(tr);
a8259075
SR
6502 if (!t_options)
6503 return;
6504
16270145
SRRH
6505 for (i = 0; trace_options[i]; i++) {
6506 if (top_level ||
6507 !((1 << i) & TOP_LEVEL_TRACE_FLAGS))
6508 create_trace_option_core_file(tr, trace_options[i], i);
6509 }
a8259075
SR
6510}
6511
499e5470
SR
6512static ssize_t
6513rb_simple_read(struct file *filp, char __user *ubuf,
6514 size_t cnt, loff_t *ppos)
6515{
348f0fc2 6516 struct trace_array *tr = filp->private_data;
499e5470
SR
6517 char buf[64];
6518 int r;
6519
10246fa3 6520 r = tracer_tracing_is_on(tr);
499e5470
SR
6521 r = sprintf(buf, "%d\n", r);
6522
6523 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
6524}
6525
6526static ssize_t
6527rb_simple_write(struct file *filp, const char __user *ubuf,
6528 size_t cnt, loff_t *ppos)
6529{
348f0fc2 6530 struct trace_array *tr = filp->private_data;
12883efb 6531 struct ring_buffer *buffer = tr->trace_buffer.buffer;
499e5470
SR
6532 unsigned long val;
6533 int ret;
6534
6535 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
6536 if (ret)
6537 return ret;
6538
6539 if (buffer) {
2df8f8a6
SR
6540 mutex_lock(&trace_types_lock);
6541 if (val) {
10246fa3 6542 tracer_tracing_on(tr);
2b6080f2
SR
6543 if (tr->current_trace->start)
6544 tr->current_trace->start(tr);
2df8f8a6 6545 } else {
10246fa3 6546 tracer_tracing_off(tr);
2b6080f2
SR
6547 if (tr->current_trace->stop)
6548 tr->current_trace->stop(tr);
2df8f8a6
SR
6549 }
6550 mutex_unlock(&trace_types_lock);
499e5470
SR
6551 }
6552
6553 (*ppos)++;
6554
6555 return cnt;
6556}
6557
6558static const struct file_operations rb_simple_fops = {
7b85af63 6559 .open = tracing_open_generic_tr,
499e5470
SR
6560 .read = rb_simple_read,
6561 .write = rb_simple_write,
7b85af63 6562 .release = tracing_release_generic_tr,
499e5470
SR
6563 .llseek = default_llseek,
6564};
6565
277ba044
SR
/* Parent directory under which instance directories are created. */
struct dentry *trace_instance_dir;

/* Forward declaration: used by instance_mkdir() before its definition. */
static void
init_tracer_tracefs(struct trace_array *tr, struct dentry *d_tracer);
277ba044 6570
55034cd6
SRRH
6571static int
6572allocate_trace_buffer(struct trace_array *tr, struct trace_buffer *buf, int size)
277ba044
SR
6573{
6574 enum ring_buffer_flags rb_flags;
737223fb 6575
983f938a 6576 rb_flags = tr->trace_flags & TRACE_ITER_OVERWRITE ? RB_FL_OVERWRITE : 0;
737223fb 6577
dced341b
SRRH
6578 buf->tr = tr;
6579
55034cd6
SRRH
6580 buf->buffer = ring_buffer_alloc(size, rb_flags);
6581 if (!buf->buffer)
6582 return -ENOMEM;
737223fb 6583
55034cd6
SRRH
6584 buf->data = alloc_percpu(struct trace_array_cpu);
6585 if (!buf->data) {
6586 ring_buffer_free(buf->buffer);
6587 return -ENOMEM;
6588 }
737223fb 6589
737223fb
SRRH
6590 /* Allocate the first page for all buffers */
6591 set_buffer_entries(&tr->trace_buffer,
6592 ring_buffer_size(tr->trace_buffer.buffer, 0));
6593
55034cd6
SRRH
6594 return 0;
6595}
737223fb 6596
55034cd6
SRRH
6597static int allocate_trace_buffers(struct trace_array *tr, int size)
6598{
6599 int ret;
737223fb 6600
55034cd6
SRRH
6601 ret = allocate_trace_buffer(tr, &tr->trace_buffer, size);
6602 if (ret)
6603 return ret;
737223fb 6604
55034cd6
SRRH
6605#ifdef CONFIG_TRACER_MAX_TRACE
6606 ret = allocate_trace_buffer(tr, &tr->max_buffer,
6607 allocate_snapshot ? size : 1);
6608 if (WARN_ON(ret)) {
737223fb 6609 ring_buffer_free(tr->trace_buffer.buffer);
55034cd6
SRRH
6610 free_percpu(tr->trace_buffer.data);
6611 return -ENOMEM;
6612 }
6613 tr->allocated_snapshot = allocate_snapshot;
737223fb 6614
55034cd6
SRRH
6615 /*
6616 * Only the top level trace array gets its snapshot allocated
6617 * from the kernel command line.
6618 */
6619 allocate_snapshot = false;
737223fb 6620#endif
55034cd6 6621 return 0;
737223fb
SRRH
6622}
6623
f0b70cc4
SRRH
6624static void free_trace_buffer(struct trace_buffer *buf)
6625{
6626 if (buf->buffer) {
6627 ring_buffer_free(buf->buffer);
6628 buf->buffer = NULL;
6629 free_percpu(buf->data);
6630 buf->data = NULL;
6631 }
6632}
6633
23aaa3c1
SRRH
6634static void free_trace_buffers(struct trace_array *tr)
6635{
6636 if (!tr)
6637 return;
6638
f0b70cc4 6639 free_trace_buffer(&tr->trace_buffer);
23aaa3c1
SRRH
6640
6641#ifdef CONFIG_TRACER_MAX_TRACE
f0b70cc4 6642 free_trace_buffer(&tr->max_buffer);
23aaa3c1
SRRH
6643#endif
6644}
6645
9a38a885
SRRH
6646static void init_trace_flags_index(struct trace_array *tr)
6647{
6648 int i;
6649
6650 /* Used by the trace options files */
6651 for (i = 0; i < TRACE_FLAGS_MAX_SIZE; i++)
6652 tr->trace_flags_index[i] = i;
6653}
6654
37aea98b
SRRH
6655static void __update_tracer_options(struct trace_array *tr)
6656{
6657 struct tracer *t;
6658
6659 for (t = trace_types; t; t = t->next)
6660 add_tracer_options(tr, t);
6661}
6662
6663static void update_tracer_options(struct trace_array *tr)
6664{
6665 mutex_lock(&trace_types_lock);
6666 __update_tracer_options(tr);
6667 mutex_unlock(&trace_types_lock);
6668}
6669
eae47358 6670static int instance_mkdir(const char *name)
737223fb 6671{
277ba044
SR
6672 struct trace_array *tr;
6673 int ret;
277ba044
SR
6674
6675 mutex_lock(&trace_types_lock);
6676
6677 ret = -EEXIST;
6678 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
6679 if (tr->name && strcmp(tr->name, name) == 0)
6680 goto out_unlock;
6681 }
6682
6683 ret = -ENOMEM;
6684 tr = kzalloc(sizeof(*tr), GFP_KERNEL);
6685 if (!tr)
6686 goto out_unlock;
6687
6688 tr->name = kstrdup(name, GFP_KERNEL);
6689 if (!tr->name)
6690 goto out_free_tr;
6691
ccfe9e42
AL
6692 if (!alloc_cpumask_var(&tr->tracing_cpumask, GFP_KERNEL))
6693 goto out_free_tr;
6694
983f938a
SRRH
6695 tr->trace_flags = global_trace.trace_flags;
6696
ccfe9e42
AL
6697 cpumask_copy(tr->tracing_cpumask, cpu_all_mask);
6698
277ba044
SR
6699 raw_spin_lock_init(&tr->start_lock);
6700
0b9b12c1
SRRH
6701 tr->max_lock = (arch_spinlock_t)__ARCH_SPIN_LOCK_UNLOCKED;
6702
277ba044
SR
6703 tr->current_trace = &nop_trace;
6704
6705 INIT_LIST_HEAD(&tr->systems);
6706 INIT_LIST_HEAD(&tr->events);
6707
737223fb 6708 if (allocate_trace_buffers(tr, trace_buf_size) < 0)
277ba044
SR
6709 goto out_free_tr;
6710
8434dc93 6711 tr->dir = tracefs_create_dir(name, trace_instance_dir);
277ba044
SR
6712 if (!tr->dir)
6713 goto out_free_tr;
6714
6715 ret = event_trace_add_tracer(tr->dir, tr);
609e85a7 6716 if (ret) {
8434dc93 6717 tracefs_remove_recursive(tr->dir);
277ba044 6718 goto out_free_tr;
609e85a7 6719 }
277ba044 6720
8434dc93 6721 init_tracer_tracefs(tr, tr->dir);
9a38a885 6722 init_trace_flags_index(tr);
37aea98b 6723 __update_tracer_options(tr);
277ba044
SR
6724
6725 list_add(&tr->list, &ftrace_trace_arrays);
6726
6727 mutex_unlock(&trace_types_lock);
6728
6729 return 0;
6730
6731 out_free_tr:
23aaa3c1 6732 free_trace_buffers(tr);
ccfe9e42 6733 free_cpumask_var(tr->tracing_cpumask);
277ba044
SR
6734 kfree(tr->name);
6735 kfree(tr);
6736
6737 out_unlock:
6738 mutex_unlock(&trace_types_lock);
6739
6740 return ret;
6741
6742}
6743
eae47358 6744static int instance_rmdir(const char *name)
0c8916c3
SR
6745{
6746 struct trace_array *tr;
6747 int found = 0;
6748 int ret;
37aea98b 6749 int i;
0c8916c3
SR
6750
6751 mutex_lock(&trace_types_lock);
6752
6753 ret = -ENODEV;
6754 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
6755 if (tr->name && strcmp(tr->name, name) == 0) {
6756 found = 1;
6757 break;
6758 }
6759 }
6760 if (!found)
6761 goto out_unlock;
6762
a695cb58 6763 ret = -EBUSY;
cf6ab6d9 6764 if (tr->ref || (tr->current_trace && tr->current_trace->ref))
a695cb58
SRRH
6765 goto out_unlock;
6766
0c8916c3
SR
6767 list_del(&tr->list);
6768
6b450d25 6769 tracing_set_nop(tr);
0c8916c3 6770 event_trace_del_tracer(tr);
591dffda 6771 ftrace_destroy_function_files(tr);
681a4a2f 6772 tracefs_remove_recursive(tr->dir);
a9fcaaac 6773 free_trace_buffers(tr);
0c8916c3 6774
37aea98b
SRRH
6775 for (i = 0; i < tr->nr_topts; i++) {
6776 kfree(tr->topts[i].topts);
6777 }
6778 kfree(tr->topts);
6779
0c8916c3
SR
6780 kfree(tr->name);
6781 kfree(tr);
6782
6783 ret = 0;
6784
6785 out_unlock:
6786 mutex_unlock(&trace_types_lock);
6787
6788 return ret;
6789}
6790
277ba044
SR
6791static __init void create_trace_instances(struct dentry *d_tracer)
6792{
eae47358
SRRH
6793 trace_instance_dir = tracefs_create_instance_dir("instances", d_tracer,
6794 instance_mkdir,
6795 instance_rmdir);
277ba044
SR
6796 if (WARN_ON(!trace_instance_dir))
6797 return;
277ba044
SR
6798}
6799
2b6080f2 6800static void
8434dc93 6801init_tracer_tracefs(struct trace_array *tr, struct dentry *d_tracer)
2b6080f2 6802{
121aaee7 6803 int cpu;
2b6080f2 6804
607e2ea1
SRRH
6805 trace_create_file("available_tracers", 0444, d_tracer,
6806 tr, &show_traces_fops);
6807
6808 trace_create_file("current_tracer", 0644, d_tracer,
6809 tr, &set_tracer_fops);
6810
ccfe9e42
AL
6811 trace_create_file("tracing_cpumask", 0644, d_tracer,
6812 tr, &tracing_cpumask_fops);
6813
2b6080f2
SR
6814 trace_create_file("trace_options", 0644, d_tracer,
6815 tr, &tracing_iter_fops);
6816
6817 trace_create_file("trace", 0644, d_tracer,
6484c71c 6818 tr, &tracing_fops);
2b6080f2
SR
6819
6820 trace_create_file("trace_pipe", 0444, d_tracer,
15544209 6821 tr, &tracing_pipe_fops);
2b6080f2
SR
6822
6823 trace_create_file("buffer_size_kb", 0644, d_tracer,
0bc392ee 6824 tr, &tracing_entries_fops);
2b6080f2
SR
6825
6826 trace_create_file("buffer_total_size_kb", 0444, d_tracer,
6827 tr, &tracing_total_entries_fops);
6828
238ae93d 6829 trace_create_file("free_buffer", 0200, d_tracer,
2b6080f2
SR
6830 tr, &tracing_free_buffer_fops);
6831
6832 trace_create_file("trace_marker", 0220, d_tracer,
6833 tr, &tracing_mark_fops);
6834
6835 trace_create_file("trace_clock", 0644, d_tracer, tr,
6836 &trace_clock_fops);
6837
6838 trace_create_file("tracing_on", 0644, d_tracer,
6484c71c 6839 tr, &rb_simple_fops);
ce9bae55 6840
16270145
SRRH
6841 create_trace_options_dir(tr);
6842
6d9b3fa5
SRRH
6843#ifdef CONFIG_TRACER_MAX_TRACE
6844 trace_create_file("tracing_max_latency", 0644, d_tracer,
6845 &tr->max_latency, &tracing_max_lat_fops);
6846#endif
6847
591dffda
SRRH
6848 if (ftrace_create_function_files(tr, d_tracer))
6849 WARN(1, "Could not allocate function filter files");
6850
ce9bae55
SRRH
6851#ifdef CONFIG_TRACER_SNAPSHOT
6852 trace_create_file("snapshot", 0644, d_tracer,
6484c71c 6853 tr, &snapshot_fops);
ce9bae55 6854#endif
121aaee7
SRRH
6855
6856 for_each_tracing_cpu(cpu)
8434dc93 6857 tracing_init_tracefs_percpu(tr, cpu);
121aaee7 6858
2b6080f2
SR
6859}
6860
f76180bc
SRRH
6861static struct vfsmount *trace_automount(void *ingore)
6862{
6863 struct vfsmount *mnt;
6864 struct file_system_type *type;
6865
6866 /*
6867 * To maintain backward compatibility for tools that mount
6868 * debugfs to get to the tracing facility, tracefs is automatically
6869 * mounted to the debugfs/tracing directory.
6870 */
6871 type = get_fs_type("tracefs");
6872 if (!type)
6873 return NULL;
6874 mnt = vfs_kern_mount(type, 0, "tracefs", NULL);
6875 put_filesystem(type);
6876 if (IS_ERR(mnt))
6877 return NULL;
6878 mntget(mnt);
6879
6880 return mnt;
6881}
6882
7eeafbca
SRRH
6883/**
6884 * tracing_init_dentry - initialize top level trace array
6885 *
6886 * This is called when creating files or directories in the tracing
6887 * directory. It is called via fs_initcall() by any of the boot up code
6888 * and expects to return the dentry of the top level tracing directory.
6889 */
6890struct dentry *tracing_init_dentry(void)
6891{
6892 struct trace_array *tr = &global_trace;
6893
f76180bc 6894 /* The top level trace array uses NULL as parent */
7eeafbca 6895 if (tr->dir)
f76180bc 6896 return NULL;
7eeafbca 6897
8b129199
JW
6898 if (WARN_ON(!tracefs_initialized()) ||
6899 (IS_ENABLED(CONFIG_DEBUG_FS) &&
6900 WARN_ON(!debugfs_initialized())))
7eeafbca
SRRH
6901 return ERR_PTR(-ENODEV);
6902
f76180bc
SRRH
6903 /*
6904 * As there may still be users that expect the tracing
6905 * files to exist in debugfs/tracing, we must automount
6906 * the tracefs file system there, so older tools still
6907 * work with the newer kerenl.
6908 */
6909 tr->dir = debugfs_create_automount("tracing", NULL,
6910 trace_automount, NULL);
7eeafbca
SRRH
6911 if (!tr->dir) {
6912 pr_warn_once("Could not create debugfs directory 'tracing'\n");
6913 return ERR_PTR(-ENOMEM);
6914 }
6915
8434dc93 6916 return NULL;
7eeafbca
SRRH
6917}
6918
0c564a53
SRRH
6919extern struct trace_enum_map *__start_ftrace_enum_maps[];
6920extern struct trace_enum_map *__stop_ftrace_enum_maps[];
6921
6922static void __init trace_enum_init(void)
6923{
3673b8e4
SRRH
6924 int len;
6925
6926 len = __stop_ftrace_enum_maps - __start_ftrace_enum_maps;
9828413d 6927 trace_insert_enum_map(NULL, __start_ftrace_enum_maps, len);
3673b8e4
SRRH
6928}
6929
6930#ifdef CONFIG_MODULES
6931static void trace_module_add_enums(struct module *mod)
6932{
6933 if (!mod->num_trace_enums)
6934 return;
6935
6936 /*
6937 * Modules with bad taint do not have events created, do
6938 * not bother with enums either.
6939 */
6940 if (trace_module_has_bad_taint(mod))
6941 return;
6942
9828413d 6943 trace_insert_enum_map(mod, mod->trace_enums, mod->num_trace_enums);
3673b8e4
SRRH
6944}
6945
9828413d
SRRH
6946#ifdef CONFIG_TRACE_ENUM_MAP_FILE
6947static void trace_module_remove_enums(struct module *mod)
6948{
6949 union trace_enum_map_item *map;
6950 union trace_enum_map_item **last = &trace_enum_maps;
6951
6952 if (!mod->num_trace_enums)
6953 return;
6954
6955 mutex_lock(&trace_enum_mutex);
6956
6957 map = trace_enum_maps;
6958
6959 while (map) {
6960 if (map->head.mod == mod)
6961 break;
6962 map = trace_enum_jmp_to_tail(map);
6963 last = &map->tail.next;
6964 map = map->tail.next;
6965 }
6966 if (!map)
6967 goto out;
6968
6969 *last = trace_enum_jmp_to_tail(map)->tail.next;
6970 kfree(map);
6971 out:
6972 mutex_unlock(&trace_enum_mutex);
6973}
6974#else
/* Without CONFIG_TRACE_ENUM_MAP_FILE this is a no-op. */
static inline void trace_module_remove_enums(struct module *mod)
{
}
6976#endif /* CONFIG_TRACE_ENUM_MAP_FILE */
6977
3673b8e4
SRRH
6978static int trace_module_notify(struct notifier_block *self,
6979 unsigned long val, void *data)
6980{
6981 struct module *mod = data;
6982
6983 switch (val) {
6984 case MODULE_STATE_COMING:
6985 trace_module_add_enums(mod);
6986 break;
9828413d
SRRH
6987 case MODULE_STATE_GOING:
6988 trace_module_remove_enums(mod);
6989 break;
3673b8e4
SRRH
6990 }
6991
6992 return 0;
0c564a53
SRRH
6993}
6994
3673b8e4
SRRH
6995static struct notifier_block trace_module_nb = {
6996 .notifier_call = trace_module_notify,
6997 .priority = 0,
6998};
9828413d 6999#endif /* CONFIG_MODULES */
3673b8e4 7000
8434dc93 7001static __init int tracer_init_tracefs(void)
bc0c38d1
SR
7002{
7003 struct dentry *d_tracer;
bc0c38d1 7004
7e53bd42
LJ
7005 trace_access_lock_init();
7006
bc0c38d1 7007 d_tracer = tracing_init_dentry();
14a5ae40 7008 if (IS_ERR(d_tracer))
ed6f1c99 7009 return 0;
bc0c38d1 7010
8434dc93 7011 init_tracer_tracefs(&global_trace, d_tracer);
bc0c38d1 7012
5452af66 7013 trace_create_file("tracing_thresh", 0644, d_tracer,
6508fa76 7014 &global_trace, &tracing_thresh_fops);
a8259075 7015
339ae5d3 7016 trace_create_file("README", 0444, d_tracer,
5452af66
FW
7017 NULL, &tracing_readme_fops);
7018
69abe6a5
AP
7019 trace_create_file("saved_cmdlines", 0444, d_tracer,
7020 NULL, &tracing_saved_cmdlines_fops);
5bf9a1ee 7021
939c7a4f
YY
7022 trace_create_file("saved_cmdlines_size", 0644, d_tracer,
7023 NULL, &tracing_saved_cmdlines_size_fops);
7024
0c564a53
SRRH
7025 trace_enum_init();
7026
9828413d
SRRH
7027 trace_create_enum_file(d_tracer);
7028
3673b8e4
SRRH
7029#ifdef CONFIG_MODULES
7030 register_module_notifier(&trace_module_nb);
7031#endif
7032
bc0c38d1 7033#ifdef CONFIG_DYNAMIC_FTRACE
5452af66
FW
7034 trace_create_file("dyn_ftrace_total_info", 0444, d_tracer,
7035 &ftrace_update_tot_cnt, &tracing_dyn_info_fops);
bc0c38d1 7036#endif
b04cc6b1 7037
277ba044 7038 create_trace_instances(d_tracer);
5452af66 7039
37aea98b 7040 update_tracer_options(&global_trace);
09d23a1d 7041
b5ad384e 7042 return 0;
bc0c38d1
SR
7043}
7044
3f5a54e3
SR
7045static int trace_panic_handler(struct notifier_block *this,
7046 unsigned long event, void *unused)
7047{
944ac425 7048 if (ftrace_dump_on_oops)
cecbca96 7049 ftrace_dump(ftrace_dump_on_oops);
3f5a54e3
SR
7050 return NOTIFY_OK;
7051}
7052
7053static struct notifier_block trace_panic_notifier = {
7054 .notifier_call = trace_panic_handler,
7055 .next = NULL,
7056 .priority = 150 /* priority: INT_MAX >= x >= 0 */
7057};
7058
7059static int trace_die_handler(struct notifier_block *self,
7060 unsigned long val,
7061 void *data)
7062{
7063 switch (val) {
7064 case DIE_OOPS:
944ac425 7065 if (ftrace_dump_on_oops)
cecbca96 7066 ftrace_dump(ftrace_dump_on_oops);
3f5a54e3
SR
7067 break;
7068 default:
7069 break;
7070 }
7071 return NOTIFY_OK;
7072}
7073
7074static struct notifier_block trace_die_notifier = {
7075 .notifier_call = trace_die_handler,
7076 .priority = 200
7077};
7078
/*
 * Cap on how many bytes of a trace_seq are handed to printk() in one go.
 * printk is set to a max of 1024; we really don't need it that big, and
 * nothing should be printing 1000 characters anyway.
 */
#define TRACE_MAX_PRINT		1000

/*
 * Log level used for the ftrace dump. Defined in one place so that the
 * level can be changed without touching every printk() in the dump path.
 */
#define KERN_TRACE		KERN_EMERG
3f5a54e3 7091
955b61e5 7092void
3f5a54e3
SR
7093trace_printk_seq(struct trace_seq *s)
7094{
7095 /* Probably should print a warning here. */
3a161d99
SRRH
7096 if (s->seq.len >= TRACE_MAX_PRINT)
7097 s->seq.len = TRACE_MAX_PRINT;
3f5a54e3 7098
820b75f6
SRRH
7099 /*
7100 * More paranoid code. Although the buffer size is set to
7101 * PAGE_SIZE, and TRACE_MAX_PRINT is 1000, this is just
7102 * an extra layer of protection.
7103 */
7104 if (WARN_ON_ONCE(s->seq.len >= s->seq.size))
7105 s->seq.len = s->seq.size - 1;
3f5a54e3
SR
7106
7107 /* should be zero ended, but we are paranoid. */
3a161d99 7108 s->buffer[s->seq.len] = 0;
3f5a54e3
SR
7109
7110 printk(KERN_TRACE "%s", s->buffer);
7111
f9520750 7112 trace_seq_init(s);
3f5a54e3
SR
7113}
7114
955b61e5
JW
7115void trace_init_global_iter(struct trace_iterator *iter)
7116{
7117 iter->tr = &global_trace;
2b6080f2 7118 iter->trace = iter->tr->current_trace;
ae3b5093 7119 iter->cpu_file = RING_BUFFER_ALL_CPUS;
12883efb 7120 iter->trace_buffer = &global_trace.trace_buffer;
b2f974d6
CS
7121
7122 if (iter->trace && iter->trace->open)
7123 iter->trace->open(iter);
7124
7125 /* Annotate start of buffers if we had overruns */
7126 if (ring_buffer_overruns(iter->trace_buffer->buffer))
7127 iter->iter_flags |= TRACE_FILE_ANNOTATE;
7128
7129 /* Output in nanoseconds only if we are using a clock in nanoseconds. */
7130 if (trace_clocks[iter->tr->clock_id].in_ns)
7131 iter->iter_flags |= TRACE_FILE_TIME_IN_NS;
955b61e5
JW
7132}
7133
7fe70b57 7134void ftrace_dump(enum ftrace_dump_mode oops_dump_mode)
3f5a54e3 7135{
3f5a54e3
SR
7136 /* use static because iter can be a bit big for the stack */
7137 static struct trace_iterator iter;
7fe70b57 7138 static atomic_t dump_running;
983f938a 7139 struct trace_array *tr = &global_trace;
cf586b61 7140 unsigned int old_userobj;
d769041f
SR
7141 unsigned long flags;
7142 int cnt = 0, cpu;
3f5a54e3 7143
7fe70b57
SRRH
7144 /* Only allow one dump user at a time. */
7145 if (atomic_inc_return(&dump_running) != 1) {
7146 atomic_dec(&dump_running);
7147 return;
7148 }
3f5a54e3 7149
7fe70b57
SRRH
7150 /*
7151 * Always turn off tracing when we dump.
7152 * We don't need to show trace output of what happens
7153 * between multiple crashes.
7154 *
7155 * If the user does a sysrq-z, then they can re-enable
7156 * tracing with echo 1 > tracing_on.
7157 */
0ee6b6cf 7158 tracing_off();
cf586b61 7159
7fe70b57 7160 local_irq_save(flags);
3f5a54e3 7161
38dbe0b1 7162 /* Simulate the iterator */
955b61e5
JW
7163 trace_init_global_iter(&iter);
7164
d769041f 7165 for_each_tracing_cpu(cpu) {
5e2d5ef8 7166 atomic_inc(&per_cpu_ptr(iter.trace_buffer->data, cpu)->disabled);
d769041f
SR
7167 }
7168
983f938a 7169 old_userobj = tr->trace_flags & TRACE_ITER_SYM_USEROBJ;
cf586b61 7170
b54d3de9 7171 /* don't look at user memory in panic mode */
983f938a 7172 tr->trace_flags &= ~TRACE_ITER_SYM_USEROBJ;
b54d3de9 7173
cecbca96
FW
7174 switch (oops_dump_mode) {
7175 case DUMP_ALL:
ae3b5093 7176 iter.cpu_file = RING_BUFFER_ALL_CPUS;
cecbca96
FW
7177 break;
7178 case DUMP_ORIG:
7179 iter.cpu_file = raw_smp_processor_id();
7180 break;
7181 case DUMP_NONE:
7182 goto out_enable;
7183 default:
7184 printk(KERN_TRACE "Bad dumping mode, switching to all CPUs dump\n");
ae3b5093 7185 iter.cpu_file = RING_BUFFER_ALL_CPUS;
cecbca96
FW
7186 }
7187
7188 printk(KERN_TRACE "Dumping ftrace buffer:\n");
3f5a54e3 7189
7fe70b57
SRRH
7190 /* Did function tracer already get disabled? */
7191 if (ftrace_is_dead()) {
7192 printk("# WARNING: FUNCTION TRACING IS CORRUPTED\n");
7193 printk("# MAY BE MISSING FUNCTION EVENTS\n");
7194 }
7195
3f5a54e3
SR
7196 /*
7197 * We need to stop all tracing on all CPUS to read the
7198 * the next buffer. This is a bit expensive, but is
7199 * not done often. We fill all what we can read,
7200 * and then release the locks again.
7201 */
7202
3f5a54e3
SR
7203 while (!trace_empty(&iter)) {
7204
7205 if (!cnt)
7206 printk(KERN_TRACE "---------------------------------\n");
7207
7208 cnt++;
7209
7210 /* reset all but tr, trace, and overruns */
7211 memset(&iter.seq, 0,
7212 sizeof(struct trace_iterator) -
7213 offsetof(struct trace_iterator, seq));
7214 iter.iter_flags |= TRACE_FILE_LAT_FMT;
7215 iter.pos = -1;
7216
955b61e5 7217 if (trace_find_next_entry_inc(&iter) != NULL) {
74e7ff8c
LJ
7218 int ret;
7219
7220 ret = print_trace_line(&iter);
7221 if (ret != TRACE_TYPE_NO_CONSUME)
7222 trace_consume(&iter);
3f5a54e3 7223 }
b892e5c8 7224 touch_nmi_watchdog();
3f5a54e3
SR
7225
7226 trace_printk_seq(&iter.seq);
7227 }
7228
7229 if (!cnt)
7230 printk(KERN_TRACE " (ftrace buffer empty)\n");
7231 else
7232 printk(KERN_TRACE "---------------------------------\n");
7233
cecbca96 7234 out_enable:
983f938a 7235 tr->trace_flags |= old_userobj;
cf586b61 7236
7fe70b57
SRRH
7237 for_each_tracing_cpu(cpu) {
7238 atomic_dec(&per_cpu_ptr(iter.trace_buffer->data, cpu)->disabled);
cf586b61 7239 }
7fe70b57 7240 atomic_dec(&dump_running);
cd891ae0 7241 local_irq_restore(flags);
3f5a54e3 7242}
a8eecf22 7243EXPORT_SYMBOL_GPL(ftrace_dump);
cf586b61 7244
3928a8a2 7245__init static int tracer_alloc_buffers(void)
bc0c38d1 7246{
73c5162a 7247 int ring_buf_size;
9e01c1b7 7248 int ret = -ENOMEM;
4c11d7ae 7249
b5e87c05
SRRH
7250 /*
7251 * Make sure we don't accidently add more trace options
7252 * than we have bits for.
7253 */
9a38a885 7254 BUILD_BUG_ON(TRACE_ITER_LAST_BIT > TRACE_FLAGS_MAX_SIZE);
b5e87c05 7255
9e01c1b7
RR
7256 if (!alloc_cpumask_var(&tracing_buffer_mask, GFP_KERNEL))
7257 goto out;
7258
ccfe9e42 7259 if (!alloc_cpumask_var(&global_trace.tracing_cpumask, GFP_KERNEL))
9e01c1b7 7260 goto out_free_buffer_mask;
4c11d7ae 7261
07d777fe
SR
7262 /* Only allocate trace_printk buffers if a trace_printk exists */
7263 if (__stop___trace_bprintk_fmt != __start___trace_bprintk_fmt)
81698831 7264 /* Must be called before global_trace.buffer is allocated */
07d777fe
SR
7265 trace_printk_init_buffers();
7266
73c5162a
SR
7267 /* To save memory, keep the ring buffer size to its minimum */
7268 if (ring_buffer_expanded)
7269 ring_buf_size = trace_buf_size;
7270 else
7271 ring_buf_size = 1;
7272
9e01c1b7 7273 cpumask_copy(tracing_buffer_mask, cpu_possible_mask);
ccfe9e42 7274 cpumask_copy(global_trace.tracing_cpumask, cpu_all_mask);
9e01c1b7 7275
2b6080f2
SR
7276 raw_spin_lock_init(&global_trace.start_lock);
7277
2c4a33ab
SRRH
7278 /* Used for event triggers */
7279 temp_buffer = ring_buffer_alloc(PAGE_SIZE, RB_FL_OVERWRITE);
7280 if (!temp_buffer)
7281 goto out_free_cpumask;
7282
939c7a4f
YY
7283 if (trace_create_savedcmd() < 0)
7284 goto out_free_temp_buffer;
7285
9e01c1b7 7286 /* TODO: make the number of buffers hot pluggable with CPUS */
737223fb 7287 if (allocate_trace_buffers(&global_trace, ring_buf_size) < 0) {
3928a8a2
SR
7288 printk(KERN_ERR "tracer: failed to allocate ring buffer!\n");
7289 WARN_ON(1);
939c7a4f 7290 goto out_free_savedcmd;
4c11d7ae 7291 }
a7603ff4 7292
499e5470
SR
7293 if (global_trace.buffer_disabled)
7294 tracing_off();
4c11d7ae 7295
e1e232ca
SR
7296 if (trace_boot_clock) {
7297 ret = tracing_set_clock(&global_trace, trace_boot_clock);
7298 if (ret < 0)
a395d6a7
JP
7299 pr_warn("Trace clock %s not defined, going back to default\n",
7300 trace_boot_clock);
e1e232ca
SR
7301 }
7302
ca164318
SRRH
7303 /*
7304 * register_tracer() might reference current_trace, so it
7305 * needs to be set before we register anything. This is
7306 * just a bootstrap of current_trace anyway.
7307 */
2b6080f2
SR
7308 global_trace.current_trace = &nop_trace;
7309
0b9b12c1
SRRH
7310 global_trace.max_lock = (arch_spinlock_t)__ARCH_SPIN_LOCK_UNLOCKED;
7311
4104d326
SRRH
7312 ftrace_init_global_array_ops(&global_trace);
7313
9a38a885
SRRH
7314 init_trace_flags_index(&global_trace);
7315
ca164318
SRRH
7316 register_tracer(&nop_trace);
7317
60a11774
SR
7318 /* All seems OK, enable tracing */
7319 tracing_disabled = 0;
3928a8a2 7320
3f5a54e3
SR
7321 atomic_notifier_chain_register(&panic_notifier_list,
7322 &trace_panic_notifier);
7323
7324 register_die_notifier(&trace_die_notifier);
2fc1dfbe 7325
ae63b31e
SR
7326 global_trace.flags = TRACE_ARRAY_FL_GLOBAL;
7327
7328 INIT_LIST_HEAD(&global_trace.systems);
7329 INIT_LIST_HEAD(&global_trace.events);
7330 list_add(&global_trace.list, &ftrace_trace_arrays);
7331
a4d1e688 7332 apply_trace_boot_options();
7bcfaf54 7333
77fd5c15
SRRH
7334 register_snapshot_cmd();
7335
2fc1dfbe 7336 return 0;
3f5a54e3 7337
939c7a4f
YY
7338out_free_savedcmd:
7339 free_saved_cmdlines_buffer(savedcmd);
2c4a33ab
SRRH
7340out_free_temp_buffer:
7341 ring_buffer_free(temp_buffer);
9e01c1b7 7342out_free_cpumask:
ccfe9e42 7343 free_cpumask_var(global_trace.tracing_cpumask);
9e01c1b7
RR
7344out_free_buffer_mask:
7345 free_cpumask_var(tracing_buffer_mask);
7346out:
7347 return ret;
bc0c38d1 7348}
b2821ae6 7349
5f893b26
SRRH
7350void __init trace_init(void)
7351{
0daa2302
SRRH
7352 if (tracepoint_printk) {
7353 tracepoint_print_iter =
7354 kmalloc(sizeof(*tracepoint_print_iter), GFP_KERNEL);
7355 if (WARN_ON(!tracepoint_print_iter))
7356 tracepoint_printk = 0;
7357 }
5f893b26 7358 tracer_alloc_buffers();
0c564a53 7359 trace_event_init();
5f893b26
SRRH
7360}
7361
b2821ae6
SR
7362__init static int clear_boot_tracer(void)
7363{
7364 /*
7365 * The default tracer at boot buffer is an init section.
7366 * This function is called in lateinit. If we did not
7367 * find the boot tracer, then clear it out, to prevent
7368 * later registration from accessing the buffer that is
7369 * about to be freed.
7370 */
7371 if (!default_bootup_tracer)
7372 return 0;
7373
7374 printk(KERN_INFO "ftrace bootup tracer '%s' not registered.\n",
7375 default_bootup_tracer);
7376 default_bootup_tracer = NULL;
7377
7378 return 0;
7379}
7380
/* Initcall registrations for the two init functions defined above. */
fs_initcall(tracer_init_tracefs);
late_initcall(clear_boot_tracer);