/*
 * ring buffer based function tracer
 *
 * Copyright (C) 2007-2012 Steven Rostedt <srostedt@redhat.com>
 * Copyright (C) 2008 Ingo Molnar <mingo@redhat.com>
 *
 * Originally taken from the RT patch by:
 *    Arnaldo Carvalho de Melo <acme@redhat.com>
 *
 * Based on code from the latency_tracer, that is:
 *  Copyright (C) 2004-2006 Ingo Molnar
 *  Copyright (C) 2004 Nadia Yvette Chambers
 */
#include <linux/ring_buffer.h>
#include <generated/utsrelease.h>
#include <linux/stacktrace.h>
#include <linux/writeback.h>
#include <linux/kallsyms.h>
#include <linux/seq_file.h>
#include <linux/notifier.h>
#include <linux/irqflags.h>
#include <linux/debugfs.h>
#include <linux/tracefs.h>
#include <linux/pagemap.h>
#include <linux/hardirq.h>
#include <linux/linkage.h>
#include <linux/uaccess.h>
#include <linux/kprobes.h>
#include <linux/ftrace.h>
#include <linux/module.h>
#include <linux/percpu.h>
#include <linux/splice.h>
#include <linux/kdebug.h>
#include <linux/string.h>
#include <linux/mount.h>
#include <linux/rwsem.h>
#include <linux/slab.h>
#include <linux/ctype.h>
#include <linux/init.h>
#include <linux/poll.h>
#include <linux/nmi.h>
#include <linux/fs.h>
#include <linux/sched/rt.h>

#include "trace.h"
#include "trace_output.h"

/*
 * On boot up, the ring buffer is set to the minimum size, so that
 * we do not waste memory on systems that are not using tracing.
 */
bool ring_buffer_expanded;

/*
 * We need to change this state when a selftest is running.
 * A selftest will lurk into the ring-buffer to count the
 * entries inserted during the selftest although some concurrent
 * insertions into the ring-buffer such as trace_printk could occur
 * at the same time, giving false positive or negative results.
 */
static bool __read_mostly tracing_selftest_running;

/*
 * If a tracer is running, we do not want to run SELFTEST.
 */
bool __read_mostly tracing_selftest_disabled;

/* Pipe tracepoints to printk */
struct trace_iterator *tracepoint_print_iter;
int tracepoint_printk;

/* For tracers that don't implement custom flags */
static struct tracer_opt dummy_tracer_opt[] = {
	{ }
};

static int
dummy_set_flag(struct trace_array *tr, u32 old_flags, u32 bit, int set)
{
	return 0;
}

/*
 * To prevent the comm cache from being overwritten when no
 * tracing is active, only save the comm when a trace event
 * occurred.
 */
static DEFINE_PER_CPU(bool, trace_cmdline_save);

/*
 * Kill all tracing for good (never come back).
 * It is initialized to 1 but will turn to zero if the initialization
 * of the tracer is successful. But that is the only place that sets
 * this back to zero.
 */
static int tracing_disabled = 1;

cpumask_var_t __read_mostly tracing_buffer_mask;

/*
 * ftrace_dump_on_oops - variable to dump ftrace buffer on oops
 *
 * If there is an oops (or kernel panic) and the ftrace_dump_on_oops
 * is set, then ftrace_dump is called. This will output the contents
 * of the ftrace buffers to the console. This is very useful for
 * capturing traces that lead to crashes and outputting them to a
 * serial console.
 *
 * It is default off, but you can enable it with either specifying
 * "ftrace_dump_on_oops" in the kernel command line, or setting
 * /proc/sys/kernel/ftrace_dump_on_oops
 * Set 1 if you want to dump buffers of all CPUs
 * Set 2 if you want to dump the buffer of the CPU that triggered oops
 */

enum ftrace_dump_mode ftrace_dump_on_oops;

/* When set, tracing will stop when a WARN*() is hit */
int __disable_trace_on_warning;

#ifdef CONFIG_TRACE_ENUM_MAP_FILE
/* Map of enums to their values, for "enum_map" file */
struct trace_enum_map_head {
	struct module			*mod;
	unsigned long			length;
};

union trace_enum_map_item;

struct trace_enum_map_tail {
	/*
	 * "end" is first and points to NULL as it must be different
	 * than "mod" or "enum_string"
	 */
	union trace_enum_map_item	*next;
	const char			*end;	/* points to NULL */
};

static DEFINE_MUTEX(trace_enum_mutex);

/*
 * The trace_enum_maps are saved in an array with two extra elements,
 * one at the beginning, and one at the end. The beginning item contains
 * the count of the saved maps (head.length), and the module they
 * belong to if not built in (head.mod). The ending item contains a
 * pointer to the next array of saved enum_map items.
 */
union trace_enum_map_item {
	struct trace_enum_map		map;
	struct trace_enum_map_head	head;
	struct trace_enum_map_tail	tail;
};

static union trace_enum_map_item *trace_enum_maps;
#endif /* CONFIG_TRACE_ENUM_MAP_FILE */

static int tracing_set_tracer(struct trace_array *tr, const char *buf);

#define MAX_TRACER_SIZE		100
static char bootup_tracer_buf[MAX_TRACER_SIZE] __initdata;
static char *default_bootup_tracer;

static bool allocate_snapshot;

static int __init set_cmdline_ftrace(char *str)
{
	strlcpy(bootup_tracer_buf, str, MAX_TRACER_SIZE);
	default_bootup_tracer = bootup_tracer_buf;
	/* We are using ftrace early, expand it */
	ring_buffer_expanded = true;
	return 1;
}
__setup("ftrace=", set_cmdline_ftrace);

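/*
 * Illustrative usage (not part of this file): booting with
 * "ftrace=function" selects the function tracer before userspace is
 * up. The name is only remembered here; register_tracer() matches it
 * against default_bootup_tracer once the tracer registers itself.
 */
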
static int __init set_ftrace_dump_on_oops(char *str)
{
	if (*str++ != '=' || !*str) {
		ftrace_dump_on_oops = DUMP_ALL;
		return 1;
	}

	if (!strcmp("orig_cpu", str)) {
		ftrace_dump_on_oops = DUMP_ORIG;
		return 1;
	}

	return 0;
}
__setup("ftrace_dump_on_oops", set_ftrace_dump_on_oops);

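/*
 * Illustrative usage (not part of this file): a bare
 * "ftrace_dump_on_oops" on the command line dumps every CPU's buffer
 * on an oops (DUMP_ALL), while "ftrace_dump_on_oops=orig_cpu" dumps
 * only the buffer of the CPU that triggered the oops (DUMP_ORIG).
 */
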
static int __init stop_trace_on_warning(char *str)
{
	if ((strcmp(str, "=0") != 0 && strcmp(str, "=off") != 0))
		__disable_trace_on_warning = 1;
	return 1;
}
__setup("traceoff_on_warning", stop_trace_on_warning);

static int __init boot_alloc_snapshot(char *str)
{
	allocate_snapshot = true;
	/* We also need the main ring buffer expanded */
	ring_buffer_expanded = true;
	return 1;
}
__setup("alloc_snapshot", boot_alloc_snapshot);

static char trace_boot_options_buf[MAX_TRACER_SIZE] __initdata;

static int __init set_trace_boot_options(char *str)
{
	strlcpy(trace_boot_options_buf, str, MAX_TRACER_SIZE);
	return 0;
}
__setup("trace_options=", set_trace_boot_options);

static char trace_boot_clock_buf[MAX_TRACER_SIZE] __initdata;
static char *trace_boot_clock __initdata;

static int __init set_trace_boot_clock(char *str)
{
	strlcpy(trace_boot_clock_buf, str, MAX_TRACER_SIZE);
	trace_boot_clock = trace_boot_clock_buf;
	return 0;
}
__setup("trace_clock=", set_trace_boot_clock);

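/*
 * Illustrative usage (not part of this file):
 * "trace_options=stacktrace,sym-offset" applies option flags at boot,
 * and "trace_clock=global" picks an entry from the trace_clocks[]
 * table below before the clock can be changed through tracefs.
 */
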
static int __init set_tracepoint_printk(char *str)
{
	if ((strcmp(str, "=0") != 0 && strcmp(str, "=off") != 0))
		tracepoint_printk = 1;
	return 1;
}
__setup("tp_printk", set_tracepoint_printk);

unsigned long long ns2usecs(cycle_t nsec)
{
	nsec += 500;
	do_div(nsec, 1000);
	return nsec;
}

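/*
 * ns2usecs() rounds to the nearest microsecond: for example,
 * 1499 ns -> (1499 + 500) / 1000 = 1 us, while 1500 ns -> 2 us.
 */
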
/* trace_flags holds trace_options default values */
#define TRACE_DEFAULT_FLAGS						\
	(FUNCTION_DEFAULT_FLAGS |					\
	 TRACE_ITER_PRINT_PARENT | TRACE_ITER_PRINTK |			\
	 TRACE_ITER_ANNOTATE | TRACE_ITER_CONTEXT_INFO |		\
	 TRACE_ITER_RECORD_CMD | TRACE_ITER_OVERWRITE |			\
	 TRACE_ITER_IRQ_INFO | TRACE_ITER_MARKERS)

/* trace_options that are only supported by global_trace */
#define TOP_LEVEL_TRACE_FLAGS (TRACE_ITER_PRINTK |			\
	       TRACE_ITER_PRINTK_MSGONLY | TRACE_ITER_RECORD_CMD)


/*
 * The global_trace is the descriptor that holds the tracing
 * buffers for the live tracing. For each CPU, it contains
 * a linked list of pages that will store trace entries. The
 * page descriptor of the pages in the memory is used to hold
 * the linked list by linking the lru item in the page descriptor
 * to each of the pages in the buffer per CPU.
 *
 * For each active CPU there is a data field that holds the
 * pages for the buffer for that CPU. Each CPU has the same number
 * of pages allocated for its buffer.
 */
static struct trace_array global_trace = {
	.trace_flags = TRACE_DEFAULT_FLAGS,
};

LIST_HEAD(ftrace_trace_arrays);

int trace_array_get(struct trace_array *this_tr)
{
	struct trace_array *tr;
	int ret = -ENODEV;

	mutex_lock(&trace_types_lock);
	list_for_each_entry(tr, &ftrace_trace_arrays, list) {
		if (tr == this_tr) {
			tr->ref++;
			ret = 0;
			break;
		}
	}
	mutex_unlock(&trace_types_lock);

	return ret;
}

static void __trace_array_put(struct trace_array *this_tr)
{
	WARN_ON(!this_tr->ref);
	this_tr->ref--;
}

void trace_array_put(struct trace_array *this_tr)
{
	mutex_lock(&trace_types_lock);
	__trace_array_put(this_tr);
	mutex_unlock(&trace_types_lock);
}

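/*
 * Illustrative pairing (not part of this file): callers that hand a
 * trace_array to an open file call trace_array_get() in their .open
 * handler and trace_array_put() in .release, so the array cannot go
 * away while the file is held open.
 */
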
int filter_check_discard(struct trace_event_file *file, void *rec,
			 struct ring_buffer *buffer,
			 struct ring_buffer_event *event)
{
	if (unlikely(file->flags & EVENT_FILE_FL_FILTERED) &&
	    !filter_match_preds(file->filter, rec)) {
		ring_buffer_discard_commit(buffer, event);
		return 1;
	}

	return 0;
}
EXPORT_SYMBOL_GPL(filter_check_discard);

int call_filter_check_discard(struct trace_event_call *call, void *rec,
			      struct ring_buffer *buffer,
			      struct ring_buffer_event *event)
{
	if (unlikely(call->flags & TRACE_EVENT_FL_FILTERED) &&
	    !filter_match_preds(call->filter, rec)) {
		ring_buffer_discard_commit(buffer, event);
		return 1;
	}

	return 0;
}
EXPORT_SYMBOL_GPL(call_filter_check_discard);

static cycle_t buffer_ftrace_now(struct trace_buffer *buf, int cpu)
{
	u64 ts;

	/* Early boot up does not have a buffer yet */
	if (!buf->buffer)
		return trace_clock_local();

	ts = ring_buffer_time_stamp(buf->buffer, cpu);
	ring_buffer_normalize_time_stamp(buf->buffer, cpu, &ts);

	return ts;
}

cycle_t ftrace_now(int cpu)
{
	return buffer_ftrace_now(&global_trace.trace_buffer, cpu);
}

/**
 * tracing_is_enabled - Show if global_trace has been disabled
 *
 * Shows if the global trace has been enabled or not. It uses the
 * mirror flag "buffer_disabled" to be used in fast paths such as for
 * the irqsoff tracer. But it may be inaccurate due to races. If you
 * need to know the accurate state, use tracing_is_on() which is a little
 * slower, but accurate.
 */
int tracing_is_enabled(void)
{
	/*
	 * For quick access (irqsoff uses this in fast path), just
	 * return the mirror variable of the state of the ring buffer.
	 * It's a little racy, but we don't really care.
	 */
	smp_rmb();
	return !global_trace.buffer_disabled;
}

/*
 * trace_buf_size is the size in bytes that is allocated
 * for a buffer. Note, the number of bytes is always rounded
 * to page size.
 *
 * This number is purposely set to a low number of 16384.
 * If the dump on oops happens, it will be much appreciated
 * to not have to wait for all that output. Anyway this can be
 * boot time and run time configurable.
 */
#define TRACE_BUF_SIZE_DEFAULT	1441792UL /* 16384 * 88 (sizeof(entry)) */

static unsigned long trace_buf_size = TRACE_BUF_SIZE_DEFAULT;

/* trace_types holds a linked list of available tracers. */
static struct tracer *trace_types __read_mostly;

/*
 * trace_types_lock is used to protect the trace_types list.
 */
DEFINE_MUTEX(trace_types_lock);

/*
 * serialize the access of the ring buffer
 *
 * ring buffer serializes readers, but it is low level protection.
 * The validity of the events (which are returned by ring_buffer_peek() etc.)
 * is not protected by the ring buffer.
 *
 * The content of events may become garbage if we let other processes
 * consume these events concurrently:
 *   A) the page of the consumed events may become a normal page
 *      (not a reader page) in the ring buffer, and this page will be
 *      rewritten by the events producer.
 *   B) The page of the consumed events may become a page for splice_read,
 *      and this page will be returned to the system.
 *
 * These primitives allow multiple processes to access different cpu
 * ring buffers concurrently.
 *
 * These primitives don't distinguish read-only and read-consume access.
 * Multiple read-only accesses are also serialized.
 */

#ifdef CONFIG_SMP
static DECLARE_RWSEM(all_cpu_access_lock);
static DEFINE_PER_CPU(struct mutex, cpu_access_lock);

static inline void trace_access_lock(int cpu)
{
	if (cpu == RING_BUFFER_ALL_CPUS) {
		/* gain it for accessing the whole ring buffer. */
		down_write(&all_cpu_access_lock);
	} else {
		/* gain it for accessing a cpu ring buffer. */

		/* Firstly block other trace_access_lock(RING_BUFFER_ALL_CPUS). */
		down_read(&all_cpu_access_lock);

		/* Secondly block other access to this @cpu ring buffer. */
		mutex_lock(&per_cpu(cpu_access_lock, cpu));
	}
}

static inline void trace_access_unlock(int cpu)
{
	if (cpu == RING_BUFFER_ALL_CPUS) {
		up_write(&all_cpu_access_lock);
	} else {
		mutex_unlock(&per_cpu(cpu_access_lock, cpu));
		up_read(&all_cpu_access_lock);
	}
}

static inline void trace_access_lock_init(void)
{
	int cpu;

	for_each_possible_cpu(cpu)
		mutex_init(&per_cpu(cpu_access_lock, cpu));
}

#else

static DEFINE_MUTEX(access_lock);

static inline void trace_access_lock(int cpu)
{
	(void)cpu;
	mutex_lock(&access_lock);
}

static inline void trace_access_unlock(int cpu)
{
	(void)cpu;
	mutex_unlock(&access_lock);
}

static inline void trace_access_lock_init(void)
{
}

#endif

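/*
 * Resulting semantics, sketched (not part of this file): per-cpu
 * readers take all_cpu_access_lock shared plus their cpu's mutex, so
 * readers of different cpu buffers run in parallel, while a
 * RING_BUFFER_ALL_CPUS reader takes the rwsem exclusively and waits
 * out every per-cpu reader.
 */
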
#ifdef CONFIG_STACKTRACE
static void __ftrace_trace_stack(struct ring_buffer *buffer,
				 unsigned long flags,
				 int skip, int pc, struct pt_regs *regs);
static inline void ftrace_trace_stack(struct trace_array *tr,
				      struct ring_buffer *buffer,
				      unsigned long flags,
				      int skip, int pc, struct pt_regs *regs);

#else
static inline void __ftrace_trace_stack(struct ring_buffer *buffer,
					unsigned long flags,
					int skip, int pc, struct pt_regs *regs)
{
}
static inline void ftrace_trace_stack(struct trace_array *tr,
				      struct ring_buffer *buffer,
				      unsigned long flags,
				      int skip, int pc, struct pt_regs *regs)
{
}

#endif

static void tracer_tracing_on(struct trace_array *tr)
{
	if (tr->trace_buffer.buffer)
		ring_buffer_record_on(tr->trace_buffer.buffer);
	/*
	 * This flag is looked at when buffers haven't been allocated
	 * yet, or by some tracers (like irqsoff), that just want to
	 * know if the ring buffer has been disabled, but it can handle
	 * races of where it gets disabled but we still do a record.
	 * As the check is in the fast path of the tracers, it is more
	 * important to be fast than accurate.
	 */
	tr->buffer_disabled = 0;
	/* Make the flag seen by readers */
	smp_wmb();
}

/**
 * tracing_on - enable tracing buffers
 *
 * This function enables tracing buffers that may have been
 * disabled with tracing_off.
 */
void tracing_on(void)
{
	tracer_tracing_on(&global_trace);
}
EXPORT_SYMBOL_GPL(tracing_on);

/**
 * __trace_puts - write a constant string into the trace buffer.
 * @ip:	   The address of the caller
 * @str:   The constant string to write
 * @size:  The size of the string.
 */
int __trace_puts(unsigned long ip, const char *str, int size)
{
	struct ring_buffer_event *event;
	struct ring_buffer *buffer;
	struct print_entry *entry;
	unsigned long irq_flags;
	int alloc;
	int pc;

	if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
		return 0;

	pc = preempt_count();

	if (unlikely(tracing_selftest_running || tracing_disabled))
		return 0;

	alloc = sizeof(*entry) + size + 2; /* possible \n added */

	local_save_flags(irq_flags);
	buffer = global_trace.trace_buffer.buffer;
	event = trace_buffer_lock_reserve(buffer, TRACE_PRINT, alloc,
					  irq_flags, pc);
	if (!event)
		return 0;

	entry = ring_buffer_event_data(event);
	entry->ip = ip;

	memcpy(&entry->buf, str, size);

	/* Add a newline if necessary */
	if (entry->buf[size - 1] != '\n') {
		entry->buf[size] = '\n';
		entry->buf[size + 1] = '\0';
	} else
		entry->buf[size] = '\0';

	__buffer_unlock_commit(buffer, event);
	ftrace_trace_stack(&global_trace, buffer, irq_flags, 4, pc, NULL);

	return size;
}
EXPORT_SYMBOL_GPL(__trace_puts);

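/*
 * Illustrative caller (not part of this file): the trace_puts() macro
 * in <linux/kernel.h> dispatches here for non-constant strings, as
 * __trace_puts(_THIS_IP_, str, strlen(str)), and to __trace_bputs()
 * below when the string is a build-time constant.
 */
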
/**
 * __trace_bputs - write the pointer to a constant string into trace buffer
 * @ip:	   The address of the caller
 * @str:   The constant string to write to the buffer to
 */
int __trace_bputs(unsigned long ip, const char *str)
{
	struct ring_buffer_event *event;
	struct ring_buffer *buffer;
	struct bputs_entry *entry;
	unsigned long irq_flags;
	int size = sizeof(struct bputs_entry);
	int pc;

	if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
		return 0;

	pc = preempt_count();

	if (unlikely(tracing_selftest_running || tracing_disabled))
		return 0;

	local_save_flags(irq_flags);
	buffer = global_trace.trace_buffer.buffer;
	event = trace_buffer_lock_reserve(buffer, TRACE_BPUTS, size,
					  irq_flags, pc);
	if (!event)
		return 0;

	entry = ring_buffer_event_data(event);
	entry->ip  = ip;
	entry->str = str;

	__buffer_unlock_commit(buffer, event);
	ftrace_trace_stack(&global_trace, buffer, irq_flags, 4, pc, NULL);

	return 1;
}
EXPORT_SYMBOL_GPL(__trace_bputs);

#ifdef CONFIG_TRACER_SNAPSHOT
/**
 * tracing_snapshot - take a snapshot of the current buffer.
 *
 * This causes a swap between the snapshot buffer and the current live
 * tracing buffer. You can use this to take snapshots of the live
 * trace when some condition is triggered, but continue to trace.
 *
 * Note, make sure to allocate the snapshot with either
 * a tracing_snapshot_alloc(), or by doing it manually
 * with: echo 1 > /sys/kernel/debug/tracing/snapshot
 *
 * If the snapshot buffer is not allocated, it will stop tracing.
 * Basically making a permanent snapshot.
 */
void tracing_snapshot(void)
{
	struct trace_array *tr = &global_trace;
	struct tracer *tracer = tr->current_trace;
	unsigned long flags;

	if (in_nmi()) {
		internal_trace_puts("*** SNAPSHOT CALLED FROM NMI CONTEXT ***\n");
		internal_trace_puts("*** snapshot is being ignored        ***\n");
		return;
	}

	if (!tr->allocated_snapshot) {
		internal_trace_puts("*** SNAPSHOT NOT ALLOCATED ***\n");
		internal_trace_puts("*** stopping trace here!   ***\n");
		tracing_off();
		return;
	}

	/* Note, snapshot can not be used when the tracer uses it */
	if (tracer->use_max_tr) {
		internal_trace_puts("*** LATENCY TRACER ACTIVE ***\n");
		internal_trace_puts("*** Can not use snapshot (sorry) ***\n");
		return;
	}

	local_irq_save(flags);
	update_max_tr(tr, current, smp_processor_id());
	local_irq_restore(flags);
}
EXPORT_SYMBOL_GPL(tracing_snapshot);

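/*
 * Illustrative usage from tracefs (not part of this file):
 *
 *	echo 1 > /sys/kernel/debug/tracing/snapshot	# allocate + snapshot
 *	cat /sys/kernel/debug/tracing/snapshot		# read the frozen copy
 *
 * In-kernel callers typically call tracing_snapshot_alloc() once, then
 * tracing_snapshot() at the interesting moment.
 */
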
static int resize_buffer_duplicate_size(struct trace_buffer *trace_buf,
					struct trace_buffer *size_buf, int cpu_id);
static void set_buffer_entries(struct trace_buffer *buf, unsigned long val);

static int alloc_snapshot(struct trace_array *tr)
{
	int ret;

	if (!tr->allocated_snapshot) {

		/* allocate spare buffer */
		ret = resize_buffer_duplicate_size(&tr->max_buffer,
				   &tr->trace_buffer, RING_BUFFER_ALL_CPUS);
		if (ret < 0)
			return ret;

		tr->allocated_snapshot = true;
	}

	return 0;
}

static void free_snapshot(struct trace_array *tr)
{
	/*
	 * We don't free the ring buffer; instead, we resize it because
	 * the max_tr ring buffer has some state (e.g. ring->clock) and
	 * we want to preserve it.
	 */
	ring_buffer_resize(tr->max_buffer.buffer, 1, RING_BUFFER_ALL_CPUS);
	set_buffer_entries(&tr->max_buffer, 1);
	tracing_reset_online_cpus(&tr->max_buffer);
	tr->allocated_snapshot = false;
}

/**
 * tracing_alloc_snapshot - allocate snapshot buffer.
 *
 * This only allocates the snapshot buffer if it isn't already
 * allocated - it doesn't also take a snapshot.
 *
 * This is meant to be used in cases where the snapshot buffer needs
 * to be set up for events that can't sleep but need to be able to
 * trigger a snapshot.
 */
int tracing_alloc_snapshot(void)
{
	struct trace_array *tr = &global_trace;
	int ret;

	ret = alloc_snapshot(tr);
	WARN_ON(ret < 0);

	return ret;
}
EXPORT_SYMBOL_GPL(tracing_alloc_snapshot);

/**
 * tracing_snapshot_alloc - allocate and take a snapshot of the current buffer.
 *
 * This is similar to tracing_snapshot(), but it will allocate the
 * snapshot buffer if it isn't already allocated. Use this only
 * where it is safe to sleep, as the allocation may sleep.
 *
 * This causes a swap between the snapshot buffer and the current live
 * tracing buffer. You can use this to take snapshots of the live
 * trace when some condition is triggered, but continue to trace.
 */
void tracing_snapshot_alloc(void)
{
	int ret;

	ret = tracing_alloc_snapshot();
	if (ret < 0)
		return;

	tracing_snapshot();
}
EXPORT_SYMBOL_GPL(tracing_snapshot_alloc);
#else
void tracing_snapshot(void)
{
	WARN_ONCE(1, "Snapshot feature not enabled, but internal snapshot used");
}
EXPORT_SYMBOL_GPL(tracing_snapshot);
int tracing_alloc_snapshot(void)
{
	WARN_ONCE(1, "Snapshot feature not enabled, but snapshot allocation used");
	return -ENODEV;
}
EXPORT_SYMBOL_GPL(tracing_alloc_snapshot);
void tracing_snapshot_alloc(void)
{
	/* Give warning */
	tracing_snapshot();
}
EXPORT_SYMBOL_GPL(tracing_snapshot_alloc);
#endif /* CONFIG_TRACER_SNAPSHOT */

static void tracer_tracing_off(struct trace_array *tr)
{
	if (tr->trace_buffer.buffer)
		ring_buffer_record_off(tr->trace_buffer.buffer);
	/*
	 * This flag is looked at when buffers haven't been allocated
	 * yet, or by some tracers (like irqsoff), that just want to
	 * know if the ring buffer has been disabled, but it can handle
	 * races of where it gets disabled but we still do a record.
	 * As the check is in the fast path of the tracers, it is more
	 * important to be fast than accurate.
	 */
	tr->buffer_disabled = 1;
	/* Make the flag seen by readers */
	smp_wmb();
}

/**
 * tracing_off - turn off tracing buffers
 *
 * This function stops the tracing buffers from recording data.
 * It does not disable any overhead the tracers themselves may
 * be causing. This function simply causes all recording to
 * the ring buffers to fail.
 */
void tracing_off(void)
{
	tracer_tracing_off(&global_trace);
}
EXPORT_SYMBOL_GPL(tracing_off);

void disable_trace_on_warning(void)
{
	if (__disable_trace_on_warning)
		tracing_off();
}

/**
 * tracer_tracing_is_on - show real state of ring buffer enabled
 * @tr : the trace array to know if ring buffer is enabled
 *
 * Shows real state of the ring buffer if it is enabled or not.
 */
static int tracer_tracing_is_on(struct trace_array *tr)
{
	if (tr->trace_buffer.buffer)
		return ring_buffer_record_is_on(tr->trace_buffer.buffer);
	return !tr->buffer_disabled;
}

/**
 * tracing_is_on - show state of ring buffers enabled
 */
int tracing_is_on(void)
{
	return tracer_tracing_is_on(&global_trace);
}
EXPORT_SYMBOL_GPL(tracing_is_on);

static int __init set_buf_size(char *str)
{
	unsigned long buf_size;

	if (!str)
		return 0;
	buf_size = memparse(str, &str);
	/* nr_entries can not be zero */
	if (buf_size == 0)
		return 0;
	trace_buf_size = buf_size;
	return 1;
}
__setup("trace_buf_size=", set_buf_size);

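/*
 * Illustrative usage (not part of this file): memparse() accepts the
 * usual size suffixes, so "trace_buf_size=1M" on the command line sets
 * a per-cpu buffer size of 1048576 bytes.
 */
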
static int __init set_tracing_thresh(char *str)
{
	unsigned long threshold;
	int ret;

	if (!str)
		return 0;
	ret = kstrtoul(str, 0, &threshold);
	if (ret < 0)
		return 0;
	tracing_thresh = threshold * 1000;
	return 1;
}
__setup("tracing_thresh=", set_tracing_thresh);

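/*
 * Illustrative usage (not part of this file): "tracing_thresh=100"
 * means 100 microseconds; the "* 1000" above stores the value as
 * nanoseconds to match the ring buffer timestamps.
 */
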
unsigned long nsecs_to_usecs(unsigned long nsecs)
{
	return nsecs / 1000;
}

/*
 * TRACE_FLAGS is defined as a tuple matching bit masks with strings.
 * It uses C(a, b) where 'a' is the enum name and 'b' is the string that
 * matches it. By defining "C(a, b) b", TRACE_FLAGS becomes a list
 * of strings in the order that the enums were defined.
 */
#undef C
#define C(a, b) b

/* These must match the bit positions in trace_iterator_flags */
static const char *trace_options[] = {
	TRACE_FLAGS
	NULL
};

static struct {
	u64 (*func)(void);
	const char *name;
	int in_ns;		/* is this clock in nanoseconds? */
} trace_clocks[] = {
	{ trace_clock_local,		"local",	1 },
	{ trace_clock_global,		"global",	1 },
	{ trace_clock_counter,		"counter",	0 },
	{ trace_clock_jiffies,		"uptime",	0 },
	{ trace_clock,			"perf",		1 },
	{ ktime_get_mono_fast_ns,	"mono",		1 },
	{ ktime_get_raw_fast_ns,	"mono_raw",	1 },
	ARCH_TRACE_CLOCKS
};

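/*
 * Illustrative usage (not part of this file): the names above are what
 * tracefs exposes, e.g.
 *
 *	cat /sys/kernel/debug/tracing/trace_clock
 *	echo mono > /sys/kernel/debug/tracing/trace_clock
 *
 * Clocks with in_ns == 0 ("counter", "uptime") are printed as raw
 * counts rather than sec.usec timestamps.
 */
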
/*
 * trace_parser_get_init - gets the buffer for trace parser
 */
int trace_parser_get_init(struct trace_parser *parser, int size)
{
	memset(parser, 0, sizeof(*parser));

	parser->buffer = kmalloc(size, GFP_KERNEL);
	if (!parser->buffer)
		return 1;

	parser->size = size;
	return 0;
}

/*
 * trace_parser_put - frees the buffer for trace parser
 */
void trace_parser_put(struct trace_parser *parser)
{
	kfree(parser->buffer);
}

/*
 * trace_get_user - reads the user input string separated by space
 * (matched by isspace(ch))
 *
 * For each string found the 'struct trace_parser' is updated,
 * and the function returns.
 *
 * Returns number of bytes read.
 *
 * See kernel/trace/trace.h for 'struct trace_parser' details.
 */
int trace_get_user(struct trace_parser *parser, const char __user *ubuf,
	size_t cnt, loff_t *ppos)
{
	char ch;
	size_t read = 0;
	ssize_t ret;

	if (!*ppos)
		trace_parser_clear(parser);

	ret = get_user(ch, ubuf++);
	if (ret)
		goto out;

	read++;
	cnt--;

	/*
	 * The parser is not finished with the last write,
	 * continue reading the user input without skipping spaces.
	 */
	if (!parser->cont) {
		/* skip white space */
		while (cnt && isspace(ch)) {
			ret = get_user(ch, ubuf++);
			if (ret)
				goto out;
			read++;
			cnt--;
		}

		/* only spaces were written */
		if (isspace(ch)) {
			*ppos += read;
			ret = read;
			goto out;
		}

		parser->idx = 0;
	}

	/* read the non-space input */
	while (cnt && !isspace(ch)) {
		if (parser->idx < parser->size - 1)
			parser->buffer[parser->idx++] = ch;
		else {
			ret = -EINVAL;
			goto out;
		}
		ret = get_user(ch, ubuf++);
		if (ret)
			goto out;
		read++;
		cnt--;
	}

	/* We either got finished input or we have to wait for another call. */
	if (isspace(ch)) {
		parser->buffer[parser->idx] = 0;
		parser->cont = false;
	} else if (parser->idx < parser->size - 1) {
		parser->cont = true;
		parser->buffer[parser->idx++] = ch;
	} else {
		ret = -EINVAL;
		goto out;
	}

	*ppos += read;
	ret = read;

out:
	return ret;
}

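/*
 * Illustrative flow (not part of this file): writing "foo bar" to a
 * tracefs file that uses this parser yields "foo" on the first call
 * (parser->cont == false) and "bar" on the next; a word split across
 * two write() calls is stitched back together via parser->cont.
 */
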
/* TODO add a seq_buf_to_buffer() */
static ssize_t trace_seq_to_buffer(struct trace_seq *s, void *buf, size_t cnt)
{
	int len;

	if (trace_seq_used(s) <= s->seq.readpos)
		return -EBUSY;

	len = trace_seq_used(s) - s->seq.readpos;
	if (cnt > len)
		cnt = len;
	memcpy(buf, s->buffer + s->seq.readpos, cnt);

	s->seq.readpos += cnt;
	return cnt;
}

unsigned long __read_mostly	tracing_thresh;

#ifdef CONFIG_TRACER_MAX_TRACE
/*
 * Copy the new maximum trace into the separate maximum-trace
 * structure. (this way the maximum trace is permanently saved,
 * for later retrieval via /sys/kernel/debug/tracing/latency_trace)
 */
static void
__update_max_tr(struct trace_array *tr, struct task_struct *tsk, int cpu)
{
	struct trace_buffer *trace_buf = &tr->trace_buffer;
	struct trace_buffer *max_buf = &tr->max_buffer;
	struct trace_array_cpu *data = per_cpu_ptr(trace_buf->data, cpu);
	struct trace_array_cpu *max_data = per_cpu_ptr(max_buf->data, cpu);

	max_buf->cpu = cpu;
	max_buf->time_start = data->preempt_timestamp;

	max_data->saved_latency = tr->max_latency;
	max_data->critical_start = data->critical_start;
	max_data->critical_end = data->critical_end;

	memcpy(max_data->comm, tsk->comm, TASK_COMM_LEN);
	max_data->pid = tsk->pid;
	/*
	 * If tsk == current, then use current_uid(), as that does not use
	 * RCU. The irq tracer can be called out of RCU scope.
	 */
	if (tsk == current)
		max_data->uid = current_uid();
	else
		max_data->uid = task_uid(tsk);

	max_data->nice = tsk->static_prio - 20 - MAX_RT_PRIO;
	max_data->policy = tsk->policy;
	max_data->rt_priority = tsk->rt_priority;

	/* record this task's comm */
	tracing_record_cmdline(tsk);
}

/**
 * update_max_tr - snapshot all trace buffers from global_trace to max_tr
 * @tr: tracer
 * @tsk: the task with the latency
 * @cpu: The cpu that initiated the trace.
 *
 * Flip the buffers between the @tr and the max_tr and record information
 * about which task was the cause of this latency.
 */
void
update_max_tr(struct trace_array *tr, struct task_struct *tsk, int cpu)
{
	struct ring_buffer *buf;

	if (tr->stop_count)
		return;

	WARN_ON_ONCE(!irqs_disabled());

	if (!tr->allocated_snapshot) {
		/* Only the nop tracer should hit this when disabling */
		WARN_ON_ONCE(tr->current_trace != &nop_trace);
		return;
	}

	arch_spin_lock(&tr->max_lock);

	buf = tr->trace_buffer.buffer;
	tr->trace_buffer.buffer = tr->max_buffer.buffer;
	tr->max_buffer.buffer = buf;

	__update_max_tr(tr, tsk, cpu);
	arch_spin_unlock(&tr->max_lock);
}

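/*
 * Note the swap above is pointer-only: the live buffer and the max
 * buffer exchange places wholesale, so saving a "max" snapshot costs
 * two pointer writes rather than a copy of every trace entry.
 */
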
/**
 * update_max_tr_single - only copy one trace over, and reset the rest
 * @tr - tracer
 * @tsk - task with the latency
 * @cpu - the cpu of the buffer to copy.
 *
 * Flip the trace of a single CPU buffer between the @tr and the max_tr.
 */
void
update_max_tr_single(struct trace_array *tr, struct task_struct *tsk, int cpu)
{
	int ret;

	if (tr->stop_count)
		return;

	WARN_ON_ONCE(!irqs_disabled());
	if (!tr->allocated_snapshot) {
		/* Only the nop tracer should hit this when disabling */
		WARN_ON_ONCE(tr->current_trace != &nop_trace);
		return;
	}

	arch_spin_lock(&tr->max_lock);

	ret = ring_buffer_swap_cpu(tr->max_buffer.buffer, tr->trace_buffer.buffer, cpu);

	if (ret == -EBUSY) {
		/*
		 * We failed to swap the buffer due to a commit taking
		 * place on this CPU. We fail to record, but we reset
		 * the max trace buffer (no one writes directly to it)
		 * and flag that it failed.
		 */
		trace_array_printk_buf(tr->max_buffer.buffer, _THIS_IP_,
			"Failed to swap buffers due to commit in progress\n");
	}

	WARN_ON_ONCE(ret && ret != -EAGAIN && ret != -EBUSY);

	__update_max_tr(tr, tsk, cpu);
	arch_spin_unlock(&tr->max_lock);
}
#endif /* CONFIG_TRACER_MAX_TRACE */

static int wait_on_pipe(struct trace_iterator *iter, bool full)
{
	/* Iterators are static, they should be filled or empty */
	if (trace_buffer_iter(iter, iter->cpu_file))
		return 0;

	return ring_buffer_wait(iter->trace_buffer->buffer, iter->cpu_file,
				full);
}

#ifdef CONFIG_FTRACE_STARTUP_TEST
static int run_tracer_selftest(struct tracer *type)
{
	struct trace_array *tr = &global_trace;
	struct tracer *saved_tracer = tr->current_trace;
	int ret;

	if (!type->selftest || tracing_selftest_disabled)
		return 0;

	/*
	 * Run a selftest on this tracer.
	 * Here we reset the trace buffer, and set the current
	 * tracer to be this tracer. The tracer can then run some
	 * internal tracing to verify that everything is in order.
	 * If we fail, we do not register this tracer.
	 */
	tracing_reset_online_cpus(&tr->trace_buffer);

	tr->current_trace = type;

#ifdef CONFIG_TRACER_MAX_TRACE
	if (type->use_max_tr) {
		/* If we expanded the buffers, make sure the max is expanded too */
		if (ring_buffer_expanded)
			ring_buffer_resize(tr->max_buffer.buffer, trace_buf_size,
					   RING_BUFFER_ALL_CPUS);
		tr->allocated_snapshot = true;
	}
#endif

	/* the test is responsible for initializing and enabling */
	pr_info("Testing tracer %s: ", type->name);
	ret = type->selftest(type, tr);
	/* the test is responsible for resetting too */
	tr->current_trace = saved_tracer;
	if (ret) {
		printk(KERN_CONT "FAILED!\n");
		/* Add the warning after printing 'FAILED' */
		WARN_ON(1);
		return -1;
	}
	/* Only reset on passing, to avoid touching corrupted buffers */
	tracing_reset_online_cpus(&tr->trace_buffer);

#ifdef CONFIG_TRACER_MAX_TRACE
	if (type->use_max_tr) {
		tr->allocated_snapshot = false;

		/* Shrink the max buffer again */
		if (ring_buffer_expanded)
			ring_buffer_resize(tr->max_buffer.buffer, 1,
					   RING_BUFFER_ALL_CPUS);
	}
#endif

	printk(KERN_CONT "PASSED\n");
	return 0;
}
#else
static inline int run_tracer_selftest(struct tracer *type)
{
	return 0;
}
#endif /* CONFIG_FTRACE_STARTUP_TEST */

static void add_tracer_options(struct trace_array *tr, struct tracer *t);

static void __init apply_trace_boot_options(void);

/**
 * register_tracer - register a tracer with the ftrace system.
 * @type - the plugin for the tracer
 *
 * Register a new plugin tracer.
 */
int __init register_tracer(struct tracer *type)
{
	struct tracer *t;
	int ret = 0;

	if (!type->name) {
		pr_info("Tracer must have a name\n");
		return -1;
	}

	if (strlen(type->name) >= MAX_TRACER_SIZE) {
		pr_info("Tracer has a name longer than %d\n", MAX_TRACER_SIZE);
		return -1;
	}

	mutex_lock(&trace_types_lock);

	tracing_selftest_running = true;

	for (t = trace_types; t; t = t->next) {
		if (strcmp(type->name, t->name) == 0) {
			/* already found */
			pr_info("Tracer %s already registered\n",
				type->name);
			ret = -1;
			goto out;
		}
	}

	if (!type->set_flag)
		type->set_flag = &dummy_set_flag;
	if (!type->flags) {
		/* allocate a dummy tracer_flags */
		type->flags = kmalloc(sizeof(*type->flags), GFP_KERNEL);
		if (!type->flags) {
			ret = -ENOMEM;
			goto out;
		}
		type->flags->val = 0;
		type->flags->opts = dummy_tracer_opt;
	} else
		if (!type->flags->opts)
			type->flags->opts = dummy_tracer_opt;

	/* store the tracer for __set_tracer_option */
	type->flags->trace = type;

	ret = run_tracer_selftest(type);
	if (ret < 0)
		goto out;

	type->next = trace_types;
	trace_types = type;
	add_tracer_options(&global_trace, type);

 out:
	tracing_selftest_running = false;
	mutex_unlock(&trace_types_lock);

	if (ret || !default_bootup_tracer)
		goto out_unlock;

	if (strncmp(default_bootup_tracer, type->name, MAX_TRACER_SIZE))
		goto out_unlock;

	printk(KERN_INFO "Starting tracer '%s'\n", type->name);
	/* Do we want this tracer to start on bootup? */
	tracing_set_tracer(&global_trace, type->name);
	default_bootup_tracer = NULL;

	apply_trace_boot_options();

	/* disable other selftests, since this will break it. */
	tracing_selftest_disabled = true;
#ifdef CONFIG_FTRACE_STARTUP_TEST
	printk(KERN_INFO "Disabling FTRACE selftests due to running tracer '%s'\n",
	       type->name);
#endif

 out_unlock:
	return ret;
}

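/*
 * Minimal registration sketch (illustrative, not part of this file;
 * "my_tracer" and "my_trace_init" are made-up names):
 *
 *	static struct tracer my_tracer __read_mostly = {
 *		.name	= "mytracer",
 *		.init	= my_trace_init,
 *	};
 *
 *	static __init int my_tracer_setup(void)
 *	{
 *		return register_tracer(&my_tracer);
 *	}
 *	core_initcall(my_tracer_setup);
 *
 * register_tracer() is __init, so registration must happen at boot.
 */
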
void tracing_reset(struct trace_buffer *buf, int cpu)
{
	struct ring_buffer *buffer = buf->buffer;

	if (!buffer)
		return;

	ring_buffer_record_disable(buffer);

	/* Make sure all commits have finished */
	synchronize_sched();
	ring_buffer_reset_cpu(buffer, cpu);

	ring_buffer_record_enable(buffer);
}

void tracing_reset_online_cpus(struct trace_buffer *buf)
{
	struct ring_buffer *buffer = buf->buffer;
	int cpu;

	if (!buffer)
		return;

	ring_buffer_record_disable(buffer);

	/* Make sure all commits have finished */
	synchronize_sched();

	buf->time_start = buffer_ftrace_now(buf, buf->cpu);

	for_each_online_cpu(cpu)
		ring_buffer_reset_cpu(buffer, cpu);

	ring_buffer_record_enable(buffer);
}

/* Must have trace_types_lock held */
void tracing_reset_all_online_cpus(void)
{
	struct trace_array *tr;

	list_for_each_entry(tr, &ftrace_trace_arrays, list) {
		tracing_reset_online_cpus(&tr->trace_buffer);
#ifdef CONFIG_TRACER_MAX_TRACE
		tracing_reset_online_cpus(&tr->max_buffer);
#endif
	}
}

#define SAVED_CMDLINES_DEFAULT 128
#define NO_CMDLINE_MAP UINT_MAX
static arch_spinlock_t trace_cmdline_lock = __ARCH_SPIN_LOCK_UNLOCKED;
struct saved_cmdlines_buffer {
	unsigned map_pid_to_cmdline[PID_MAX_DEFAULT+1];
	unsigned *map_cmdline_to_pid;
	unsigned cmdline_num;
	int cmdline_idx;
	char *saved_cmdlines;
};
static struct saved_cmdlines_buffer *savedcmd;

/* temporary disable recording */
static atomic_t trace_record_cmdline_disabled __read_mostly;

static inline char *get_saved_cmdlines(int idx)
{
	return &savedcmd->saved_cmdlines[idx * TASK_COMM_LEN];
}

static inline void set_cmdline(int idx, const char *cmdline)
{
	memcpy(get_saved_cmdlines(idx), cmdline, TASK_COMM_LEN);
}

static int allocate_cmdlines_buffer(unsigned int val,
				    struct saved_cmdlines_buffer *s)
{
	s->map_cmdline_to_pid = kmalloc(val * sizeof(*s->map_cmdline_to_pid),
					GFP_KERNEL);
	if (!s->map_cmdline_to_pid)
		return -ENOMEM;

	s->saved_cmdlines = kmalloc(val * TASK_COMM_LEN, GFP_KERNEL);
	if (!s->saved_cmdlines) {
		kfree(s->map_cmdline_to_pid);
		return -ENOMEM;
	}

	s->cmdline_idx = 0;
	s->cmdline_num = val;
	memset(&s->map_pid_to_cmdline, NO_CMDLINE_MAP,
	       sizeof(s->map_pid_to_cmdline));
	memset(s->map_cmdline_to_pid, NO_CMDLINE_MAP,
	       val * sizeof(*s->map_cmdline_to_pid));

	return 0;
}

static int trace_create_savedcmd(void)
{
	int ret;

	savedcmd = kmalloc(sizeof(*savedcmd), GFP_KERNEL);
	if (!savedcmd)
		return -ENOMEM;

	ret = allocate_cmdlines_buffer(SAVED_CMDLINES_DEFAULT, savedcmd);
	if (ret < 0) {
		kfree(savedcmd);
		savedcmd = NULL;
		return -ENOMEM;
	}

	return 0;
}

int is_tracing_stopped(void)
{
	return global_trace.stop_count;
}

/**
 * tracing_start - quick start of the tracer
 *
 * If tracing is enabled but was stopped by tracing_stop,
 * this will start the tracer back up.
 */
void tracing_start(void)
{
	struct ring_buffer *buffer;
	unsigned long flags;

	if (tracing_disabled)
		return;

	raw_spin_lock_irqsave(&global_trace.start_lock, flags);
	if (--global_trace.stop_count) {
		if (global_trace.stop_count < 0) {
			/* Someone screwed up their debugging */
			WARN_ON_ONCE(1);
			global_trace.stop_count = 0;
		}
		goto out;
	}

	/* Prevent the buffers from switching */
	arch_spin_lock(&global_trace.max_lock);

	buffer = global_trace.trace_buffer.buffer;
	if (buffer)
		ring_buffer_record_enable(buffer);

#ifdef CONFIG_TRACER_MAX_TRACE
	buffer = global_trace.max_buffer.buffer;
	if (buffer)
		ring_buffer_record_enable(buffer);
#endif

	arch_spin_unlock(&global_trace.max_lock);

 out:
	raw_spin_unlock_irqrestore(&global_trace.start_lock, flags);
}

static void tracing_start_tr(struct trace_array *tr)
{
	struct ring_buffer *buffer;
	unsigned long flags;

	if (tracing_disabled)
		return;

	/* If global, we need to also start the max tracer */
	if (tr->flags & TRACE_ARRAY_FL_GLOBAL)
		return tracing_start();

	raw_spin_lock_irqsave(&tr->start_lock, flags);

	if (--tr->stop_count) {
		if (tr->stop_count < 0) {
			/* Someone screwed up their debugging */
			WARN_ON_ONCE(1);
			tr->stop_count = 0;
		}
		goto out;
	}

	buffer = tr->trace_buffer.buffer;
	if (buffer)
		ring_buffer_record_enable(buffer);

 out:
	raw_spin_unlock_irqrestore(&tr->start_lock, flags);
}

/**
 * tracing_stop - quick stop of the tracer
 *
 * Light weight way to stop tracing. Use in conjunction with
 * tracing_start.
 */
void tracing_stop(void)
{
	struct ring_buffer *buffer;
	unsigned long flags;

	raw_spin_lock_irqsave(&global_trace.start_lock, flags);
	if (global_trace.stop_count++)
		goto out;

	/* Prevent the buffers from switching */
	arch_spin_lock(&global_trace.max_lock);

	buffer = global_trace.trace_buffer.buffer;
	if (buffer)
		ring_buffer_record_disable(buffer);

#ifdef CONFIG_TRACER_MAX_TRACE
	buffer = global_trace.max_buffer.buffer;
	if (buffer)
		ring_buffer_record_disable(buffer);
#endif

	arch_spin_unlock(&global_trace.max_lock);

 out:
	raw_spin_unlock_irqrestore(&global_trace.start_lock, flags);
}

static void tracing_stop_tr(struct trace_array *tr)
{
	struct ring_buffer *buffer;
	unsigned long flags;

	/* If global, we need to also stop the max tracer */
	if (tr->flags & TRACE_ARRAY_FL_GLOBAL)
		return tracing_stop();

	raw_spin_lock_irqsave(&tr->start_lock, flags);
	if (tr->stop_count++)
		goto out;

	buffer = tr->trace_buffer.buffer;
	if (buffer)
		ring_buffer_record_disable(buffer);

 out:
	raw_spin_unlock_irqrestore(&tr->start_lock, flags);
}

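/*
 * tracing_start()/tracing_stop() nest: stop_count is a depth counter,
 * so recording only resumes once every tracing_stop() has been paired
 * with a matching tracing_start().
 */
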
void trace_stop_cmdline_recording(void);

static int trace_save_cmdline(struct task_struct *tsk)
{
	unsigned pid, idx;

	if (!tsk->pid || unlikely(tsk->pid > PID_MAX_DEFAULT))
		return 0;

	/*
	 * It's not the end of the world if we don't get
	 * the lock, but we also don't want to spin
	 * nor do we want to disable interrupts,
	 * so if we miss here, then better luck next time.
	 */
	if (!arch_spin_trylock(&trace_cmdline_lock))
		return 0;

	idx = savedcmd->map_pid_to_cmdline[tsk->pid];
	if (idx == NO_CMDLINE_MAP) {
		idx = (savedcmd->cmdline_idx + 1) % savedcmd->cmdline_num;

		/*
		 * Check whether the cmdline buffer at idx has a pid
		 * mapped. We are going to overwrite that entry so we
		 * need to clear the map_pid_to_cmdline. Otherwise we
		 * would read the new comm for the old pid.
		 */
		pid = savedcmd->map_cmdline_to_pid[idx];
		if (pid != NO_CMDLINE_MAP)
			savedcmd->map_pid_to_cmdline[pid] = NO_CMDLINE_MAP;

		savedcmd->map_cmdline_to_pid[idx] = tsk->pid;
		savedcmd->map_pid_to_cmdline[tsk->pid] = idx;

		savedcmd->cmdline_idx = idx;
	}

	set_cmdline(idx, tsk->comm);

	arch_spin_unlock(&trace_cmdline_lock);

	return 1;
}

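/*
 * The cache is a small ring (SAVED_CMDLINES_DEFAULT entries) with two
 * index arrays, so both pid -> comm and slot -> pid lookups are O(1);
 * evicting a slot therefore also clears the evicted pid's mapping, as
 * the comment above describes.
 */
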
static void __trace_find_cmdline(int pid, char comm[])
{
	unsigned map;

	if (!pid) {
		strcpy(comm, "<idle>");
		return;
	}

	if (WARN_ON_ONCE(pid < 0)) {
		strcpy(comm, "<XXX>");
		return;
	}

	if (pid > PID_MAX_DEFAULT) {
		strcpy(comm, "<...>");
		return;
	}

	map = savedcmd->map_pid_to_cmdline[pid];
	if (map != NO_CMDLINE_MAP)
		strcpy(comm, get_saved_cmdlines(map));
	else
		strcpy(comm, "<...>");
}

void trace_find_cmdline(int pid, char comm[])
{
	preempt_disable();
	arch_spin_lock(&trace_cmdline_lock);

	__trace_find_cmdline(pid, comm);

	arch_spin_unlock(&trace_cmdline_lock);
	preempt_enable();
}

void tracing_record_cmdline(struct task_struct *tsk)
{
	if (atomic_read(&trace_record_cmdline_disabled) || !tracing_is_on())
		return;

	if (!__this_cpu_read(trace_cmdline_save))
		return;

	if (trace_save_cmdline(tsk))
		__this_cpu_write(trace_cmdline_save, false);
}

void
tracing_generic_entry_update(struct trace_entry *entry, unsigned long flags,
			     int pc)
{
	struct task_struct *tsk = current;

	entry->preempt_count	= pc & 0xff;
	entry->pid		= (tsk) ? tsk->pid : 0;
	entry->flags =
#ifdef CONFIG_TRACE_IRQFLAGS_SUPPORT
		(irqs_disabled_flags(flags) ? TRACE_FLAG_IRQS_OFF : 0) |
#else
		TRACE_FLAG_IRQS_NOSUPPORT |
#endif
		((pc & NMI_MASK    ) ? TRACE_FLAG_NMI     : 0) |
		((pc & HARDIRQ_MASK) ? TRACE_FLAG_HARDIRQ : 0) |
		((pc & SOFTIRQ_MASK) ? TRACE_FLAG_SOFTIRQ : 0) |
		(tif_need_resched() ? TRACE_FLAG_NEED_RESCHED : 0) |
		(test_preempt_need_resched() ? TRACE_FLAG_PREEMPT_RESCHED : 0);
}
EXPORT_SYMBOL_GPL(tracing_generic_entry_update);

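/*
 * Every entry thus carries its context compactly: the low byte of the
 * preempt count plus flag bits for irq/softirq/NMI and resched state,
 * which is what the latency-format output columns (e.g. "d.h1") decode
 * when printing a trace.
 */
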
struct ring_buffer_event *
trace_buffer_lock_reserve(struct ring_buffer *buffer,
			  int type,
			  unsigned long len,
			  unsigned long flags, int pc)
{
	struct ring_buffer_event *event;

	event = ring_buffer_lock_reserve(buffer, len);
	if (event != NULL) {
		struct trace_entry *ent = ring_buffer_event_data(event);

		tracing_generic_entry_update(ent, flags, pc);
		ent->type = type;
	}

	return event;
}

void
__buffer_unlock_commit(struct ring_buffer *buffer, struct ring_buffer_event *event)
{
	__this_cpu_write(trace_cmdline_save, true);
	ring_buffer_unlock_commit(buffer, event);
}

void trace_buffer_unlock_commit(struct trace_array *tr,
				struct ring_buffer *buffer,
				struct ring_buffer_event *event,
				unsigned long flags, int pc)
{
	__buffer_unlock_commit(buffer, event);

	ftrace_trace_stack(tr, buffer, flags, 6, pc, NULL);
	ftrace_trace_userstack(buffer, flags, pc);
}
EXPORT_SYMBOL_GPL(trace_buffer_unlock_commit);

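/*
 * Illustrative write path (not part of this file): every event follows
 * reserve -> fill -> commit, e.g.
 *
 *	event = trace_buffer_lock_reserve(buffer, TRACE_FN,
 *					  sizeof(*entry), flags, pc);
 *	if (event) {
 *		entry = ring_buffer_event_data(event);
 *		entry->ip = ip;			// fill the event payload
 *		__buffer_unlock_commit(buffer, event);
 *	}
 *
 * which is exactly the shape trace_function() below takes.
 */
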
static struct ring_buffer *temp_buffer;

struct ring_buffer_event *
trace_event_buffer_lock_reserve(struct ring_buffer **current_rb,
				struct trace_event_file *trace_file,
				int type, unsigned long len,
				unsigned long flags, int pc)
{
	struct ring_buffer_event *entry;

	*current_rb = trace_file->tr->trace_buffer.buffer;
	entry = trace_buffer_lock_reserve(*current_rb,
					  type, len, flags, pc);
	/*
	 * If tracing is off, but we have triggers enabled
	 * we still need to look at the event data. Use the temp_buffer
	 * to store the trace event for the trigger to use. It's recursion
	 * safe and will not be recorded anywhere.
	 */
	if (!entry && trace_file->flags & EVENT_FILE_FL_TRIGGER_COND) {
		*current_rb = temp_buffer;
		entry = trace_buffer_lock_reserve(*current_rb,
						  type, len, flags, pc);
	}
	return entry;
}
EXPORT_SYMBOL_GPL(trace_event_buffer_lock_reserve);

struct ring_buffer_event *
trace_current_buffer_lock_reserve(struct ring_buffer **current_rb,
				  int type, unsigned long len,
				  unsigned long flags, int pc)
{
	*current_rb = global_trace.trace_buffer.buffer;
	return trace_buffer_lock_reserve(*current_rb,
					 type, len, flags, pc);
}
EXPORT_SYMBOL_GPL(trace_current_buffer_lock_reserve);

void trace_buffer_unlock_commit_regs(struct trace_array *tr,
				     struct ring_buffer *buffer,
				     struct ring_buffer_event *event,
				     unsigned long flags, int pc,
				     struct pt_regs *regs)
{
	__buffer_unlock_commit(buffer, event);

	ftrace_trace_stack(tr, buffer, flags, 0, pc, regs);
	ftrace_trace_userstack(buffer, flags, pc);
}
EXPORT_SYMBOL_GPL(trace_buffer_unlock_commit_regs);

void trace_current_buffer_discard_commit(struct ring_buffer *buffer,
					 struct ring_buffer_event *event)
{
	ring_buffer_discard_commit(buffer, event);
}
EXPORT_SYMBOL_GPL(trace_current_buffer_discard_commit);

void
trace_function(struct trace_array *tr,
	       unsigned long ip, unsigned long parent_ip, unsigned long flags,
	       int pc)
{
	struct trace_event_call *call = &event_function;
	struct ring_buffer *buffer = tr->trace_buffer.buffer;
	struct ring_buffer_event *event;
	struct ftrace_entry *entry;

	event = trace_buffer_lock_reserve(buffer, TRACE_FN, sizeof(*entry),
					  flags, pc);
	if (!event)
		return;
	entry = ring_buffer_event_data(event);
	entry->ip		= ip;
	entry->parent_ip	= parent_ip;

	if (!call_filter_check_discard(call, entry, buffer, event))
		__buffer_unlock_commit(buffer, event);
}

c0a0d0d3 1794#ifdef CONFIG_STACKTRACE
4a9bd3f1
SR
1795
1796#define FTRACE_STACK_MAX_ENTRIES (PAGE_SIZE / sizeof(unsigned long))
1797struct ftrace_stack {
1798 unsigned long calls[FTRACE_STACK_MAX_ENTRIES];
1799};
1800
1801static DEFINE_PER_CPU(struct ftrace_stack, ftrace_stack);
1802static DEFINE_PER_CPU(int, ftrace_stack_reserve);
1803
e77405ad 1804static void __ftrace_trace_stack(struct ring_buffer *buffer,
53614991 1805 unsigned long flags,
1fd8df2c 1806 int skip, int pc, struct pt_regs *regs)
86387f7e 1807{
2425bcb9 1808 struct trace_event_call *call = &event_kernel_stack;
3928a8a2 1809 struct ring_buffer_event *event;
777e208d 1810 struct stack_entry *entry;
86387f7e 1811 struct stack_trace trace;
4a9bd3f1
SR
1812 int use_stack;
1813 int size = FTRACE_STACK_ENTRIES;
1814
1815 trace.nr_entries = 0;
1816 trace.skip = skip;
1817
1818 /*
1819 * Since events can happen in NMIs there's no safe way to
1820 * use the per cpu ftrace_stacks. We reserve it and if an interrupt
1821 * or NMI comes in, it will just have to use the default
1822 * FTRACE_STACK_ENTRIES entries stored in the event itself.
1823 */
1824 preempt_disable_notrace();
1825
82146529 1826 use_stack = __this_cpu_inc_return(ftrace_stack_reserve);
4a9bd3f1
SR
1827 /*
1828 * We don't need any atomic variables, just a barrier.
1829 * If an interrupt comes in, we don't care, because it would
1830 * have exited and put the counter back to what we want.
1831 * We just need a barrier to keep gcc from moving things
1832 * around.
1833 */
1834 barrier();
1835 if (use_stack == 1) {
bdffd893 1836 trace.entries = this_cpu_ptr(ftrace_stack.calls);
4a9bd3f1
SR
1837 trace.max_entries = FTRACE_STACK_MAX_ENTRIES;
1838
1839 if (regs)
1840 save_stack_trace_regs(regs, &trace);
1841 else
1842 save_stack_trace(&trace);
1843
1844 if (trace.nr_entries > size)
1845 size = trace.nr_entries;
1846 } else
1847 /* From now on, use_stack is a boolean */
1848 use_stack = 0;
1849
1850 size *= sizeof(unsigned long);
86387f7e 1851
e77405ad 1852 event = trace_buffer_lock_reserve(buffer, TRACE_STACK,
4a9bd3f1 1853 sizeof(*entry) + size, flags, pc);
3928a8a2 1854 if (!event)
4a9bd3f1
SR
1855 goto out;
1856 entry = ring_buffer_event_data(event);
86387f7e 1857
4a9bd3f1
SR
1858 memset(&entry->caller, 0, size);
1859
1860 if (use_stack)
1861 memcpy(&entry->caller, trace.entries,
1862 trace.nr_entries * sizeof(unsigned long));
1863 else {
1864 trace.max_entries = FTRACE_STACK_ENTRIES;
1865 trace.entries = entry->caller;
1866 if (regs)
1867 save_stack_trace_regs(regs, &trace);
1868 else
1869 save_stack_trace(&trace);
1870 }
1871
1872 entry->size = trace.nr_entries;
86387f7e 1873
f306cc82 1874 if (!call_filter_check_discard(call, entry, buffer, event))
7ffbd48d 1875 __buffer_unlock_commit(buffer, event);
4a9bd3f1
SR
1876
1877 out:
1878 /* Again, don't let gcc optimize things here */
1879 barrier();
82146529 1880 __this_cpu_dec(ftrace_stack_reserve);
4a9bd3f1
SR
1881 preempt_enable_notrace();
1882
f0a920d5
IM
1883}
1884
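/*
 * Aside (a sketch, not part of trace.c): the nesting counter used by
 * __ftrace_trace_stack() above, reduced to its core. The first context
 * on a CPU to take the reservation owns the large per-cpu scratch
 * area; a nested interrupt or NMI sees a count > 1 and must fall back
 * to a smaller buffer. "my_scratch" and "my_scratch_reserve" are
 * hypothetical names.
 */
static DEFINE_PER_CPU(struct ftrace_stack, my_scratch);
static DEFINE_PER_CPU(int, my_scratch_reserve);

static void example_use_scratch(void)
{
	int nesting;

	preempt_disable_notrace();
	nesting = __this_cpu_inc_return(my_scratch_reserve);
	barrier();	/* keep gcc from reordering around the counter */

	if (nesting == 1) {
		/* Sole owner: the per-cpu scratch area is safe to use. */
		unsigned long *calls = this_cpu_ptr(my_scratch.calls);

		calls[0] = _THIS_IP_;
	}
	/* else: we interrupted another user; use a fallback buffer */

	barrier();
	__this_cpu_dec(my_scratch_reserve);
	preempt_enable_notrace();
}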
2d34f489
SRRH
1885static inline void ftrace_trace_stack(struct trace_array *tr,
1886 struct ring_buffer *buffer,
73dddbb5
SRRH
1887 unsigned long flags,
1888 int skip, int pc, struct pt_regs *regs)
53614991 1889{
2d34f489 1890 if (!(tr->trace_flags & TRACE_ITER_STACKTRACE))
53614991
SR
1891 return;
1892
73dddbb5 1893 __ftrace_trace_stack(buffer, flags, skip, pc, regs);
53614991
SR
1894}
1895
c0a0d0d3
FW
1896void __trace_stack(struct trace_array *tr, unsigned long flags, int skip,
1897 int pc)
38697053 1898{
12883efb 1899 __ftrace_trace_stack(tr->trace_buffer.buffer, flags, skip, pc, NULL);
38697053
SR
1900}
1901
03889384
SR
1902/**
1903 * trace_dump_stack - record a stack back trace in the trace buffer
c142be8e 1904 * @skip: Number of functions to skip (helper handlers)
03889384 1905 */
c142be8e 1906void trace_dump_stack(int skip)
03889384
SR
1907{
1908 unsigned long flags;
1909
1910 if (tracing_disabled || tracing_selftest_running)
e36c5458 1911 return;
03889384
SR
1912
1913 local_save_flags(flags);
1914
c142be8e
SRRH
1915 /*
1916 * Skip 3 more, which seems to get us to the caller of
1917 * this function.
1918 */
1919 skip += 3;
1920 __ftrace_trace_stack(global_trace.trace_buffer.buffer,
1921 flags, skip, preempt_count(), NULL);
03889384
SR
1922}
1923
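/*
 * Example (illustrative only): trace_dump_stack() is meant to be
 * sprinkled into code under debug, much like trace_printk(). A skip
 * of 0 starts the recorded trace at the immediate caller.
 */
static void example_debug_hook(void)
{
	trace_printk("entered example_debug_hook\n");
	trace_dump_stack(0);	/* record who called us into the ring buffer */
}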
91e86e56
SR
1924static DEFINE_PER_CPU(int, user_stack_count);
1925
e77405ad
SR
1926void
1927ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc)
02b67518 1928{
2425bcb9 1929 struct trace_event_call *call = &event_user_stack;
8d7c6a96 1930 struct ring_buffer_event *event;
02b67518
TE
1931 struct userstack_entry *entry;
1932 struct stack_trace trace;
02b67518 1933
983f938a 1934 if (!(global_trace.trace_flags & TRACE_ITER_USERSTACKTRACE))
02b67518
TE
1935 return;
1936
b6345879
SR
1937 /*
1938 * NMIs cannot handle page faults, even with fixups.
1939 * Saving the user stack can (and often does) fault.
1940 */
1941 if (unlikely(in_nmi()))
1942 return;
02b67518 1943
91e86e56
SR
1944 /*
1945 * prevent recursion, since the user stack tracing may
1946 * trigger other kernel events.
1947 */
1948 preempt_disable();
1949 if (__this_cpu_read(user_stack_count))
1950 goto out;
1951
1952 __this_cpu_inc(user_stack_count);
1953
e77405ad 1954 event = trace_buffer_lock_reserve(buffer, TRACE_USER_STACK,
51a763dd 1955 sizeof(*entry), flags, pc);
02b67518 1956 if (!event)
1dbd1951 1957 goto out_drop_count;
02b67518 1958 entry = ring_buffer_event_data(event);
02b67518 1959
48659d31 1960 entry->tgid = current->tgid;
02b67518
TE
1961 memset(&entry->caller, 0, sizeof(entry->caller));
1962
1963 trace.nr_entries = 0;
1964 trace.max_entries = FTRACE_STACK_ENTRIES;
1965 trace.skip = 0;
1966 trace.entries = entry->caller;
1967
1968 save_stack_trace_user(&trace);
f306cc82 1969 if (!call_filter_check_discard(call, entry, buffer, event))
7ffbd48d 1970 __buffer_unlock_commit(buffer, event);
91e86e56 1971
1dbd1951 1972 out_drop_count:
91e86e56 1973 __this_cpu_dec(user_stack_count);
91e86e56
SR
1974 out:
1975 preempt_enable();
02b67518
TE
1976}
1977
4fd27358
HE
1978#ifdef UNUSED
1979static void __trace_userstack(struct trace_array *tr, unsigned long flags)
02b67518 1980{
7be42151 1981 ftrace_trace_userstack(tr, flags, preempt_count());
02b67518 1982}
4fd27358 1983#endif /* UNUSED */
02b67518 1984
c0a0d0d3
FW
1985#endif /* CONFIG_STACKTRACE */
1986
07d777fe
SR
1987/* created for use with alloc_percpu */
1988struct trace_buffer_struct {
1989 char buffer[TRACE_BUF_SIZE];
1990};
1991
1992static struct trace_buffer_struct *trace_percpu_buffer;
1993static struct trace_buffer_struct *trace_percpu_sirq_buffer;
1994static struct trace_buffer_struct *trace_percpu_irq_buffer;
1995static struct trace_buffer_struct *trace_percpu_nmi_buffer;
1996
1997/*
1998 * The buffer used is dependent on the context. There is a per cpu
1999 * buffer for normal context, softirq context, hard irq context and
2000 * for NMI context. This allows for lockless recording.
2001 *
2002 * Note, if the buffers failed to be allocated, then this returns NULL
2003 */
2004static char *get_trace_buf(void)
2005{
2006 struct trace_buffer_struct *percpu_buffer;
07d777fe
SR
2007
2008 /*
2009 * If we have allocated per cpu buffers, then we do not
2010 * need to do any locking.
2011 */
2012 if (in_nmi())
2013 percpu_buffer = trace_percpu_nmi_buffer;
2014 else if (in_irq())
2015 percpu_buffer = trace_percpu_irq_buffer;
2016 else if (in_softirq())
2017 percpu_buffer = trace_percpu_sirq_buffer;
2018 else
2019 percpu_buffer = trace_percpu_buffer;
2020
2021 if (!percpu_buffer)
2022 return NULL;
2023
d8a0349c 2024 return this_cpu_ptr(&percpu_buffer->buffer[0]);
07d777fe
SR
2025}
2026
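/*
 * Aside (illustrative only): the same context test that get_trace_buf()
 * uses above, on its own. Exactly one branch is taken per call, so each
 * context level gets a private buffer and no locking is needed even
 * when an NMI interrupts a hard irq that interrupted task context.
 */
static const char *example_context_name(void)
{
	if (in_nmi())
		return "nmi";
	else if (in_irq())
		return "hardirq";
	else if (in_softirq())
		return "softirq";
	return "task";
}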
2027static int alloc_percpu_trace_buffer(void)
2028{
2029 struct trace_buffer_struct *buffers;
2030 struct trace_buffer_struct *sirq_buffers;
2031 struct trace_buffer_struct *irq_buffers;
2032 struct trace_buffer_struct *nmi_buffers;
2033
2034 buffers = alloc_percpu(struct trace_buffer_struct);
2035 if (!buffers)
2036 goto err_warn;
2037
2038 sirq_buffers = alloc_percpu(struct trace_buffer_struct);
2039 if (!sirq_buffers)
2040 goto err_sirq;
2041
2042 irq_buffers = alloc_percpu(struct trace_buffer_struct);
2043 if (!irq_buffers)
2044 goto err_irq;
2045
2046 nmi_buffers = alloc_percpu(struct trace_buffer_struct);
2047 if (!nmi_buffers)
2048 goto err_nmi;
2049
2050 trace_percpu_buffer = buffers;
2051 trace_percpu_sirq_buffer = sirq_buffers;
2052 trace_percpu_irq_buffer = irq_buffers;
2053 trace_percpu_nmi_buffer = nmi_buffers;
2054
2055 return 0;
2056
2057 err_nmi:
2058 free_percpu(irq_buffers);
2059 err_irq:
2060 free_percpu(sirq_buffers);
2061 err_sirq:
2062 free_percpu(buffers);
2063 err_warn:
2064 WARN(1, "Could not allocate percpu trace_printk buffer");
2065 return -ENOMEM;
2066}
2067
81698831
SR
2068static int buffers_allocated;
2069
07d777fe
SR
2070void trace_printk_init_buffers(void)
2071{
07d777fe
SR
2072 if (buffers_allocated)
2073 return;
2074
2075 if (alloc_percpu_trace_buffer())
2076 return;
2077
2184db46
SR
2078 /* trace_printk() is for debug use only. Don't use it in production. */
2079
a395d6a7
JP
2080 pr_warn("\n");
2081 pr_warn("**********************************************************\n");
2082 pr_warn("** NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE **\n");
2083 pr_warn("** **\n");
2084 pr_warn("** trace_printk() being used. Allocating extra memory. **\n");
2085 pr_warn("** **\n");
2086 pr_warn("** This means that this is a DEBUG kernel and it is **\n");
2087 pr_warn("** unsafe for production use. **\n");
2088 pr_warn("** **\n");
2089 pr_warn("** If you see this message and you are not debugging **\n");
2090 pr_warn("** the kernel, report this immediately to your vendor! **\n");
2091 pr_warn("** **\n");
2092 pr_warn("** NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE **\n");
2093 pr_warn("**********************************************************\n");
07d777fe 2094
b382ede6
SR
2095 /* Expand the buffers to their configured size */
2096 tracing_update_buffers();
2097
07d777fe 2098 buffers_allocated = 1;
81698831
SR
2099
2100 /*
2101 * trace_printk_init_buffers() can be called by modules.
2102 * If that happens, then we need to start cmdline recording
2103 * directly here. If the global_trace.buffer is already
2104 * allocated here, then this was called by module code.
2105 */
12883efb 2106 if (global_trace.trace_buffer.buffer)
81698831
SR
2107 tracing_start_cmdline_record();
2108}
2109
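/*
 * Example (a sketch, hypothetical caller): any trace_printk() user
 * pays for the per-cpu buffers allocated above, which is why the boot
 * banner is so loud. Typical debug usage from a driver:
 */
static int example_probe(void)
{
	trace_printk("probing, jiffies=%lu\n", jiffies);
	return 0;
}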
2110void trace_printk_start_comm(void)
2111{
2112 /* Start tracing comms if trace printk is set */
2113 if (!buffers_allocated)
2114 return;
2115 tracing_start_cmdline_record();
2116}
2117
2118static void trace_printk_start_stop_comm(int enabled)
2119{
2120 if (!buffers_allocated)
2121 return;
2122
2123 if (enabled)
2124 tracing_start_cmdline_record();
2125 else
2126 tracing_stop_cmdline_record();
07d777fe
SR
2127}
2128
769b0441 2129/**
48ead020 2130 * trace_vbprintk - write binary msg to tracing buffer
769b0441
FW
2131 * @ip: the caller address recorded with the event (@fmt/@args: format and arguments)
2132 */
40ce74f1 2133int trace_vbprintk(unsigned long ip, const char *fmt, va_list args)
769b0441 2134{
2425bcb9 2135 struct trace_event_call *call = &event_bprint;
769b0441 2136 struct ring_buffer_event *event;
e77405ad 2137 struct ring_buffer *buffer;
769b0441 2138 struct trace_array *tr = &global_trace;
48ead020 2139 struct bprint_entry *entry;
769b0441 2140 unsigned long flags;
07d777fe
SR
2141 char *tbuffer;
2142 int len = 0, size, pc;
769b0441
FW
2143
2144 if (unlikely(tracing_selftest_running || tracing_disabled))
2145 return 0;
2146
2147 /* Don't pollute graph traces with trace_vprintk internals */
2148 pause_graph_tracing();
2149
2150 pc = preempt_count();
5168ae50 2151 preempt_disable_notrace();
769b0441 2152
07d777fe
SR
2153 tbuffer = get_trace_buf();
2154 if (!tbuffer) {
2155 len = 0;
769b0441 2156 goto out;
07d777fe 2157 }
769b0441 2158
07d777fe 2159 len = vbin_printf((u32 *)tbuffer, TRACE_BUF_SIZE/sizeof(int), fmt, args);
769b0441 2160
07d777fe
SR
2161 if (len > TRACE_BUF_SIZE/sizeof(int) || len < 0)
2162 goto out;
769b0441 2163
07d777fe 2164 local_save_flags(flags);
769b0441 2165 size = sizeof(*entry) + sizeof(u32) * len;
12883efb 2166 buffer = tr->trace_buffer.buffer;
e77405ad
SR
2167 event = trace_buffer_lock_reserve(buffer, TRACE_BPRINT, size,
2168 flags, pc);
769b0441 2169 if (!event)
07d777fe 2170 goto out;
769b0441
FW
2171 entry = ring_buffer_event_data(event);
2172 entry->ip = ip;
769b0441
FW
2173 entry->fmt = fmt;
2174
07d777fe 2175 memcpy(entry->buf, tbuffer, sizeof(u32) * len);
f306cc82 2176 if (!call_filter_check_discard(call, entry, buffer, event)) {
7ffbd48d 2177 __buffer_unlock_commit(buffer, event);
2d34f489 2178 ftrace_trace_stack(tr, buffer, flags, 6, pc, NULL);
d931369b 2179 }
769b0441 2180
769b0441 2181out:
5168ae50 2182 preempt_enable_notrace();
769b0441
FW
2183 unpause_graph_tracing();
2184
2185 return len;
2186}
48ead020
FW
2187EXPORT_SYMBOL_GPL(trace_vbprintk);
2188
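/*
 * Aside (illustrative only; the exact macro expansion lives in
 * include/linux/kernel.h): roughly how trace_printk() fans out. With
 * format arguments the fast binary path above is used: only the
 * argument words are copied and @fmt is stored as a pointer, to be
 * formatted at read time. A constant string with no arguments is
 * cheaper still and becomes a bputs event.
 */
static void example_printk_paths(int cpu)
{
	trace_printk("binary path: cpu=%d\n", cpu);	/* ~> trace_vbprintk() */
	trace_printk("plain string, no args\n");	/* ~> trace_puts() */
}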
12883efb
SRRH
2189static int
2190__trace_array_vprintk(struct ring_buffer *buffer,
2191 unsigned long ip, const char *fmt, va_list args)
48ead020 2192{
2425bcb9 2193 struct trace_event_call *call = &event_print;
48ead020 2194 struct ring_buffer_event *event;
07d777fe 2195 int len = 0, size, pc;
48ead020 2196 struct print_entry *entry;
07d777fe
SR
2197 unsigned long flags;
2198 char *tbuffer;
48ead020
FW
2199
2200 if (tracing_disabled || tracing_selftest_running)
2201 return 0;
2202
07d777fe
SR
2203 /* Don't pollute graph traces with trace_vprintk internals */
2204 pause_graph_tracing();
2205
48ead020
FW
2206 pc = preempt_count();
2207 preempt_disable_notrace();
48ead020 2208
07d777fe
SR
2209
2210 tbuffer = get_trace_buf();
2211 if (!tbuffer) {
2212 len = 0;
48ead020 2213 goto out;
07d777fe 2214 }
48ead020 2215
3558a5ac 2216 len = vscnprintf(tbuffer, TRACE_BUF_SIZE, fmt, args);
48ead020 2217
07d777fe 2218 local_save_flags(flags);
48ead020 2219 size = sizeof(*entry) + len + 1;
e77405ad 2220 event = trace_buffer_lock_reserve(buffer, TRACE_PRINT, size,
07d777fe 2221 flags, pc);
48ead020 2222 if (!event)
07d777fe 2223 goto out;
48ead020 2224 entry = ring_buffer_event_data(event);
c13d2f7c 2225 entry->ip = ip;
48ead020 2226
3558a5ac 2227 memcpy(&entry->buf, tbuffer, len + 1);
f306cc82 2228 if (!call_filter_check_discard(call, entry, buffer, event)) {
7ffbd48d 2229 __buffer_unlock_commit(buffer, event);
2d34f489 2230 ftrace_trace_stack(&global_trace, buffer, flags, 6, pc, NULL);
d931369b 2231 }
48ead020
FW
2232 out:
2233 preempt_enable_notrace();
07d777fe 2234 unpause_graph_tracing();
48ead020
FW
2235
2236 return len;
2237}
659372d3 2238
12883efb
SRRH
2239int trace_array_vprintk(struct trace_array *tr,
2240 unsigned long ip, const char *fmt, va_list args)
2241{
2242 return __trace_array_vprintk(tr->trace_buffer.buffer, ip, fmt, args);
2243}
2244
2245int trace_array_printk(struct trace_array *tr,
2246 unsigned long ip, const char *fmt, ...)
2247{
2248 int ret;
2249 va_list ap;
2250
983f938a 2251 if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
12883efb
SRRH
2252 return 0;
2253
2254 va_start(ap, fmt);
2255 ret = trace_array_vprintk(tr, ip, fmt, ap);
2256 va_end(ap);
2257 return ret;
2258}
2259
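/*
 * Example (a sketch; "my_tr" is a hypothetical instance, such as the
 * array backing instances/<name> under tracefs): trace_array_printk()
 * writes into a specific trace instance instead of the global buffer.
 */
static void example_instance_printk(struct trace_array *my_tr)
{
	trace_array_printk(my_tr, _THIS_IP_, "instance event: %d\n", 42);
}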
2260int trace_array_printk_buf(struct ring_buffer *buffer,
2261 unsigned long ip, const char *fmt, ...)
2262{
2263 int ret;
2264 va_list ap;
2265
983f938a 2266 if (!(global_trace.trace_flags & TRACE_ITER_PRINTK))
12883efb
SRRH
2267 return 0;
2268
2269 va_start(ap, fmt);
2270 ret = __trace_array_vprintk(buffer, ip, fmt, ap);
2271 va_end(ap);
2272 return ret;
2273}
2274
659372d3
SR
2275int trace_vprintk(unsigned long ip, const char *fmt, va_list args)
2276{
a813a159 2277 return trace_array_vprintk(&global_trace, ip, fmt, args);
659372d3 2278}
769b0441
FW
2279EXPORT_SYMBOL_GPL(trace_vprintk);
2280
e2ac8ef5 2281static void trace_iterator_increment(struct trace_iterator *iter)
5a90f577 2282{
6d158a81
SR
2283 struct ring_buffer_iter *buf_iter = trace_buffer_iter(iter, iter->cpu);
2284
5a90f577 2285 iter->idx++;
6d158a81
SR
2286 if (buf_iter)
2287 ring_buffer_read(buf_iter, NULL);
5a90f577
SR
2288}
2289
e309b41d 2290static struct trace_entry *
bc21b478
SR
2291peek_next_entry(struct trace_iterator *iter, int cpu, u64 *ts,
2292 unsigned long *lost_events)
dd0e545f 2293{
3928a8a2 2294 struct ring_buffer_event *event;
6d158a81 2295 struct ring_buffer_iter *buf_iter = trace_buffer_iter(iter, cpu);
dd0e545f 2296
d769041f
SR
2297 if (buf_iter)
2298 event = ring_buffer_iter_peek(buf_iter, ts);
2299 else
12883efb 2300 event = ring_buffer_peek(iter->trace_buffer->buffer, cpu, ts,
bc21b478 2301 lost_events);
d769041f 2302
4a9bd3f1
SR
2303 if (event) {
2304 iter->ent_size = ring_buffer_event_length(event);
2305 return ring_buffer_event_data(event);
2306 }
2307 iter->ent_size = 0;
2308 return NULL;
dd0e545f 2309}
d769041f 2310
dd0e545f 2311static struct trace_entry *
bc21b478
SR
2312__find_next_entry(struct trace_iterator *iter, int *ent_cpu,
2313 unsigned long *missing_events, u64 *ent_ts)
bc0c38d1 2314{
12883efb 2315 struct ring_buffer *buffer = iter->trace_buffer->buffer;
bc0c38d1 2316 struct trace_entry *ent, *next = NULL;
aa27497c 2317 unsigned long lost_events = 0, next_lost = 0;
b04cc6b1 2318 int cpu_file = iter->cpu_file;
3928a8a2 2319 u64 next_ts = 0, ts;
bc0c38d1 2320 int next_cpu = -1;
12b5da34 2321 int next_size = 0;
bc0c38d1
SR
2322 int cpu;
2323
b04cc6b1
FW
2324 /*
2325 * If we are in a per_cpu trace file, don't bother iterating over
2326 * all CPUs; just peek at this one directly.
2327 */
ae3b5093 2328 if (cpu_file > RING_BUFFER_ALL_CPUS) {
b04cc6b1
FW
2329 if (ring_buffer_empty_cpu(buffer, cpu_file))
2330 return NULL;
bc21b478 2331 ent = peek_next_entry(iter, cpu_file, ent_ts, missing_events);
b04cc6b1
FW
2332 if (ent_cpu)
2333 *ent_cpu = cpu_file;
2334
2335 return ent;
2336 }
2337
ab46428c 2338 for_each_tracing_cpu(cpu) {
dd0e545f 2339
3928a8a2
SR
2340 if (ring_buffer_empty_cpu(buffer, cpu))
2341 continue;
dd0e545f 2342
bc21b478 2343 ent = peek_next_entry(iter, cpu, &ts, &lost_events);
dd0e545f 2344
cdd31cd2
IM
2345 /*
2346 * Pick the entry with the smallest timestamp:
2347 */
3928a8a2 2348 if (ent && (!next || ts < next_ts)) {
bc0c38d1
SR
2349 next = ent;
2350 next_cpu = cpu;
3928a8a2 2351 next_ts = ts;
bc21b478 2352 next_lost = lost_events;
12b5da34 2353 next_size = iter->ent_size;
bc0c38d1
SR
2354 }
2355 }
2356
12b5da34
SR
2357 iter->ent_size = next_size;
2358
bc0c38d1
SR
2359 if (ent_cpu)
2360 *ent_cpu = next_cpu;
2361
3928a8a2
SR
2362 if (ent_ts)
2363 *ent_ts = next_ts;
2364
bc21b478
SR
2365 if (missing_events)
2366 *missing_events = next_lost;
2367
bc0c38d1
SR
2368 return next;
2369}
2370
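/*
 * Aside (illustrative only): __find_next_entry() above is a k-way
 * merge by timestamp across the per-cpu buffers. The same selection
 * loop over plain arrays, for clarity; "ts" and "nonempty" are
 * hypothetical stand-ins for the per-cpu peeks:
 */
static int example_pick_next(u64 *ts, bool *nonempty, int ncpus)
{
	u64 next_ts = 0;
	int next_cpu = -1;
	int cpu;

	for (cpu = 0; cpu < ncpus; cpu++) {
		if (!nonempty[cpu])
			continue;
		if (next_cpu < 0 || ts[cpu] < next_ts) {
			next_cpu = cpu;
			next_ts = ts[cpu];
		}
	}
	return next_cpu;	/* -1 when every buffer is empty */
}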
dd0e545f 2371/* Find the next real entry, without updating the iterator itself */
c4a8e8be
FW
2372struct trace_entry *trace_find_next_entry(struct trace_iterator *iter,
2373 int *ent_cpu, u64 *ent_ts)
bc0c38d1 2374{
bc21b478 2375 return __find_next_entry(iter, ent_cpu, NULL, ent_ts);
dd0e545f
SR
2376}
2377
2378/* Find the next real entry, and increment the iterator to the next entry */
955b61e5 2379void *trace_find_next_entry_inc(struct trace_iterator *iter)
dd0e545f 2380{
bc21b478
SR
2381 iter->ent = __find_next_entry(iter, &iter->cpu,
2382 &iter->lost_events, &iter->ts);
dd0e545f 2383
3928a8a2 2384 if (iter->ent)
e2ac8ef5 2385 trace_iterator_increment(iter);
dd0e545f 2386
3928a8a2 2387 return iter->ent ? iter : NULL;
b3806b43 2388}
bc0c38d1 2389
e309b41d 2390static void trace_consume(struct trace_iterator *iter)
b3806b43 2391{
12883efb 2392 ring_buffer_consume(iter->trace_buffer->buffer, iter->cpu, &iter->ts,
bc21b478 2393 &iter->lost_events);
bc0c38d1
SR
2394}
2395
e309b41d 2396static void *s_next(struct seq_file *m, void *v, loff_t *pos)
bc0c38d1
SR
2397{
2398 struct trace_iterator *iter = m->private;
bc0c38d1 2399 int i = (int)*pos;
4e3c3333 2400 void *ent;
bc0c38d1 2401
a63ce5b3
SR
2402 WARN_ON_ONCE(iter->leftover);
2403
bc0c38d1
SR
2404 (*pos)++;
2405
2406 /* can't go backwards */
2407 if (iter->idx > i)
2408 return NULL;
2409
2410 if (iter->idx < 0)
955b61e5 2411 ent = trace_find_next_entry_inc(iter);
bc0c38d1
SR
2412 else
2413 ent = iter;
2414
2415 while (ent && iter->idx < i)
955b61e5 2416 ent = trace_find_next_entry_inc(iter);
bc0c38d1
SR
2417
2418 iter->pos = *pos;
2419
bc0c38d1
SR
2420 return ent;
2421}
2422
955b61e5 2423void tracing_iter_reset(struct trace_iterator *iter, int cpu)
2f26ebd5 2424{
2f26ebd5
SR
2425 struct ring_buffer_event *event;
2426 struct ring_buffer_iter *buf_iter;
2427 unsigned long entries = 0;
2428 u64 ts;
2429
12883efb 2430 per_cpu_ptr(iter->trace_buffer->data, cpu)->skipped_entries = 0;
2f26ebd5 2431
6d158a81
SR
2432 buf_iter = trace_buffer_iter(iter, cpu);
2433 if (!buf_iter)
2f26ebd5
SR
2434 return;
2435
2f26ebd5
SR
2436 ring_buffer_iter_reset(buf_iter);
2437
2438 /*
2439 * With the max latency tracers, a reset may never have
2440 * taken place on a cpu. This is evident when the timestamp
2441 * is before the start of the buffer.
2442 */
2443 while ((event = ring_buffer_iter_peek(buf_iter, &ts))) {
12883efb 2444 if (ts >= iter->trace_buffer->time_start)
2f26ebd5
SR
2445 break;
2446 entries++;
2447 ring_buffer_read(buf_iter, NULL);
2448 }
2449
12883efb 2450 per_cpu_ptr(iter->trace_buffer->data, cpu)->skipped_entries = entries;
2f26ebd5
SR
2451}
2452
d7350c3f 2453/*
d7350c3f
FW
2454 * The current tracer is copied to avoid global locking
2455 * all around.
2456 */
bc0c38d1
SR
2457static void *s_start(struct seq_file *m, loff_t *pos)
2458{
2459 struct trace_iterator *iter = m->private;
2b6080f2 2460 struct trace_array *tr = iter->tr;
b04cc6b1 2461 int cpu_file = iter->cpu_file;
bc0c38d1
SR
2462 void *p = NULL;
2463 loff_t l = 0;
3928a8a2 2464 int cpu;
bc0c38d1 2465
2fd196ec
HT
2466 /*
2467 * copy the tracer to avoid using a global lock all around.
2468 * iter->trace is a copy of current_trace, the pointer to the
2469 * name may be used instead of a strcmp(), as iter->trace->name
2470 * will point to the same string as current_trace->name.
2471 */
bc0c38d1 2472 mutex_lock(&trace_types_lock);
2b6080f2
SR
2473 if (unlikely(tr->current_trace && iter->trace->name != tr->current_trace->name))
2474 *iter->trace = *tr->current_trace;
d7350c3f 2475 mutex_unlock(&trace_types_lock);
bc0c38d1 2476
12883efb 2477#ifdef CONFIG_TRACER_MAX_TRACE
debdd57f
HT
2478 if (iter->snapshot && iter->trace->use_max_tr)
2479 return ERR_PTR(-EBUSY);
12883efb 2480#endif
debdd57f
HT
2481
2482 if (!iter->snapshot)
2483 atomic_inc(&trace_record_cmdline_disabled);
bc0c38d1 2484
bc0c38d1
SR
2485 if (*pos != iter->pos) {
2486 iter->ent = NULL;
2487 iter->cpu = 0;
2488 iter->idx = -1;
2489
ae3b5093 2490 if (cpu_file == RING_BUFFER_ALL_CPUS) {
b04cc6b1 2491 for_each_tracing_cpu(cpu)
2f26ebd5 2492 tracing_iter_reset(iter, cpu);
b04cc6b1 2493 } else
2f26ebd5 2494 tracing_iter_reset(iter, cpu_file);
bc0c38d1 2495
ac91d854 2496 iter->leftover = 0;
bc0c38d1
SR
2497 for (p = iter; p && l < *pos; p = s_next(m, p, &l))
2498 ;
2499
2500 } else {
a63ce5b3
SR
2501 /*
2502 * If we overflowed the seq_file before, then we want
2503 * to just reuse the trace_seq buffer again.
2504 */
2505 if (iter->leftover)
2506 p = iter;
2507 else {
2508 l = *pos - 1;
2509 p = s_next(m, p, &l);
2510 }
bc0c38d1
SR
2511 }
2512
4f535968 2513 trace_event_read_lock();
7e53bd42 2514 trace_access_lock(cpu_file);
bc0c38d1
SR
2515 return p;
2516}
2517
2518static void s_stop(struct seq_file *m, void *p)
2519{
7e53bd42
LJ
2520 struct trace_iterator *iter = m->private;
2521
12883efb 2522#ifdef CONFIG_TRACER_MAX_TRACE
debdd57f
HT
2523 if (iter->snapshot && iter->trace->use_max_tr)
2524 return;
12883efb 2525#endif
debdd57f
HT
2526
2527 if (!iter->snapshot)
2528 atomic_dec(&trace_record_cmdline_disabled);
12883efb 2529
7e53bd42 2530 trace_access_unlock(iter->cpu_file);
4f535968 2531 trace_event_read_unlock();
bc0c38d1
SR
2532}
2533
39eaf7ef 2534static void
12883efb
SRRH
2535get_total_entries(struct trace_buffer *buf,
2536 unsigned long *total, unsigned long *entries)
39eaf7ef
SR
2537{
2538 unsigned long count;
2539 int cpu;
2540
2541 *total = 0;
2542 *entries = 0;
2543
2544 for_each_tracing_cpu(cpu) {
12883efb 2545 count = ring_buffer_entries_cpu(buf->buffer, cpu);
39eaf7ef
SR
2546 /*
2547 * If this buffer has skipped entries, then we hold all
2548 * entries for the trace and we need to ignore the
2549 * ones before the time stamp.
2550 */
12883efb
SRRH
2551 if (per_cpu_ptr(buf->data, cpu)->skipped_entries) {
2552 count -= per_cpu_ptr(buf->data, cpu)->skipped_entries;
39eaf7ef
SR
2553 /* total is the same as the entries */
2554 *total += count;
2555 } else
2556 *total += count +
12883efb 2557 ring_buffer_overrun_cpu(buf->buffer, cpu);
39eaf7ef
SR
2558 *entries += count;
2559 }
2560}
2561
e309b41d 2562static void print_lat_help_header(struct seq_file *m)
bc0c38d1 2563{
d79ac28f
RV
2564 seq_puts(m, "# _------=> CPU# \n"
2565 "# / _-----=> irqs-off \n"
2566 "# | / _----=> need-resched \n"
2567 "# || / _---=> hardirq/softirq \n"
2568 "# ||| / _--=> preempt-depth \n"
2569 "# |||| / delay \n"
2570 "# cmd pid ||||| time | caller \n"
2571 "# \\ / ||||| \\ | / \n");
bc0c38d1
SR
2572}
2573
12883efb 2574static void print_event_info(struct trace_buffer *buf, struct seq_file *m)
bc0c38d1 2575{
39eaf7ef
SR
2576 unsigned long total;
2577 unsigned long entries;
2578
12883efb 2579 get_total_entries(buf, &total, &entries);
39eaf7ef
SR
2580 seq_printf(m, "# entries-in-buffer/entries-written: %lu/%lu #P:%d\n",
2581 entries, total, num_online_cpus());
2582 seq_puts(m, "#\n");
2583}
2584
12883efb 2585static void print_func_help_header(struct trace_buffer *buf, struct seq_file *m)
39eaf7ef 2586{
12883efb 2587 print_event_info(buf, m);
d79ac28f
RV
2588 seq_puts(m, "# TASK-PID CPU# TIMESTAMP FUNCTION\n"
2589 "# | | | | |\n");
bc0c38d1
SR
2590}
2591
12883efb 2592static void print_func_help_header_irq(struct trace_buffer *buf, struct seq_file *m)
77271ce4 2593{
12883efb 2594 print_event_info(buf, m);
d79ac28f
RV
2595 seq_puts(m, "# _-----=> irqs-off\n"
2596 "# / _----=> need-resched\n"
2597 "# | / _---=> hardirq/softirq\n"
2598 "# || / _--=> preempt-depth\n"
2599 "# ||| / delay\n"
2600 "# TASK-PID CPU# |||| TIMESTAMP FUNCTION\n"
2601 "# | | | |||| | |\n");
77271ce4 2602}
bc0c38d1 2603
62b915f1 2604void
bc0c38d1
SR
2605print_trace_header(struct seq_file *m, struct trace_iterator *iter)
2606{
983f938a 2607 unsigned long sym_flags = (global_trace.trace_flags & TRACE_ITER_SYM_MASK);
12883efb
SRRH
2608 struct trace_buffer *buf = iter->trace_buffer;
2609 struct trace_array_cpu *data = per_cpu_ptr(buf->data, buf->cpu);
2b6080f2 2610 struct tracer *type = iter->trace;
39eaf7ef
SR
2611 unsigned long entries;
2612 unsigned long total;
bc0c38d1
SR
2613 const char *name = "preemption";
2614
d840f718 2615 name = type->name;
bc0c38d1 2616
12883efb 2617 get_total_entries(buf, &total, &entries);
bc0c38d1 2618
888b55dc 2619 seq_printf(m, "# %s latency trace v1.1.5 on %s\n",
bc0c38d1 2620 name, UTS_RELEASE);
888b55dc 2621 seq_puts(m, "# -----------------------------------"
bc0c38d1 2622 "---------------------------------\n");
888b55dc 2623 seq_printf(m, "# latency: %lu us, #%lu/%lu, CPU#%d |"
bc0c38d1 2624 " (M:%s VP:%d, KP:%d, SP:%d HP:%d",
57f50be1 2625 nsecs_to_usecs(data->saved_latency),
bc0c38d1 2626 entries,
4c11d7ae 2627 total,
12883efb 2628 buf->cpu,
bc0c38d1
SR
2629#if defined(CONFIG_PREEMPT_NONE)
2630 "server",
2631#elif defined(CONFIG_PREEMPT_VOLUNTARY)
2632 "desktop",
b5c21b45 2633#elif defined(CONFIG_PREEMPT)
bc0c38d1
SR
2634 "preempt",
2635#else
2636 "unknown",
2637#endif
2638 /* These are reserved for later use */
2639 0, 0, 0, 0);
2640#ifdef CONFIG_SMP
2641 seq_printf(m, " #P:%d)\n", num_online_cpus());
2642#else
2643 seq_puts(m, ")\n");
2644#endif
888b55dc
KM
2645 seq_puts(m, "# -----------------\n");
2646 seq_printf(m, "# | task: %.16s-%d "
bc0c38d1 2647 "(uid:%d nice:%ld policy:%ld rt_prio:%ld)\n",
d20b92ab
EB
2648 data->comm, data->pid,
2649 from_kuid_munged(seq_user_ns(m), data->uid), data->nice,
bc0c38d1 2650 data->policy, data->rt_priority);
888b55dc 2651 seq_puts(m, "# -----------------\n");
bc0c38d1
SR
2652
2653 if (data->critical_start) {
888b55dc 2654 seq_puts(m, "# => started at: ");
214023c3
SR
2655 seq_print_ip_sym(&iter->seq, data->critical_start, sym_flags);
2656 trace_print_seq(m, &iter->seq);
888b55dc 2657 seq_puts(m, "\n# => ended at: ");
214023c3
SR
2658 seq_print_ip_sym(&iter->seq, data->critical_end, sym_flags);
2659 trace_print_seq(m, &iter->seq);
8248ac05 2660 seq_puts(m, "\n#\n");
bc0c38d1
SR
2661 }
2662
888b55dc 2663 seq_puts(m, "#\n");
bc0c38d1
SR
2664}
2665
a309720c
SR
2666static void test_cpu_buff_start(struct trace_iterator *iter)
2667{
2668 struct trace_seq *s = &iter->seq;
983f938a 2669 struct trace_array *tr = iter->tr;
a309720c 2670
983f938a 2671 if (!(tr->trace_flags & TRACE_ITER_ANNOTATE))
12ef7d44
SR
2672 return;
2673
2674 if (!(iter->iter_flags & TRACE_FILE_ANNOTATE))
2675 return;
2676
919cd979 2677 if (iter->started && cpumask_test_cpu(iter->cpu, iter->started))
a309720c
SR
2678 return;
2679
12883efb 2680 if (per_cpu_ptr(iter->trace_buffer->data, iter->cpu)->skipped_entries)
2f26ebd5
SR
2681 return;
2682
919cd979
SL
2683 if (iter->started)
2684 cpumask_set_cpu(iter->cpu, iter->started);
b0dfa978
FW
2685
2686 /* Don't print started cpu buffer for the first entry of the trace */
2687 if (iter->idx > 1)
2688 trace_seq_printf(s, "##### CPU %u buffer started ####\n",
2689 iter->cpu);
a309720c
SR
2690}
2691
2c4f035f 2692static enum print_line_t print_trace_fmt(struct trace_iterator *iter)
bc0c38d1 2693{
983f938a 2694 struct trace_array *tr = iter->tr;
214023c3 2695 struct trace_seq *s = &iter->seq;
983f938a 2696 unsigned long sym_flags = (tr->trace_flags & TRACE_ITER_SYM_MASK);
4e3c3333 2697 struct trace_entry *entry;
f633cef0 2698 struct trace_event *event;
bc0c38d1 2699
4e3c3333 2700 entry = iter->ent;
dd0e545f 2701
a309720c
SR
2702 test_cpu_buff_start(iter);
2703
c4a8e8be 2704 event = ftrace_find_event(entry->type);
bc0c38d1 2705
983f938a 2706 if (tr->trace_flags & TRACE_ITER_CONTEXT_INFO) {
19a7fe20
SRRH
2707 if (iter->iter_flags & TRACE_FILE_LAT_FMT)
2708 trace_print_lat_context(iter);
2709 else
2710 trace_print_context(iter);
c4a8e8be 2711 }
bc0c38d1 2712
19a7fe20
SRRH
2713 if (trace_seq_has_overflowed(s))
2714 return TRACE_TYPE_PARTIAL_LINE;
2715
268ccda0 2716 if (event)
a9a57763 2717 return event->funcs->trace(iter, sym_flags, event);
d9793bd8 2718
19a7fe20 2719 trace_seq_printf(s, "Unknown type %d\n", entry->type);
02b67518 2720
19a7fe20 2721 return trace_handle_return(s);
bc0c38d1
SR
2722}
2723
2c4f035f 2724static enum print_line_t print_raw_fmt(struct trace_iterator *iter)
f9896bf3 2725{
983f938a 2726 struct trace_array *tr = iter->tr;
f9896bf3
IM
2727 struct trace_seq *s = &iter->seq;
2728 struct trace_entry *entry;
f633cef0 2729 struct trace_event *event;
f9896bf3
IM
2730
2731 entry = iter->ent;
dd0e545f 2732
983f938a 2733 if (tr->trace_flags & TRACE_ITER_CONTEXT_INFO)
19a7fe20
SRRH
2734 trace_seq_printf(s, "%d %d %llu ",
2735 entry->pid, iter->cpu, iter->ts);
2736
2737 if (trace_seq_has_overflowed(s))
2738 return TRACE_TYPE_PARTIAL_LINE;
f9896bf3 2739
f633cef0 2740 event = ftrace_find_event(entry->type);
268ccda0 2741 if (event)
a9a57763 2742 return event->funcs->raw(iter, 0, event);
d9793bd8 2743
19a7fe20 2744 trace_seq_printf(s, "%d ?\n", entry->type);
777e208d 2745
19a7fe20 2746 return trace_handle_return(s);
f9896bf3
IM
2747}
2748
2c4f035f 2749static enum print_line_t print_hex_fmt(struct trace_iterator *iter)
5e3ca0ec 2750{
983f938a 2751 struct trace_array *tr = iter->tr;
5e3ca0ec
IM
2752 struct trace_seq *s = &iter->seq;
2753 unsigned char newline = '\n';
2754 struct trace_entry *entry;
f633cef0 2755 struct trace_event *event;
5e3ca0ec
IM
2756
2757 entry = iter->ent;
dd0e545f 2758
983f938a 2759 if (tr->trace_flags & TRACE_ITER_CONTEXT_INFO) {
19a7fe20
SRRH
2760 SEQ_PUT_HEX_FIELD(s, entry->pid);
2761 SEQ_PUT_HEX_FIELD(s, iter->cpu);
2762 SEQ_PUT_HEX_FIELD(s, iter->ts);
2763 if (trace_seq_has_overflowed(s))
2764 return TRACE_TYPE_PARTIAL_LINE;
c4a8e8be 2765 }
5e3ca0ec 2766
f633cef0 2767 event = ftrace_find_event(entry->type);
268ccda0 2768 if (event) {
a9a57763 2769 enum print_line_t ret = event->funcs->hex(iter, 0, event);
d9793bd8
ACM
2770 if (ret != TRACE_TYPE_HANDLED)
2771 return ret;
2772 }
7104f300 2773
19a7fe20 2774 SEQ_PUT_FIELD(s, newline);
5e3ca0ec 2775
19a7fe20 2776 return trace_handle_return(s);
5e3ca0ec
IM
2777}
2778
2c4f035f 2779static enum print_line_t print_bin_fmt(struct trace_iterator *iter)
cb0f12aa 2780{
983f938a 2781 struct trace_array *tr = iter->tr;
cb0f12aa
IM
2782 struct trace_seq *s = &iter->seq;
2783 struct trace_entry *entry;
f633cef0 2784 struct trace_event *event;
cb0f12aa
IM
2785
2786 entry = iter->ent;
dd0e545f 2787
983f938a 2788 if (tr->trace_flags & TRACE_ITER_CONTEXT_INFO) {
19a7fe20
SRRH
2789 SEQ_PUT_FIELD(s, entry->pid);
2790 SEQ_PUT_FIELD(s, iter->cpu);
2791 SEQ_PUT_FIELD(s, iter->ts);
2792 if (trace_seq_has_overflowed(s))
2793 return TRACE_TYPE_PARTIAL_LINE;
c4a8e8be 2794 }
cb0f12aa 2795
f633cef0 2796 event = ftrace_find_event(entry->type);
a9a57763
SR
2797 return event ? event->funcs->binary(iter, 0, event) :
2798 TRACE_TYPE_HANDLED;
cb0f12aa
IM
2799}
2800
62b915f1 2801int trace_empty(struct trace_iterator *iter)
bc0c38d1 2802{
6d158a81 2803 struct ring_buffer_iter *buf_iter;
bc0c38d1
SR
2804 int cpu;
2805
9aba60fe 2806 /* If we are looking at one CPU buffer, only check that one */
ae3b5093 2807 if (iter->cpu_file != RING_BUFFER_ALL_CPUS) {
9aba60fe 2808 cpu = iter->cpu_file;
6d158a81
SR
2809 buf_iter = trace_buffer_iter(iter, cpu);
2810 if (buf_iter) {
2811 if (!ring_buffer_iter_empty(buf_iter))
9aba60fe
SR
2812 return 0;
2813 } else {
12883efb 2814 if (!ring_buffer_empty_cpu(iter->trace_buffer->buffer, cpu))
9aba60fe
SR
2815 return 0;
2816 }
2817 return 1;
2818 }
2819
ab46428c 2820 for_each_tracing_cpu(cpu) {
6d158a81
SR
2821 buf_iter = trace_buffer_iter(iter, cpu);
2822 if (buf_iter) {
2823 if (!ring_buffer_iter_empty(buf_iter))
d769041f
SR
2824 return 0;
2825 } else {
12883efb 2826 if (!ring_buffer_empty_cpu(iter->trace_buffer->buffer, cpu))
d769041f
SR
2827 return 0;
2828 }
bc0c38d1 2829 }
d769041f 2830
797d3712 2831 return 1;
bc0c38d1
SR
2832}
2833
4f535968 2834/* Called with trace_event_read_lock() held. */
955b61e5 2835enum print_line_t print_trace_line(struct trace_iterator *iter)
f9896bf3 2836{
983f938a
SRRH
2837 struct trace_array *tr = iter->tr;
2838 unsigned long trace_flags = tr->trace_flags;
2c4f035f
FW
2839 enum print_line_t ret;
2840
19a7fe20
SRRH
2841 if (iter->lost_events) {
2842 trace_seq_printf(&iter->seq, "CPU:%d [LOST %lu EVENTS]\n",
2843 iter->cpu, iter->lost_events);
2844 if (trace_seq_has_overflowed(&iter->seq))
2845 return TRACE_TYPE_PARTIAL_LINE;
2846 }
bc21b478 2847
2c4f035f
FW
2848 if (iter->trace && iter->trace->print_line) {
2849 ret = iter->trace->print_line(iter);
2850 if (ret != TRACE_TYPE_UNHANDLED)
2851 return ret;
2852 }
72829bc3 2853
09ae7234
SRRH
2854 if (iter->ent->type == TRACE_BPUTS &&
2855 trace_flags & TRACE_ITER_PRINTK &&
2856 trace_flags & TRACE_ITER_PRINTK_MSGONLY)
2857 return trace_print_bputs_msg_only(iter);
2858
48ead020
FW
2859 if (iter->ent->type == TRACE_BPRINT &&
2860 trace_flags & TRACE_ITER_PRINTK &&
2861 trace_flags & TRACE_ITER_PRINTK_MSGONLY)
5ef841f6 2862 return trace_print_bprintk_msg_only(iter);
48ead020 2863
66896a85
FW
2864 if (iter->ent->type == TRACE_PRINT &&
2865 trace_flags & TRACE_ITER_PRINTK &&
2866 trace_flags & TRACE_ITER_PRINTK_MSGONLY)
5ef841f6 2867 return trace_print_printk_msg_only(iter);
66896a85 2868
cb0f12aa
IM
2869 if (trace_flags & TRACE_ITER_BIN)
2870 return print_bin_fmt(iter);
2871
5e3ca0ec
IM
2872 if (trace_flags & TRACE_ITER_HEX)
2873 return print_hex_fmt(iter);
2874
f9896bf3
IM
2875 if (trace_flags & TRACE_ITER_RAW)
2876 return print_raw_fmt(iter);
2877
f9896bf3
IM
2878 return print_trace_fmt(iter);
2879}
2880
7e9a49ef
JO
2881void trace_latency_header(struct seq_file *m)
2882{
2883 struct trace_iterator *iter = m->private;
983f938a 2884 struct trace_array *tr = iter->tr;
7e9a49ef
JO
2885
2886 /* print nothing if the buffers are empty */
2887 if (trace_empty(iter))
2888 return;
2889
2890 if (iter->iter_flags & TRACE_FILE_LAT_FMT)
2891 print_trace_header(m, iter);
2892
983f938a 2893 if (!(tr->trace_flags & TRACE_ITER_VERBOSE))
7e9a49ef
JO
2894 print_lat_help_header(m);
2895}
2896
62b915f1
JO
2897void trace_default_header(struct seq_file *m)
2898{
2899 struct trace_iterator *iter = m->private;
983f938a
SRRH
2900 struct trace_array *tr = iter->tr;
2901 unsigned long trace_flags = tr->trace_flags;
62b915f1 2902
f56e7f8e
JO
2903 if (!(trace_flags & TRACE_ITER_CONTEXT_INFO))
2904 return;
2905
62b915f1
JO
2906 if (iter->iter_flags & TRACE_FILE_LAT_FMT) {
2907 /* print nothing if the buffers are empty */
2908 if (trace_empty(iter))
2909 return;
2910 print_trace_header(m, iter);
2911 if (!(trace_flags & TRACE_ITER_VERBOSE))
2912 print_lat_help_header(m);
2913 } else {
77271ce4
SR
2914 if (!(trace_flags & TRACE_ITER_VERBOSE)) {
2915 if (trace_flags & TRACE_ITER_IRQ_INFO)
12883efb 2916 print_func_help_header_irq(iter->trace_buffer, m);
77271ce4 2917 else
12883efb 2918 print_func_help_header(iter->trace_buffer, m);
77271ce4 2919 }
62b915f1
JO
2920 }
2921}
2922
e0a413f6
SR
2923static void test_ftrace_alive(struct seq_file *m)
2924{
2925 if (!ftrace_is_dead())
2926 return;
d79ac28f
RV
2927 seq_puts(m, "# WARNING: FUNCTION TRACING IS CORRUPTED\n"
2928 "# MAY BE MISSING FUNCTION EVENTS\n");
e0a413f6
SR
2929}
2930
d8741e2e 2931#ifdef CONFIG_TRACER_MAX_TRACE
f1affcaa 2932static void show_snapshot_main_help(struct seq_file *m)
d8741e2e 2933{
d79ac28f
RV
2934 seq_puts(m, "# echo 0 > snapshot : Clears and frees snapshot buffer\n"
2935 "# echo 1 > snapshot : Allocates snapshot buffer, if not already allocated.\n"
2936 "# Takes a snapshot of the main buffer.\n"
2937 "# echo 2 > snapshot : Clears snapshot buffer (but does not allocate or free)\n"
2938 "# (Doesn't have to be '2' works with any number that\n"
2939 "# is not a '0' or '1')\n");
d8741e2e 2940}
f1affcaa
SRRH
2941
2942static void show_snapshot_percpu_help(struct seq_file *m)
2943{
fa6f0cc7 2944 seq_puts(m, "# echo 0 > snapshot : Invalid for per_cpu snapshot file.\n");
f1affcaa 2945#ifdef CONFIG_RING_BUFFER_ALLOW_SWAP
d79ac28f
RV
2946 seq_puts(m, "# echo 1 > snapshot : Allocates snapshot buffer, if not already allocated.\n"
2947 "# Takes a snapshot of the main buffer for this cpu.\n");
f1affcaa 2948#else
d79ac28f
RV
2949 seq_puts(m, "# echo 1 > snapshot : Not supported with this kernel.\n"
2950 "# Must use main snapshot file to allocate.\n");
f1affcaa 2951#endif
d79ac28f
RV
2952 seq_puts(m, "# echo 2 > snapshot : Clears this cpu's snapshot buffer (but does not allocate)\n"
2953 "# (Doesn't have to be '2' works with any number that\n"
2954 "# is not a '0' or '1')\n");
f1affcaa
SRRH
2955}
2956
d8741e2e
SRRH
2957static void print_snapshot_help(struct seq_file *m, struct trace_iterator *iter)
2958{
45ad21ca 2959 if (iter->tr->allocated_snapshot)
fa6f0cc7 2960 seq_puts(m, "#\n# * Snapshot is allocated *\n#\n");
d8741e2e 2961 else
fa6f0cc7 2962 seq_puts(m, "#\n# * Snapshot is freed *\n#\n");
d8741e2e 2963
fa6f0cc7 2964 seq_puts(m, "# Snapshot commands:\n");
f1affcaa
SRRH
2965 if (iter->cpu_file == RING_BUFFER_ALL_CPUS)
2966 show_snapshot_main_help(m);
2967 else
2968 show_snapshot_percpu_help(m);
d8741e2e
SRRH
2969}
2970#else
2971/* Should never be called */
2972static inline void print_snapshot_help(struct seq_file *m, struct trace_iterator *iter) { }
2973#endif
2974
bc0c38d1
SR
2975static int s_show(struct seq_file *m, void *v)
2976{
2977 struct trace_iterator *iter = v;
a63ce5b3 2978 int ret;
bc0c38d1
SR
2979
2980 if (iter->ent == NULL) {
2981 if (iter->tr) {
2982 seq_printf(m, "# tracer: %s\n", iter->trace->name);
2983 seq_puts(m, "#\n");
e0a413f6 2984 test_ftrace_alive(m);
bc0c38d1 2985 }
d8741e2e
SRRH
2986 if (iter->snapshot && trace_empty(iter))
2987 print_snapshot_help(m, iter);
2988 else if (iter->trace && iter->trace->print_header)
8bba1bf5 2989 iter->trace->print_header(m);
62b915f1
JO
2990 else
2991 trace_default_header(m);
2992
a63ce5b3
SR
2993 } else if (iter->leftover) {
2994 /*
2995 * If we filled the seq_file buffer earlier, we
2996 * want to just show it now.
2997 */
2998 ret = trace_print_seq(m, &iter->seq);
2999
3000 /* ret should this time be zero, but you never know */
3001 iter->leftover = ret;
3002
bc0c38d1 3003 } else {
f9896bf3 3004 print_trace_line(iter);
a63ce5b3
SR
3005 ret = trace_print_seq(m, &iter->seq);
3006 /*
3007 * If we overflow the seq_file buffer, then it will
3008 * ask us for this data again on the next read.
3009 * Use that instead.
3010 * ret is 0 if seq_file write succeeded.
3011 * -1 otherwise.
3012 */
3013 iter->leftover = ret;
bc0c38d1
SR
3014 }
3015
3016 return 0;
3017}
3018
649e9c70
ON
3019/*
3020 * Should be used after trace_array_get(), trace_types_lock
3021 * ensures that i_cdev was already initialized.
3022 */
3023static inline int tracing_get_cpu(struct inode *inode)
3024{
3025 if (inode->i_cdev) /* See trace_create_cpu_file() */
3026 return (long)inode->i_cdev - 1;
3027 return RING_BUFFER_ALL_CPUS;
3028}
3029
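/*
 * Example (a sketch of the encode side; the real store is in
 * trace_create_cpu_file()): the trick decoded by tracing_get_cpu()
 * above. The cpu number is stashed in i_cdev as (cpu + 1) when the
 * per-cpu files are created, so that a NULL i_cdev still means
 * "all cpus".
 */
static void example_stash_cpu(struct inode *inode, int cpu)
{
	inode->i_cdev = (void *)(long)(cpu + 1);
}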
88e9d34c 3030static const struct seq_operations tracer_seq_ops = {
4bf39a94
IM
3031 .start = s_start,
3032 .next = s_next,
3033 .stop = s_stop,
3034 .show = s_show,
bc0c38d1
SR
3035};
3036
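/*
 * Aside (illustrative only, not part of trace.c): the seq_file core
 * drives the hooks above roughly like this:
 *
 *	p = start(m, &pos);
 *	while (p) {
 *		show(m, p);
 *		p = next(m, p, &pos);
 *	}
 *	stop(m, p);
 *
 * s_start() must be able to re-seek to an arbitrary *pos, which is
 * why it replays s_next() from the beginning when the position moved.
 */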
e309b41d 3037static struct trace_iterator *
6484c71c 3038__tracing_open(struct inode *inode, struct file *file, bool snapshot)
bc0c38d1 3039{
6484c71c 3040 struct trace_array *tr = inode->i_private;
bc0c38d1 3041 struct trace_iterator *iter;
50e18b94 3042 int cpu;
bc0c38d1 3043
85a2f9b4
SR
3044 if (tracing_disabled)
3045 return ERR_PTR(-ENODEV);
60a11774 3046
50e18b94 3047 iter = __seq_open_private(file, &tracer_seq_ops, sizeof(*iter));
85a2f9b4
SR
3048 if (!iter)
3049 return ERR_PTR(-ENOMEM);
bc0c38d1 3050
72917235 3051 iter->buffer_iter = kcalloc(nr_cpu_ids, sizeof(*iter->buffer_iter),
6d158a81 3052 GFP_KERNEL);
93574fcc
DC
3053 if (!iter->buffer_iter)
3054 goto release;
3055
d7350c3f
FW
3056 /*
3057 * We make a copy of the current tracer to avoid concurrent
3058 * changes on it while we are reading.
3059 */
bc0c38d1 3060 mutex_lock(&trace_types_lock);
d7350c3f 3061 iter->trace = kzalloc(sizeof(*iter->trace), GFP_KERNEL);
85a2f9b4 3062 if (!iter->trace)
d7350c3f 3063 goto fail;
85a2f9b4 3064
2b6080f2 3065 *iter->trace = *tr->current_trace;
d7350c3f 3066
79f55997 3067 if (!zalloc_cpumask_var(&iter->started, GFP_KERNEL))
b0dfa978
FW
3068 goto fail;
3069
12883efb
SRRH
3070 iter->tr = tr;
3071
3072#ifdef CONFIG_TRACER_MAX_TRACE
2b6080f2
SR
3073 /* Currently only the top directory has a snapshot */
3074 if (tr->current_trace->print_max || snapshot)
12883efb 3075 iter->trace_buffer = &tr->max_buffer;
bc0c38d1 3076 else
12883efb
SRRH
3077#endif
3078 iter->trace_buffer = &tr->trace_buffer;
debdd57f 3079 iter->snapshot = snapshot;
bc0c38d1 3080 iter->pos = -1;
6484c71c 3081 iter->cpu_file = tracing_get_cpu(inode);
d7350c3f 3082 mutex_init(&iter->mutex);
bc0c38d1 3083
8bba1bf5
MM
3084 /* Notify the tracer early; before we stop tracing. */
3085 if (iter->trace && iter->trace->open)
a93751ca 3086 iter->trace->open(iter);
8bba1bf5 3087
12ef7d44 3088 /* Annotate start of buffers if we had overruns */
12883efb 3089 if (ring_buffer_overruns(iter->trace_buffer->buffer))
12ef7d44
SR
3090 iter->iter_flags |= TRACE_FILE_ANNOTATE;
3091
8be0709f 3092 /* Output in nanoseconds only if we are using a clock in nanoseconds. */
58e8eedf 3093 if (trace_clocks[tr->clock_id].in_ns)
8be0709f
DS
3094 iter->iter_flags |= TRACE_FILE_TIME_IN_NS;
3095
debdd57f
HT
3096 /* stop the trace while dumping if we are not opening "snapshot" */
3097 if (!iter->snapshot)
2b6080f2 3098 tracing_stop_tr(tr);
2f26ebd5 3099
ae3b5093 3100 if (iter->cpu_file == RING_BUFFER_ALL_CPUS) {
b04cc6b1 3101 for_each_tracing_cpu(cpu) {
b04cc6b1 3102 iter->buffer_iter[cpu] =
12883efb 3103 ring_buffer_read_prepare(iter->trace_buffer->buffer, cpu);
72c9ddfd
DM
3104 }
3105 ring_buffer_read_prepare_sync();
3106 for_each_tracing_cpu(cpu) {
3107 ring_buffer_read_start(iter->buffer_iter[cpu]);
2f26ebd5 3108 tracing_iter_reset(iter, cpu);
b04cc6b1
FW
3109 }
3110 } else {
3111 cpu = iter->cpu_file;
3928a8a2 3112 iter->buffer_iter[cpu] =
12883efb 3113 ring_buffer_read_prepare(iter->trace_buffer->buffer, cpu);
72c9ddfd
DM
3114 ring_buffer_read_prepare_sync();
3115 ring_buffer_read_start(iter->buffer_iter[cpu]);
2f26ebd5 3116 tracing_iter_reset(iter, cpu);
3928a8a2
SR
3117 }
3118
bc0c38d1
SR
3119 mutex_unlock(&trace_types_lock);
3120
bc0c38d1 3121 return iter;
3928a8a2 3122
d7350c3f 3123 fail:
3928a8a2 3124 mutex_unlock(&trace_types_lock);
d7350c3f 3125 kfree(iter->trace);
6d158a81 3126 kfree(iter->buffer_iter);
93574fcc 3127release:
50e18b94
JO
3128 seq_release_private(inode, file);
3129 return ERR_PTR(-ENOMEM);
bc0c38d1
SR
3130}
3131
3132int tracing_open_generic(struct inode *inode, struct file *filp)
3133{
60a11774
SR
3134 if (tracing_disabled)
3135 return -ENODEV;
3136
bc0c38d1
SR
3137 filp->private_data = inode->i_private;
3138 return 0;
3139}
3140
2e86421d
GB
3141bool tracing_is_disabled(void)
3142{
3143 return (tracing_disabled) ? true : false;
3144}
3145
7b85af63
SRRH
3146/*
3147 * Open and update trace_array ref count.
3148 * Must have the current trace_array passed to it.
3149 */
dcc30223 3150static int tracing_open_generic_tr(struct inode *inode, struct file *filp)
7b85af63
SRRH
3151{
3152 struct trace_array *tr = inode->i_private;
3153
3154 if (tracing_disabled)
3155 return -ENODEV;
3156
3157 if (trace_array_get(tr) < 0)
3158 return -ENODEV;
3159
3160 filp->private_data = inode->i_private;
3161
3162 return 0;
7b85af63
SRRH
3163}
3164
4fd27358 3165static int tracing_release(struct inode *inode, struct file *file)
bc0c38d1 3166{
6484c71c 3167 struct trace_array *tr = inode->i_private;
907f2784 3168 struct seq_file *m = file->private_data;
4acd4d00 3169 struct trace_iterator *iter;
3928a8a2 3170 int cpu;
bc0c38d1 3171
ff451961 3172 if (!(file->f_mode & FMODE_READ)) {
6484c71c 3173 trace_array_put(tr);
4acd4d00 3174 return 0;
ff451961 3175 }
4acd4d00 3176
6484c71c 3177 /* Writes do not use seq_file */
4acd4d00 3178 iter = m->private;
bc0c38d1 3179 mutex_lock(&trace_types_lock);
a695cb58 3180
3928a8a2
SR
3181 for_each_tracing_cpu(cpu) {
3182 if (iter->buffer_iter[cpu])
3183 ring_buffer_read_finish(iter->buffer_iter[cpu]);
3184 }
3185
bc0c38d1
SR
3186 if (iter->trace && iter->trace->close)
3187 iter->trace->close(iter);
3188
debdd57f
HT
3189 if (!iter->snapshot)
3190 /* reenable tracing if it was previously enabled */
2b6080f2 3191 tracing_start_tr(tr);
f77d09a3
AL
3192
3193 __trace_array_put(tr);
3194
bc0c38d1
SR
3195 mutex_unlock(&trace_types_lock);
3196
d7350c3f 3197 mutex_destroy(&iter->mutex);
b0dfa978 3198 free_cpumask_var(iter->started);
d7350c3f 3199 kfree(iter->trace);
6d158a81 3200 kfree(iter->buffer_iter);
50e18b94 3201 seq_release_private(inode, file);
ff451961 3202
bc0c38d1
SR
3203 return 0;
3204}
3205
7b85af63
SRRH
3206static int tracing_release_generic_tr(struct inode *inode, struct file *file)
3207{
3208 struct trace_array *tr = inode->i_private;
3209
3210 trace_array_put(tr);
bc0c38d1
SR
3211 return 0;
3212}
3213
7b85af63
SRRH
3214static int tracing_single_release_tr(struct inode *inode, struct file *file)
3215{
3216 struct trace_array *tr = inode->i_private;
3217
3218 trace_array_put(tr);
3219
3220 return single_release(inode, file);
3221}
3222
bc0c38d1
SR
3223static int tracing_open(struct inode *inode, struct file *file)
3224{
6484c71c 3225 struct trace_array *tr = inode->i_private;
85a2f9b4
SR
3226 struct trace_iterator *iter;
3227 int ret = 0;
bc0c38d1 3228
ff451961
SRRH
3229 if (trace_array_get(tr) < 0)
3230 return -ENODEV;
3231
4acd4d00 3232 /* If this file was open for write, then erase contents */
6484c71c
ON
3233 if ((file->f_mode & FMODE_WRITE) && (file->f_flags & O_TRUNC)) {
3234 int cpu = tracing_get_cpu(inode);
3235
3236 if (cpu == RING_BUFFER_ALL_CPUS)
12883efb 3237 tracing_reset_online_cpus(&tr->trace_buffer);
4acd4d00 3238 else
6484c71c 3239 tracing_reset(&tr->trace_buffer, cpu);
4acd4d00 3240 }
bc0c38d1 3241
4acd4d00 3242 if (file->f_mode & FMODE_READ) {
6484c71c 3243 iter = __tracing_open(inode, file, false);
4acd4d00
SR
3244 if (IS_ERR(iter))
3245 ret = PTR_ERR(iter);
983f938a 3246 else if (tr->trace_flags & TRACE_ITER_LATENCY_FMT)
4acd4d00
SR
3247 iter->iter_flags |= TRACE_FILE_LAT_FMT;
3248 }
ff451961
SRRH
3249
3250 if (ret < 0)
3251 trace_array_put(tr);
3252
bc0c38d1
SR
3253 return ret;
3254}
3255
607e2ea1
SRRH
3256/*
3257 * Some tracers are not suitable for instance buffers.
3258 * A tracer is always available for the global array (toplevel)
3259 * or if it explicitly states that it is.
3260 */
3261static bool
3262trace_ok_for_array(struct tracer *t, struct trace_array *tr)
3263{
3264 return (tr->flags & TRACE_ARRAY_FL_GLOBAL) || t->allow_instances;
3265}
3266
3267/* Find the next tracer that this trace array may use */
3268static struct tracer *
3269get_tracer_for_array(struct trace_array *tr, struct tracer *t)
3270{
3271 while (t && !trace_ok_for_array(t, tr))
3272 t = t->next;
3273
3274 return t;
3275}
3276
e309b41d 3277static void *
bc0c38d1
SR
3278t_next(struct seq_file *m, void *v, loff_t *pos)
3279{
607e2ea1 3280 struct trace_array *tr = m->private;
f129e965 3281 struct tracer *t = v;
bc0c38d1
SR
3282
3283 (*pos)++;
3284
3285 if (t)
607e2ea1 3286 t = get_tracer_for_array(tr, t->next);
bc0c38d1 3287
bc0c38d1
SR
3288 return t;
3289}
3290
3291static void *t_start(struct seq_file *m, loff_t *pos)
3292{
607e2ea1 3293 struct trace_array *tr = m->private;
f129e965 3294 struct tracer *t;
bc0c38d1
SR
3295 loff_t l = 0;
3296
3297 mutex_lock(&trace_types_lock);
607e2ea1
SRRH
3298
3299 t = get_tracer_for_array(tr, trace_types);
3300 for (; t && l < *pos; t = t_next(m, t, &l))
3301 ;
bc0c38d1
SR
3302
3303 return t;
3304}
3305
3306static void t_stop(struct seq_file *m, void *p)
3307{
3308 mutex_unlock(&trace_types_lock);
3309}
3310
3311static int t_show(struct seq_file *m, void *v)
3312{
3313 struct tracer *t = v;
3314
3315 if (!t)
3316 return 0;
3317
fa6f0cc7 3318 seq_puts(m, t->name);
bc0c38d1
SR
3319 if (t->next)
3320 seq_putc(m, ' ');
3321 else
3322 seq_putc(m, '\n');
3323
3324 return 0;
3325}
3326
88e9d34c 3327static const struct seq_operations show_traces_seq_ops = {
4bf39a94
IM
3328 .start = t_start,
3329 .next = t_next,
3330 .stop = t_stop,
3331 .show = t_show,
bc0c38d1
SR
3332};
3333
3334static int show_traces_open(struct inode *inode, struct file *file)
3335{
607e2ea1
SRRH
3336 struct trace_array *tr = inode->i_private;
3337 struct seq_file *m;
3338 int ret;
3339
60a11774
SR
3340 if (tracing_disabled)
3341 return -ENODEV;
3342
607e2ea1
SRRH
3343 ret = seq_open(file, &show_traces_seq_ops);
3344 if (ret)
3345 return ret;
3346
3347 m = file->private_data;
3348 m->private = tr;
3349
3350 return 0;
bc0c38d1
SR
3351}
3352
4acd4d00
SR
3353static ssize_t
3354tracing_write_stub(struct file *filp, const char __user *ubuf,
3355 size_t count, loff_t *ppos)
3356{
3357 return count;
3358}
3359
098c879e 3360loff_t tracing_lseek(struct file *file, loff_t offset, int whence)
364829b1 3361{
098c879e
SRRH
3362 int ret;
3363
364829b1 3364 if (file->f_mode & FMODE_READ)
098c879e 3365 ret = seq_lseek(file, offset, whence);
364829b1 3366 else
098c879e
SRRH
3367 file->f_pos = ret = 0;
3368
3369 return ret;
364829b1
SP
3370}
3371
5e2336a0 3372static const struct file_operations tracing_fops = {
4bf39a94
IM
3373 .open = tracing_open,
3374 .read = seq_read,
4acd4d00 3375 .write = tracing_write_stub,
098c879e 3376 .llseek = tracing_lseek,
4bf39a94 3377 .release = tracing_release,
bc0c38d1
SR
3378};
3379
5e2336a0 3380static const struct file_operations show_traces_fops = {
c7078de1
IM
3381 .open = show_traces_open,
3382 .read = seq_read,
3383 .release = seq_release,
b444786f 3384 .llseek = seq_lseek,
c7078de1
IM
3385};
3386
36dfe925
IM
3387/*
3388 * The tracer itself will not take this lock, but still we want
3389 * to provide a consistent cpumask to user-space:
3390 */
3391static DEFINE_MUTEX(tracing_cpumask_update_lock);
3392
3393/*
3394 * Temporary storage for the character representation of the
3395 * CPU bitmask (and one more byte for the newline):
3396 */
3397static char mask_str[NR_CPUS + 1];
3398
c7078de1
IM
3399static ssize_t
3400tracing_cpumask_read(struct file *filp, char __user *ubuf,
3401 size_t count, loff_t *ppos)
3402{
ccfe9e42 3403 struct trace_array *tr = file_inode(filp)->i_private;
36dfe925 3404 int len;
c7078de1
IM
3405
3406 mutex_lock(&tracing_cpumask_update_lock);
36dfe925 3407
1a40243b
TH
3408 len = snprintf(mask_str, count, "%*pb\n",
3409 cpumask_pr_args(tr->tracing_cpumask));
3410 if (len >= count) {
36dfe925
IM
3411 count = -EINVAL;
3412 goto out_err;
3413 }
36dfe925
IM
3414 count = simple_read_from_buffer(ubuf, count, ppos, mask_str, NR_CPUS+1);
3415
3416out_err:
c7078de1
IM
3417 mutex_unlock(&tracing_cpumask_update_lock);
3418
3419 return count;
3420}
3421
3422static ssize_t
3423tracing_cpumask_write(struct file *filp, const char __user *ubuf,
3424 size_t count, loff_t *ppos)
3425{
ccfe9e42 3426 struct trace_array *tr = file_inode(filp)->i_private;
9e01c1b7 3427 cpumask_var_t tracing_cpumask_new;
2b6080f2 3428 int err, cpu;
9e01c1b7
RR
3429
3430 if (!alloc_cpumask_var(&tracing_cpumask_new, GFP_KERNEL))
3431 return -ENOMEM;
c7078de1 3432
9e01c1b7 3433 err = cpumask_parse_user(ubuf, count, tracing_cpumask_new);
c7078de1 3434 if (err)
36dfe925
IM
3435 goto err_unlock;
3436
215368e8
LZ
3437 mutex_lock(&tracing_cpumask_update_lock);
3438
a5e25883 3439 local_irq_disable();
0b9b12c1 3440 arch_spin_lock(&tr->max_lock);
ab46428c 3441 for_each_tracing_cpu(cpu) {
36dfe925
IM
3442 /*
3443 * Increase/decrease the disabled counter if we are
3444 * about to flip a bit in the cpumask:
3445 */
ccfe9e42 3446 if (cpumask_test_cpu(cpu, tr->tracing_cpumask) &&
9e01c1b7 3447 !cpumask_test_cpu(cpu, tracing_cpumask_new)) {
12883efb
SRRH
3448 atomic_inc(&per_cpu_ptr(tr->trace_buffer.data, cpu)->disabled);
3449 ring_buffer_record_disable_cpu(tr->trace_buffer.buffer, cpu);
36dfe925 3450 }
ccfe9e42 3451 if (!cpumask_test_cpu(cpu, tr->tracing_cpumask) &&
9e01c1b7 3452 cpumask_test_cpu(cpu, tracing_cpumask_new)) {
12883efb
SRRH
3453 atomic_dec(&per_cpu_ptr(tr->trace_buffer.data, cpu)->disabled);
3454 ring_buffer_record_enable_cpu(tr->trace_buffer.buffer, cpu);
36dfe925
IM
3455 }
3456 }
0b9b12c1 3457 arch_spin_unlock(&tr->max_lock);
a5e25883 3458 local_irq_enable();
36dfe925 3459
ccfe9e42 3460 cpumask_copy(tr->tracing_cpumask, tracing_cpumask_new);
36dfe925
IM
3461
3462 mutex_unlock(&tracing_cpumask_update_lock);
9e01c1b7 3463 free_cpumask_var(tracing_cpumask_new);
c7078de1
IM
3464
3465 return count;
36dfe925
IM
3466
3467err_unlock:
215368e8 3468 free_cpumask_var(tracing_cpumask_new);
36dfe925
IM
3469
3470 return err;
c7078de1
IM
3471}
3472
5e2336a0 3473static const struct file_operations tracing_cpumask_fops = {
ccfe9e42 3474 .open = tracing_open_generic_tr,
c7078de1
IM
3475 .read = tracing_cpumask_read,
3476 .write = tracing_cpumask_write,
ccfe9e42 3477 .release = tracing_release_generic_tr,
b444786f 3478 .llseek = generic_file_llseek,
bc0c38d1
SR
3479};
3480
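/*
 * Example (a user-space sketch; the debugfs path is the conventional
 * mount point and may differ on a given system): writing the file
 * parsed by tracing_cpumask_write() above. The format is the usual
 * hex cpumask; "5" selects CPUs 0 and 2.
 */
#include <fcntl.h>
#include <unistd.h>

static void example_set_tracing_cpus(void)
{
	int fd = open("/sys/kernel/debug/tracing/tracing_cpumask", O_WRONLY);

	if (fd >= 0) {
		write(fd, "5", 1);	/* trace only CPUs 0 and 2 */
		close(fd);
	}
}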
fdb372ed 3481static int tracing_trace_options_show(struct seq_file *m, void *v)
bc0c38d1 3482{
d8e83d26 3483 struct tracer_opt *trace_opts;
2b6080f2 3484 struct trace_array *tr = m->private;
d8e83d26 3485 u32 tracer_flags;
d8e83d26 3486 int i;
adf9f195 3487
d8e83d26 3488 mutex_lock(&trace_types_lock);
2b6080f2
SR
3489 tracer_flags = tr->current_trace->flags->val;
3490 trace_opts = tr->current_trace->flags->opts;
d8e83d26 3491
bc0c38d1 3492 for (i = 0; trace_options[i]; i++) {
983f938a 3493 if (tr->trace_flags & (1 << i))
fdb372ed 3494 seq_printf(m, "%s\n", trace_options[i]);
bc0c38d1 3495 else
fdb372ed 3496 seq_printf(m, "no%s\n", trace_options[i]);
bc0c38d1
SR
3497 }
3498
adf9f195
FW
3499 for (i = 0; trace_opts[i].name; i++) {
3500 if (tracer_flags & trace_opts[i].bit)
fdb372ed 3501 seq_printf(m, "%s\n", trace_opts[i].name);
adf9f195 3502 else
fdb372ed 3503 seq_printf(m, "no%s\n", trace_opts[i].name);
adf9f195 3504 }
d8e83d26 3505 mutex_unlock(&trace_types_lock);
adf9f195 3506
fdb372ed 3507 return 0;
bc0c38d1 3508}
bc0c38d1 3509
8c1a49ae 3510static int __set_tracer_option(struct trace_array *tr,
8d18eaaf
LZ
3511 struct tracer_flags *tracer_flags,
3512 struct tracer_opt *opts, int neg)
3513{
d39cdd20 3514 struct tracer *trace = tracer_flags->trace;
8d18eaaf 3515 int ret;
bc0c38d1 3516
8c1a49ae 3517 ret = trace->set_flag(tr, tracer_flags->val, opts->bit, !neg);
8d18eaaf
LZ
3518 if (ret)
3519 return ret;
3520
3521 if (neg)
3522 tracer_flags->val &= ~opts->bit;
3523 else
3524 tracer_flags->val |= opts->bit;
3525 return 0;
bc0c38d1
SR
3526}
3527
adf9f195 3528/* Try to assign a tracer specific option */
8c1a49ae 3529static int set_tracer_option(struct trace_array *tr, char *cmp, int neg)
adf9f195 3530{
8c1a49ae 3531 struct tracer *trace = tr->current_trace;
7770841e 3532 struct tracer_flags *tracer_flags = trace->flags;
adf9f195 3533 struct tracer_opt *opts = NULL;
8d18eaaf 3534 int i;
adf9f195 3535
7770841e
Z
3536 for (i = 0; tracer_flags->opts[i].name; i++) {
3537 opts = &tracer_flags->opts[i];
adf9f195 3538
8d18eaaf 3539 if (strcmp(cmp, opts->name) == 0)
8c1a49ae 3540 return __set_tracer_option(tr, trace->flags, opts, neg);
adf9f195 3541 }
adf9f195 3542
8d18eaaf 3543 return -EINVAL;
adf9f195
FW
3544}
3545
613f04a0
SRRH
3546/* Some tracers require overwrite to stay enabled */
3547int trace_keep_overwrite(struct tracer *tracer, u32 mask, int set)
3548{
3549 if (tracer->enabled && (mask & TRACE_ITER_OVERWRITE) && !set)
3550 return -1;
3551
3552 return 0;
3553}
3554
2b6080f2 3555int set_tracer_flag(struct trace_array *tr, unsigned int mask, int enabled)
af4617bd
SR
3556{
3557 /* do nothing if flag is already set */
983f938a 3558 if (!!(tr->trace_flags & mask) == !!enabled)
613f04a0
SRRH
3559 return 0;
3560
3561 /* Give the tracer a chance to approve the change */
2b6080f2 3562 if (tr->current_trace->flag_changed)
bf6065b5 3563 if (tr->current_trace->flag_changed(tr, mask, !!enabled))
613f04a0 3564 return -EINVAL;
af4617bd
SR
3565
3566 if (enabled)
983f938a 3567 tr->trace_flags |= mask;
af4617bd 3568 else
983f938a 3569 tr->trace_flags &= ~mask;
e870e9a1
LZ
3570
3571 if (mask == TRACE_ITER_RECORD_CMD)
3572 trace_event_enable_cmd_record(enabled);
750912fa 3573
c37775d5
SR
3574 if (mask == TRACE_ITER_EVENT_FORK)
3575 trace_event_follow_fork(tr, enabled);
3576
80902822 3577 if (mask == TRACE_ITER_OVERWRITE) {
12883efb 3578 ring_buffer_change_overwrite(tr->trace_buffer.buffer, enabled);
80902822 3579#ifdef CONFIG_TRACER_MAX_TRACE
12883efb 3580 ring_buffer_change_overwrite(tr->max_buffer.buffer, enabled);
80902822
SRRH
3581#endif
3582 }
81698831 3583
b9f9108c 3584 if (mask == TRACE_ITER_PRINTK) {
81698831 3585 trace_printk_start_stop_comm(enabled);
b9f9108c
SRRH
3586 trace_printk_control(enabled);
3587 }
613f04a0
SRRH
3588
3589 return 0;
af4617bd
SR
3590}
3591
2b6080f2 3592static int trace_set_options(struct trace_array *tr, char *option)
bc0c38d1 3593{
8d18eaaf 3594 char *cmp;
bc0c38d1 3595 int neg = 0;
613f04a0 3596 int ret = -ENODEV;
bc0c38d1 3597 int i;
a4d1e688 3598 size_t orig_len = strlen(option);
bc0c38d1 3599
7bcfaf54 3600 cmp = strstrip(option);
bc0c38d1 3601
8d18eaaf 3602 if (strncmp(cmp, "no", 2) == 0) {
bc0c38d1
SR
3603 neg = 1;
3604 cmp += 2;
3605 }
3606
69d34da2
SRRH
3607 mutex_lock(&trace_types_lock);
3608
bc0c38d1 3609 for (i = 0; trace_options[i]; i++) {
8d18eaaf 3610 if (strcmp(cmp, trace_options[i]) == 0) {
2b6080f2 3611 ret = set_tracer_flag(tr, 1 << i, !neg);
bc0c38d1
SR
3612 break;
3613 }
3614 }
adf9f195
FW
3615
3616 /* If no option could be set, test the specific tracer options */
69d34da2 3617 if (!trace_options[i])
8c1a49ae 3618 ret = set_tracer_option(tr, cmp, neg);
69d34da2
SRRH
3619
3620 mutex_unlock(&trace_types_lock);
bc0c38d1 3621
a4d1e688
JW
3622 /*
3623 * If the first trailing whitespace is replaced with '\0' by strstrip,
3624 * turn it back into a space.
3625 */
3626 if (orig_len > strlen(option))
3627 option[strlen(option)] = ' ';
3628
7bcfaf54
SR
3629 return ret;
3630}
3631
a4d1e688
JW
3632static void __init apply_trace_boot_options(void)
3633{
3634 char *buf = trace_boot_options_buf;
3635 char *option;
3636
3637 while (true) {
3638 option = strsep(&buf, ",");
3639
3640 if (!option)
3641 break;
a4d1e688 3642
43ed3843
SRRH
3643 if (*option)
3644 trace_set_options(&global_trace, option);
a4d1e688
JW
3645
3646 /* Put back the comma to allow this to be called again */
3647 if (buf)
3648 *(buf - 1) = ',';
3649 }
3650}
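/*
 * A minimal sketch of the boot-time usage: trace_boot_options_buf is
 * filled from the "trace_options=" kernel command line parameter, so
 * booting with
 *
 *	trace_options=stacktrace,sym-addr
 *
 * makes the loop above hand "stacktrace" and "sym-addr" to
 * trace_set_options() one token at a time.
 */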
3651
7bcfaf54
SR
3652static ssize_t
3653tracing_trace_options_write(struct file *filp, const char __user *ubuf,
3654 size_t cnt, loff_t *ppos)
3655{
2b6080f2
SR
3656 struct seq_file *m = filp->private_data;
3657 struct trace_array *tr = m->private;
7bcfaf54 3658 char buf[64];
613f04a0 3659 int ret;
7bcfaf54
SR
3660
3661 if (cnt >= sizeof(buf))
3662 return -EINVAL;
3663
3664 if (copy_from_user(&buf, ubuf, cnt))
3665 return -EFAULT;
3666
a8dd2176
SR
3667 buf[cnt] = 0;
3668
2b6080f2 3669 ret = trace_set_options(tr, buf);
613f04a0
SRRH
3670 if (ret < 0)
3671 return ret;
7bcfaf54 3672
cf8517cf 3673 *ppos += cnt;
bc0c38d1
SR
3674
3675 return cnt;
3676}
3677
fdb372ed
LZ
3678static int tracing_trace_options_open(struct inode *inode, struct file *file)
3679{
7b85af63 3680 struct trace_array *tr = inode->i_private;
f77d09a3 3681 int ret;
7b85af63 3682
fdb372ed
LZ
3683 if (tracing_disabled)
3684 return -ENODEV;
2b6080f2 3685
7b85af63
SRRH
3686 if (trace_array_get(tr) < 0)
3687 return -ENODEV;
3688
f77d09a3
AL
3689 ret = single_open(file, tracing_trace_options_show, inode->i_private);
3690 if (ret < 0)
3691 trace_array_put(tr);
3692
3693 return ret;
fdb372ed
LZ
3694}
3695
5e2336a0 3696static const struct file_operations tracing_iter_fops = {
fdb372ed
LZ
3697 .open = tracing_trace_options_open,
3698 .read = seq_read,
3699 .llseek = seq_lseek,
7b85af63 3700 .release = tracing_single_release_tr,
ee6bce52 3701 .write = tracing_trace_options_write,
bc0c38d1
SR
3702};
3703
7bd2f24c
IM
3704static const char readme_msg[] =
3705 "tracing mini-HOWTO:\n\n"
22f45649
SRRH
3706 "# echo 0 > tracing_on : quick way to disable tracing\n"
3707 "# echo 1 > tracing_on : quick way to re-enable tracing\n\n"
3708 " Important files:\n"
3709 " trace\t\t\t- The static contents of the buffer\n"
3710 "\t\t\t To clear the buffer write into this file: echo > trace\n"
3711 " trace_pipe\t\t- A consuming read to see the contents of the buffer\n"
3712 " current_tracer\t- function and latency tracers\n"
3713 " available_tracers\t- list of configured tracers for current_tracer\n"
3714 " buffer_size_kb\t- view and modify size of per cpu buffer\n"
3715 " buffer_total_size_kb - view total size of all cpu buffers\n\n"
3716 " trace_clock\t\t-change the clock used to order events\n"
3717 " local: Per cpu clock but may not be synced across CPUs\n"
3718 " global: Synced across CPUs but slows tracing down.\n"
3719 " counter: Not a clock, but just an increment\n"
3720 " uptime: Jiffy counter from time of boot\n"
3721 " perf: Same clock that perf events use\n"
3722#ifdef CONFIG_X86_64
3723 " x86-tsc: TSC cycle counter\n"
3724#endif
3725 "\n trace_marker\t\t- Writes into this file writes into the kernel buffer\n"
3726 " tracing_cpumask\t- Limit which CPUs to trace\n"
3727 " instances\t\t- Make sub-buffers with: mkdir instances/foo\n"
3728 "\t\t\t Remove sub-buffer with rmdir\n"
3729 " trace_options\t\t- Set format or modify how tracing happens\n"
71485c45
SRRH
3730 "\t\t\t Disable an option by adding a suffix 'no' to the\n"
3731 "\t\t\t option name\n"
939c7a4f 3732 " saved_cmdlines_size\t- echo command number in here to store comm-pid list\n"
22f45649
SRRH
3733#ifdef CONFIG_DYNAMIC_FTRACE
3734 "\n available_filter_functions - list of functions that can be filtered on\n"
71485c45
SRRH
3735 " set_ftrace_filter\t- echo function name in here to only trace these\n"
3736 "\t\t\t functions\n"
3737 "\t accepts: func_full_name, *func_end, func_begin*, *func_middle*\n"
3738 "\t modules: Can select a group via module\n"
3739 "\t Format: :mod:<module-name>\n"
3740 "\t example: echo :mod:ext3 > set_ftrace_filter\n"
3741 "\t triggers: a command to perform when function is hit\n"
3742 "\t Format: <function>:<trigger>[:count]\n"
3743 "\t trigger: traceon, traceoff\n"
3744 "\t\t enable_event:<system>:<event>\n"
3745 "\t\t disable_event:<system>:<event>\n"
22f45649 3746#ifdef CONFIG_STACKTRACE
71485c45 3747 "\t\t stacktrace\n"
22f45649
SRRH
3748#endif
3749#ifdef CONFIG_TRACER_SNAPSHOT
71485c45 3750 "\t\t snapshot\n"
22f45649 3751#endif
17a280ea
SRRH
3752 "\t\t dump\n"
3753 "\t\t cpudump\n"
71485c45
SRRH
3754 "\t example: echo do_fault:traceoff > set_ftrace_filter\n"
3755 "\t echo do_trap:traceoff:3 > set_ftrace_filter\n"
3756 "\t The first one will disable tracing every time do_fault is hit\n"
3757 "\t The second will disable tracing at most 3 times when do_trap is hit\n"
3758 "\t The first time do trap is hit and it disables tracing, the\n"
3759 "\t counter will decrement to 2. If tracing is already disabled,\n"
3760 "\t the counter will not decrement. It only decrements when the\n"
3761 "\t trigger did work\n"
3762 "\t To remove trigger without count:\n"
3763 "\t echo '!<function>:<trigger> > set_ftrace_filter\n"
3764 "\t To remove trigger with a count:\n"
3765 "\t echo '!<function>:<trigger>:0 > set_ftrace_filter\n"
22f45649 3766 " set_ftrace_notrace\t- echo function name in here to never trace.\n"
71485c45
SRRH
3767 "\t accepts: func_full_name, *func_end, func_begin*, *func_middle*\n"
3768 "\t modules: Can select a group via module command :mod:\n"
3769 "\t Does not accept triggers\n"
22f45649
SRRH
3770#endif /* CONFIG_DYNAMIC_FTRACE */
3771#ifdef CONFIG_FUNCTION_TRACER
71485c45
SRRH
3772 " set_ftrace_pid\t- Write pid(s) to only function trace those pids\n"
3773 "\t\t (function)\n"
22f45649
SRRH
3774#endif
3775#ifdef CONFIG_FUNCTION_GRAPH_TRACER
3776 " set_graph_function\t- Trace the nested calls of a function (function_graph)\n"
d048a8c7 3777 " set_graph_notrace\t- Do not trace the nested calls of a function (function_graph)\n"
22f45649
SRRH
3778 " max_graph_depth\t- Trace a limited depth of nested calls (0 is unlimited)\n"
3779#endif
3780#ifdef CONFIG_TRACER_SNAPSHOT
71485c45
SRRH
3781 "\n snapshot\t\t- Like 'trace' but shows the content of the static\n"
3782 "\t\t\t snapshot buffer. Read the contents for more\n"
3783 "\t\t\t information\n"
22f45649 3784#endif
991821c8 3785#ifdef CONFIG_STACK_TRACER
22f45649
SRRH
3786 " stack_trace\t\t- Shows the max stack trace when active\n"
3787 " stack_max_size\t- Shows current max stack size that was traced\n"
71485c45
SRRH
3788 "\t\t\t Write into this file to reset the max size (trigger a\n"
3789 "\t\t\t new trace)\n"
22f45649 3790#ifdef CONFIG_DYNAMIC_FTRACE
71485c45
SRRH
3791 " stack_trace_filter\t- Like set_ftrace_filter but limits what stack_trace\n"
3792 "\t\t\t traces\n"
22f45649 3793#endif
991821c8 3794#endif /* CONFIG_STACK_TRACER */
26f25564
TZ
3795 " events/\t\t- Directory containing all trace event subsystems:\n"
3796 " enable\t\t- Write 0/1 to enable/disable tracing of all events\n"
3797 " events/<system>/\t- Directory containing all trace events for <system>:\n"
71485c45
SRRH
3798 " enable\t\t- Write 0/1 to enable/disable tracing of all <system>\n"
3799 "\t\t\t events\n"
26f25564 3800 " filter\t\t- If set, only events passing filter are traced\n"
71485c45
SRRH
3801 " events/<system>/<event>/\t- Directory containing control files for\n"
3802 "\t\t\t <event>:\n"
26f25564
TZ
3803 " enable\t\t- Write 0/1 to enable/disable tracing of <event>\n"
3804 " filter\t\t- If set, only events passing filter are traced\n"
3805 " trigger\t\t- If set, a command to perform when event is hit\n"
71485c45
SRRH
3806 "\t Format: <trigger>[:count][if <filter>]\n"
3807 "\t trigger: traceon, traceoff\n"
3808 "\t enable_event:<system>:<event>\n"
3809 "\t disable_event:<system>:<event>\n"
26f25564 3810#ifdef CONFIG_STACKTRACE
71485c45 3811 "\t\t stacktrace\n"
26f25564
TZ
3812#endif
3813#ifdef CONFIG_TRACER_SNAPSHOT
71485c45 3814 "\t\t snapshot\n"
7ef224d1
TZ
3815#endif
3816#ifdef CONFIG_HIST_TRIGGERS
3817 "\t\t hist (see below)\n"
26f25564 3818#endif
71485c45
SRRH
3819 "\t example: echo traceoff > events/block/block_unplug/trigger\n"
3820 "\t echo traceoff:3 > events/block/block_unplug/trigger\n"
3821 "\t echo 'enable_event:kmem:kmalloc:3 if nr_rq > 1' > \\\n"
3822 "\t events/block/block_unplug/trigger\n"
3823 "\t The first disables tracing every time block_unplug is hit.\n"
3824 "\t The second disables tracing the first 3 times block_unplug is hit.\n"
3825 "\t The third enables the kmalloc event the first 3 times block_unplug\n"
3826 "\t is hit and has value of greater than 1 for the 'nr_rq' event field.\n"
3827 "\t Like function triggers, the counter is only decremented if it\n"
3828 "\t enabled or disabled tracing.\n"
3829 "\t To remove a trigger without a count:\n"
3830 "\t echo '!<trigger> > <system>/<event>/trigger\n"
3831 "\t To remove a trigger with a count:\n"
3832 "\t echo '!<trigger>:0 > <system>/<event>/trigger\n"
3833 "\t Filters can be ignored when removing a trigger.\n"
7ef224d1
TZ
3834#ifdef CONFIG_HIST_TRIGGERS
3835 " hist trigger\t- If set, event hits are aggregated into a hash table\n"
3836 "\t Format: hist:keys=<field1>\n"
f2606835 3837 "\t [:values=<field1[,field2,...]>]\n"
7ef224d1
TZ
3838 "\t [:size=#entries]\n"
3839 "\t [if <filter>]\n\n"
3840 "\t When a matching event is hit, an entry is added to a hash\n"
f2606835
TZ
3841 "\t table using the key(s) and value(s) named, and the value of a\n"
3842 "\t sum called 'hitcount' is incremented. Keys and values\n"
3843 "\t correspond to fields in the event's format description. Keys\n"
3844 "\t can be any field. Values must correspond to numeric fields.\n"
3845 "\t The 'size' parameter can be used to specify more or fewer\n"
3846 "\t than the default 2048 entries for the hashtable size.\n\n"
7ef224d1
TZ
3847 "\t Reading the 'hist' file for the event will dump the hash\n"
3848 "\t table in its entirety to stdout."
3849#endif
7bd2f24c
IM
3850;
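/*
 * A minimal hist trigger sketch using multiple values, the feature named
 * in this page's commit subject ('vals=' is accepted as shorthand for
 * 'values='); the field names assume the kmem:kmalloc event format:
 *
 *	# echo 'hist:keys=call_site:vals=bytes_req,bytes_alloc' > \
 *		events/kmem/kmalloc/trigger
 *	# cat events/kmem/kmalloc/hist
 */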
3851
3852static ssize_t
3853tracing_readme_read(struct file *filp, char __user *ubuf,
3854 size_t cnt, loff_t *ppos)
3855{
3856 return simple_read_from_buffer(ubuf, cnt, ppos,
3857 readme_msg, strlen(readme_msg));
3858}
3859
5e2336a0 3860static const struct file_operations tracing_readme_fops = {
c7078de1
IM
3861 .open = tracing_open_generic,
3862 .read = tracing_readme_read,
b444786f 3863 .llseek = generic_file_llseek,
7bd2f24c
IM
3864};
3865
42584c81
YY
3866static void *saved_cmdlines_next(struct seq_file *m, void *v, loff_t *pos)
3867{
3868 unsigned int *ptr = v;
69abe6a5 3869
42584c81
YY
3870 if (*pos || m->count)
3871 ptr++;
69abe6a5 3872
42584c81 3873 (*pos)++;
69abe6a5 3874
939c7a4f
YY
3875 for (; ptr < &savedcmd->map_cmdline_to_pid[savedcmd->cmdline_num];
3876 ptr++) {
42584c81
YY
3877 if (*ptr == -1 || *ptr == NO_CMDLINE_MAP)
3878 continue;
69abe6a5 3879
42584c81
YY
3880 return ptr;
3881 }
69abe6a5 3882
42584c81
YY
3883 return NULL;
3884}
3885
3886static void *saved_cmdlines_start(struct seq_file *m, loff_t *pos)
3887{
3888 void *v;
3889 loff_t l = 0;
69abe6a5 3890
4c27e756
SRRH
3891 preempt_disable();
3892 arch_spin_lock(&trace_cmdline_lock);
3893
939c7a4f 3894 v = &savedcmd->map_cmdline_to_pid[0];
42584c81
YY
3895 while (l <= *pos) {
3896 v = saved_cmdlines_next(m, v, &l);
3897 if (!v)
3898 return NULL;
69abe6a5
AP
3899 }
3900
42584c81
YY
3901 return v;
3902}
3903
3904static void saved_cmdlines_stop(struct seq_file *m, void *v)
3905{
4c27e756
SRRH
3906 arch_spin_unlock(&trace_cmdline_lock);
3907 preempt_enable();
42584c81 3908}
69abe6a5 3909
42584c81
YY
3910static int saved_cmdlines_show(struct seq_file *m, void *v)
3911{
3912 char buf[TASK_COMM_LEN];
3913 unsigned int *pid = v;
69abe6a5 3914
4c27e756 3915 __trace_find_cmdline(*pid, buf);
42584c81
YY
3916 seq_printf(m, "%d %s\n", *pid, buf);
3917 return 0;
3918}
3919
3920static const struct seq_operations tracing_saved_cmdlines_seq_ops = {
3921 .start = saved_cmdlines_start,
3922 .next = saved_cmdlines_next,
3923 .stop = saved_cmdlines_stop,
3924 .show = saved_cmdlines_show,
3925};
3926
3927static int tracing_saved_cmdlines_open(struct inode *inode, struct file *filp)
3928{
3929 if (tracing_disabled)
3930 return -ENODEV;
3931
3932 return seq_open(filp, &tracing_saved_cmdlines_seq_ops);
69abe6a5
AP
3933}
3934
3935static const struct file_operations tracing_saved_cmdlines_fops = {
42584c81
YY
3936 .open = tracing_saved_cmdlines_open,
3937 .read = seq_read,
3938 .llseek = seq_lseek,
3939 .release = seq_release,
69abe6a5
AP
3940};
3941
939c7a4f
YY
3942static ssize_t
3943tracing_saved_cmdlines_size_read(struct file *filp, char __user *ubuf,
3944 size_t cnt, loff_t *ppos)
3945{
3946 char buf[64];
3947 int r;
3948
3949 arch_spin_lock(&trace_cmdline_lock);
a6af8fbf 3950 r = scnprintf(buf, sizeof(buf), "%u\n", savedcmd->cmdline_num);
939c7a4f
YY
3951 arch_spin_unlock(&trace_cmdline_lock);
3952
3953 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
3954}
3955
3956static void free_saved_cmdlines_buffer(struct saved_cmdlines_buffer *s)
3957{
3958 kfree(s->saved_cmdlines);
3959 kfree(s->map_cmdline_to_pid);
3960 kfree(s);
3961}
3962
3963static int tracing_resize_saved_cmdlines(unsigned int val)
3964{
3965 struct saved_cmdlines_buffer *s, *savedcmd_temp;
3966
a6af8fbf 3967 s = kmalloc(sizeof(*s), GFP_KERNEL);
939c7a4f
YY
3968 if (!s)
3969 return -ENOMEM;
3970
3971 if (allocate_cmdlines_buffer(val, s) < 0) {
3972 kfree(s);
3973 return -ENOMEM;
3974 }
3975
3976 arch_spin_lock(&trace_cmdline_lock);
3977 savedcmd_temp = savedcmd;
3978 savedcmd = s;
3979 arch_spin_unlock(&trace_cmdline_lock);
3980 free_saved_cmdlines_buffer(savedcmd_temp);
3981
3982 return 0;
3983}
3984
3985static ssize_t
3986tracing_saved_cmdlines_size_write(struct file *filp, const char __user *ubuf,
3987 size_t cnt, loff_t *ppos)
3988{
3989 unsigned long val;
3990 int ret;
3991
3992 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
3993 if (ret)
3994 return ret;
3995
3996 /* must have at least 1 entry and at most PID_MAX_DEFAULT entries */
3997 if (!val || val > PID_MAX_DEFAULT)
3998 return -EINVAL;
3999
4000 ret = tracing_resize_saved_cmdlines((unsigned int)val);
4001 if (ret < 0)
4002 return ret;
4003
4004 *ppos += cnt;
4005
4006 return cnt;
4007}
4008
4009static const struct file_operations tracing_saved_cmdlines_size_fops = {
4010 .open = tracing_open_generic,
4011 .read = tracing_saved_cmdlines_size_read,
4012 .write = tracing_saved_cmdlines_size_write,
4013};
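/*
 * A minimal usage sketch: grow the comm-pid cache so more task names
 * resolve in the trace output, within the 1..PID_MAX_DEFAULT bounds
 * checked above:
 *
 *	# echo 2048 > saved_cmdlines_size
 */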
4014
9828413d
SRRH
4015#ifdef CONFIG_TRACE_ENUM_MAP_FILE
4016static union trace_enum_map_item *
4017update_enum_map(union trace_enum_map_item *ptr)
4018{
4019 if (!ptr->map.enum_string) {
4020 if (ptr->tail.next) {
4021 ptr = ptr->tail.next;
4022 /* Set ptr to the next real item (skip head) */
4023 ptr++;
4024 } else
4025 return NULL;
4026 }
4027 return ptr;
4028}
4029
4030static void *enum_map_next(struct seq_file *m, void *v, loff_t *pos)
4031{
4032 union trace_enum_map_item *ptr = v;
4033
4034 /*
4035 * Paranoid! If ptr points to end, we don't want to increment past it.
4036 * This really should never happen.
4037 */
4038 ptr = update_enum_map(ptr);
4039 if (WARN_ON_ONCE(!ptr))
4040 return NULL;
4041
4042 ptr++;
4043
4044 (*pos)++;
4045
4046 ptr = update_enum_map(ptr);
4047
4048 return ptr;
4049}
4050
4051static void *enum_map_start(struct seq_file *m, loff_t *pos)
4052{
4053 union trace_enum_map_item *v;
4054 loff_t l = 0;
4055
4056 mutex_lock(&trace_enum_mutex);
4057
4058 v = trace_enum_maps;
4059 if (v)
4060 v++;
4061
4062 while (v && l < *pos) {
4063 v = enum_map_next(m, v, &l);
4064 }
4065
4066 return v;
4067}
4068
4069static void enum_map_stop(struct seq_file *m, void *v)
4070{
4071 mutex_unlock(&trace_enum_mutex);
4072}
4073
4074static int enum_map_show(struct seq_file *m, void *v)
4075{
4076 union trace_enum_map_item *ptr = v;
4077
4078 seq_printf(m, "%s %ld (%s)\n",
4079 ptr->map.enum_string, ptr->map.enum_value,
4080 ptr->map.system);
4081
4082 return 0;
4083}
4084
4085static const struct seq_operations tracing_enum_map_seq_ops = {
4086 .start = enum_map_start,
4087 .next = enum_map_next,
4088 .stop = enum_map_stop,
4089 .show = enum_map_show,
4090};
4091
4092static int tracing_enum_map_open(struct inode *inode, struct file *filp)
4093{
4094 if (tracing_disabled)
4095 return -ENODEV;
4096
4097 return seq_open(filp, &tracing_enum_map_seq_ops);
4098}
4099
4100static const struct file_operations tracing_enum_map_fops = {
4101 .open = tracing_enum_map_open,
4102 .read = seq_read,
4103 .llseek = seq_lseek,
4104 .release = seq_release,
4105};
4106
4107static inline union trace_enum_map_item *
4108trace_enum_jmp_to_tail(union trace_enum_map_item *ptr)
4109{
4110 /* Return tail of array given the head */
4111 return ptr + ptr->head.length + 1;
4112}
4113
4114static void
4115trace_insert_enum_map_file(struct module *mod, struct trace_enum_map **start,
4116 int len)
4117{
4118 struct trace_enum_map **stop;
4119 struct trace_enum_map **map;
4120 union trace_enum_map_item *map_array;
4121 union trace_enum_map_item *ptr;
4122
4123 stop = start + len;
4124
4125 /*
4126 * The trace_enum_maps contains the map plus a head and tail item,
4127 * where the head holds the module and length of array, and the
4128 * tail holds a pointer to the next list.
4129 */
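	/*
	 * A sketch of the resulting layout (illustrative only):
	 *
	 *	map_array: [ head | map 0 | map 1 | ... | map len-1 | tail ]
	 *	             .mod    one trace_enum_map               .next is
	 *	             .length copied per entry                 NULL or the
	 *	                                                      next array
	 */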
4130 map_array = kmalloc(sizeof(*map_array) * (len + 2), GFP_KERNEL);
4131 if (!map_array) {
a395d6a7 4132 pr_warn("Unable to allocate trace enum mapping\n");
9828413d
SRRH
4133 return;
4134 }
4135
4136 mutex_lock(&trace_enum_mutex);
4137
4138 if (!trace_enum_maps)
4139 trace_enum_maps = map_array;
4140 else {
4141 ptr = trace_enum_maps;
4142 for (;;) {
4143 ptr = trace_enum_jmp_to_tail(ptr);
4144 if (!ptr->tail.next)
4145 break;
4146 ptr = ptr->tail.next;
4147
4148 }
4149 ptr->tail.next = map_array;
4150 }
4151 map_array->head.mod = mod;
4152 map_array->head.length = len;
4153 map_array++;
4154
4155 for (map = start; (unsigned long)map < (unsigned long)stop; map++) {
4156 map_array->map = **map;
4157 map_array++;
4158 }
4159 memset(map_array, 0, sizeof(*map_array));
4160
4161 mutex_unlock(&trace_enum_mutex);
4162}
4163
4164static void trace_create_enum_file(struct dentry *d_tracer)
4165{
4166 trace_create_file("enum_map", 0444, d_tracer,
4167 NULL, &tracing_enum_map_fops);
4168}
4169
4170#else /* CONFIG_TRACE_ENUM_MAP_FILE */
4171static inline void trace_create_enum_file(struct dentry *d_tracer) { }
4172static inline void trace_insert_enum_map_file(struct module *mod,
4173 struct trace_enum_map **start, int len) { }
4174#endif /* !CONFIG_TRACE_ENUM_MAP_FILE */
4175
4176static void trace_insert_enum_map(struct module *mod,
4177 struct trace_enum_map **start, int len)
0c564a53
SRRH
4178{
4179 struct trace_enum_map **map;
0c564a53
SRRH
4180
4181 if (len <= 0)
4182 return;
4183
4184 map = start;
4185
4186 trace_event_enum_update(map, len);
9828413d
SRRH
4187
4188 trace_insert_enum_map_file(mod, start, len);
0c564a53
SRRH
4189}
4190
bc0c38d1
SR
4191static ssize_t
4192tracing_set_trace_read(struct file *filp, char __user *ubuf,
4193 size_t cnt, loff_t *ppos)
4194{
2b6080f2 4195 struct trace_array *tr = filp->private_data;
ee6c2c1b 4196 char buf[MAX_TRACER_SIZE+2];
bc0c38d1
SR
4197 int r;
4198
4199 mutex_lock(&trace_types_lock);
2b6080f2 4200 r = sprintf(buf, "%s\n", tr->current_trace->name);
bc0c38d1
SR
4201 mutex_unlock(&trace_types_lock);
4202
4bf39a94 4203 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
bc0c38d1
SR
4204}
4205
b6f11df2
ACM
4206int tracer_init(struct tracer *t, struct trace_array *tr)
4207{
12883efb 4208 tracing_reset_online_cpus(&tr->trace_buffer);
b6f11df2
ACM
4209 return t->init(tr);
4210}
4211
12883efb 4212static void set_buffer_entries(struct trace_buffer *buf, unsigned long val)
438ced17
VN
4213{
4214 int cpu;
737223fb 4215
438ced17 4216 for_each_tracing_cpu(cpu)
12883efb 4217 per_cpu_ptr(buf->data, cpu)->entries = val;
438ced17
VN
4218}
4219
12883efb 4220#ifdef CONFIG_TRACER_MAX_TRACE
d60da506 4221/* resize @tr's buffer to the size of @size_tr's entries */
12883efb
SRRH
4222static int resize_buffer_duplicate_size(struct trace_buffer *trace_buf,
4223 struct trace_buffer *size_buf, int cpu_id)
d60da506
HT
4224{
4225 int cpu, ret = 0;
4226
4227 if (cpu_id == RING_BUFFER_ALL_CPUS) {
4228 for_each_tracing_cpu(cpu) {
12883efb
SRRH
4229 ret = ring_buffer_resize(trace_buf->buffer,
4230 per_cpu_ptr(size_buf->data, cpu)->entries, cpu);
d60da506
HT
4231 if (ret < 0)
4232 break;
12883efb
SRRH
4233 per_cpu_ptr(trace_buf->data, cpu)->entries =
4234 per_cpu_ptr(size_buf->data, cpu)->entries;
d60da506
HT
4235 }
4236 } else {
12883efb
SRRH
4237 ret = ring_buffer_resize(trace_buf->buffer,
4238 per_cpu_ptr(size_buf->data, cpu_id)->entries, cpu_id);
d60da506 4239 if (ret == 0)
12883efb
SRRH
4240 per_cpu_ptr(trace_buf->data, cpu_id)->entries =
4241 per_cpu_ptr(size_buf->data, cpu_id)->entries;
d60da506
HT
4242 }
4243
4244 return ret;
4245}
12883efb 4246#endif /* CONFIG_TRACER_MAX_TRACE */
d60da506 4247
2b6080f2
SR
4248static int __tracing_resize_ring_buffer(struct trace_array *tr,
4249 unsigned long size, int cpu)
73c5162a
SR
4250{
4251 int ret;
4252
4253 /*
4254 * If kernel or user changes the size of the ring buffer
a123c52b
SR
4255 * we use the size that was given, and we can forget about
4256 * expanding it later.
73c5162a 4257 */
55034cd6 4258 ring_buffer_expanded = true;
73c5162a 4259
b382ede6 4260 /* May be called before buffers are initialized */
12883efb 4261 if (!tr->trace_buffer.buffer)
b382ede6
SR
4262 return 0;
4263
12883efb 4264 ret = ring_buffer_resize(tr->trace_buffer.buffer, size, cpu);
73c5162a
SR
4265 if (ret < 0)
4266 return ret;
4267
12883efb 4268#ifdef CONFIG_TRACER_MAX_TRACE
2b6080f2
SR
4269 if (!(tr->flags & TRACE_ARRAY_FL_GLOBAL) ||
4270 !tr->current_trace->use_max_tr)
ef710e10
KM
4271 goto out;
4272
12883efb 4273 ret = ring_buffer_resize(tr->max_buffer.buffer, size, cpu);
73c5162a 4274 if (ret < 0) {
12883efb
SRRH
4275 int r = resize_buffer_duplicate_size(&tr->trace_buffer,
4276 &tr->trace_buffer, cpu);
73c5162a 4277 if (r < 0) {
a123c52b
SR
4278 /*
4279 * AARGH! We are left with different
4280 * size max buffer!!!!
4281 * The max buffer is our "snapshot" buffer.
4282 * When a tracer needs a snapshot (one of the
4283 * latency tracers), it swaps the max buffer
4284 * with the saved snapshot. We succeeded in updating
4285 * the size of the main buffer, but failed to
4286 * update the size of the max buffer. But when we tried
4287 * to reset the main buffer to the original size, we
4288 * failed there too. This is very unlikely to
4289 * happen, but if it does, warn and kill all
4290 * tracing.
4291 */
73c5162a
SR
4292 WARN_ON(1);
4293 tracing_disabled = 1;
4294 }
4295 return ret;
4296 }
4297
438ced17 4298 if (cpu == RING_BUFFER_ALL_CPUS)
12883efb 4299 set_buffer_entries(&tr->max_buffer, size);
438ced17 4300 else
12883efb 4301 per_cpu_ptr(tr->max_buffer.data, cpu)->entries = size;
438ced17 4302
ef710e10 4303 out:
12883efb
SRRH
4304#endif /* CONFIG_TRACER_MAX_TRACE */
4305
438ced17 4306 if (cpu == RING_BUFFER_ALL_CPUS)
12883efb 4307 set_buffer_entries(&tr->trace_buffer, size);
438ced17 4308 else
12883efb 4309 per_cpu_ptr(tr->trace_buffer.data, cpu)->entries = size;
73c5162a
SR
4310
4311 return ret;
4312}
4313
2b6080f2
SR
4314static ssize_t tracing_resize_ring_buffer(struct trace_array *tr,
4315 unsigned long size, int cpu_id)
4f271a2a 4316{
83f40318 4317 int ret = size;
4f271a2a
VN
4318
4319 mutex_lock(&trace_types_lock);
4320
438ced17
VN
4321 if (cpu_id != RING_BUFFER_ALL_CPUS) {
4322 /* make sure, this cpu is enabled in the mask */
4323 if (!cpumask_test_cpu(cpu_id, tracing_buffer_mask)) {
4324 ret = -EINVAL;
4325 goto out;
4326 }
4327 }
4f271a2a 4328
2b6080f2 4329 ret = __tracing_resize_ring_buffer(tr, size, cpu_id);
4f271a2a
VN
4330 if (ret < 0)
4331 ret = -ENOMEM;
4332
438ced17 4333out:
4f271a2a
VN
4334 mutex_unlock(&trace_types_lock);
4335
4336 return ret;
4337}
4338
ef710e10 4339
1852fcce
SR
4340/**
4341 * tracing_update_buffers - used by tracing facility to expand ring buffers
4342 *
4343 * To save memory when tracing is configured in but never used,
4344 * the ring buffers are set to a minimum size. Once a user starts
4345 * to use the tracing facility, the buffers need to grow to their
4346 * default size.
4347 *
4348 * This function is to be called when a tracer is about to be used.
4349 */
4350int tracing_update_buffers(void)
4351{
4352 int ret = 0;
4353
1027fcb2 4354 mutex_lock(&trace_types_lock);
1852fcce 4355 if (!ring_buffer_expanded)
2b6080f2 4356 ret = __tracing_resize_ring_buffer(&global_trace, trace_buf_size,
438ced17 4357 RING_BUFFER_ALL_CPUS);
1027fcb2 4358 mutex_unlock(&trace_types_lock);
1852fcce
SR
4359
4360 return ret;
4361}
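/*
 * A minimal caller sketch: this is run before anything that needs
 * full-sized buffers; tracing_snapshot_write() below, for example,
 * starts with:
 *
 *	ret = tracing_update_buffers();
 *	if (ret < 0)
 *		return ret;
 */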
4362
577b785f
SR
4363struct trace_option_dentry;
4364
37aea98b 4365static void
2b6080f2 4366create_trace_option_files(struct trace_array *tr, struct tracer *tracer);
577b785f 4367
6b450d25
SRRH
4368/*
4369 * Used to clear out the tracer before deletion of an instance.
4370 * Must have trace_types_lock held.
4371 */
4372static void tracing_set_nop(struct trace_array *tr)
4373{
4374 if (tr->current_trace == &nop_trace)
4375 return;
4376
50512ab5 4377 tr->current_trace->enabled--;
6b450d25
SRRH
4378
4379 if (tr->current_trace->reset)
4380 tr->current_trace->reset(tr);
4381
4382 tr->current_trace = &nop_trace;
4383}
4384
41d9c0be 4385static void add_tracer_options(struct trace_array *tr, struct tracer *t)
bc0c38d1 4386{
09d23a1d
SRRH
4387 /* Only enable if the directory has been created already. */
4388 if (!tr->dir)
4389 return;
4390
37aea98b 4391 create_trace_option_files(tr, t);
09d23a1d
SRRH
4392}
4393
4394static int tracing_set_tracer(struct trace_array *tr, const char *buf)
4395{
bc0c38d1 4396 struct tracer *t;
12883efb 4397#ifdef CONFIG_TRACER_MAX_TRACE
34600f0e 4398 bool had_max_tr;
12883efb 4399#endif
d9e54076 4400 int ret = 0;
bc0c38d1 4401
1027fcb2
SR
4402 mutex_lock(&trace_types_lock);
4403
73c5162a 4404 if (!ring_buffer_expanded) {
2b6080f2 4405 ret = __tracing_resize_ring_buffer(tr, trace_buf_size,
438ced17 4406 RING_BUFFER_ALL_CPUS);
73c5162a 4407 if (ret < 0)
59f586db 4408 goto out;
73c5162a
SR
4409 ret = 0;
4410 }
4411
bc0c38d1
SR
4412 for (t = trace_types; t; t = t->next) {
4413 if (strcmp(t->name, buf) == 0)
4414 break;
4415 }
c2931e05
FW
4416 if (!t) {
4417 ret = -EINVAL;
4418 goto out;
4419 }
2b6080f2 4420 if (t == tr->current_trace)
bc0c38d1
SR
4421 goto out;
4422
607e2ea1
SRRH
4423 /* Some tracers are only allowed for the top level buffer */
4424 if (!trace_ok_for_array(t, tr)) {
4425 ret = -EINVAL;
4426 goto out;
4427 }
4428
cf6ab6d9
SRRH
4429 /* If trace pipe files are being read, we can't change the tracer */
4430 if (tr->current_trace->ref) {
4431 ret = -EBUSY;
4432 goto out;
4433 }
4434
9f029e83 4435 trace_branch_disable();
613f04a0 4436
50512ab5 4437 tr->current_trace->enabled--;
613f04a0 4438
2b6080f2
SR
4439 if (tr->current_trace->reset)
4440 tr->current_trace->reset(tr);
34600f0e 4441
12883efb 4442 /* Current trace needs to be nop_trace before synchronize_sched */
2b6080f2 4443 tr->current_trace = &nop_trace;
34600f0e 4444
45ad21ca
SRRH
4445#ifdef CONFIG_TRACER_MAX_TRACE
4446 had_max_tr = tr->allocated_snapshot;
34600f0e
SR
4447
4448 if (had_max_tr && !t->use_max_tr) {
4449 /*
4450 * We need to make sure that the update_max_tr sees that
4451 * current_trace changed to nop_trace to keep it from
4452 * swapping the buffers after we resize it.
4453 * update_max_tr() is called with interrupts disabled,
4454 * so a synchronize_sched() is sufficient.
4455 */
4456 synchronize_sched();
3209cff4 4457 free_snapshot(tr);
ef710e10 4458 }
12883efb 4459#endif
12883efb
SRRH
4460
4461#ifdef CONFIG_TRACER_MAX_TRACE
34600f0e 4462 if (t->use_max_tr && !had_max_tr) {
3209cff4 4463 ret = alloc_snapshot(tr);
d60da506
HT
4464 if (ret < 0)
4465 goto out;
ef710e10 4466 }
12883efb 4467#endif
577b785f 4468
1c80025a 4469 if (t->init) {
b6f11df2 4470 ret = tracer_init(t, tr);
1c80025a
FW
4471 if (ret)
4472 goto out;
4473 }
bc0c38d1 4474
2b6080f2 4475 tr->current_trace = t;
50512ab5 4476 tr->current_trace->enabled++;
9f029e83 4477 trace_branch_enable(tr);
bc0c38d1
SR
4478 out:
4479 mutex_unlock(&trace_types_lock);
4480
d9e54076
PZ
4481 return ret;
4482}
4483
4484static ssize_t
4485tracing_set_trace_write(struct file *filp, const char __user *ubuf,
4486 size_t cnt, loff_t *ppos)
4487{
607e2ea1 4488 struct trace_array *tr = filp->private_data;
ee6c2c1b 4489 char buf[MAX_TRACER_SIZE+1];
d9e54076
PZ
4490 int i;
4491 size_t ret;
e6e7a65a
FW
4492 int err;
4493
4494 ret = cnt;
d9e54076 4495
ee6c2c1b
LZ
4496 if (cnt > MAX_TRACER_SIZE)
4497 cnt = MAX_TRACER_SIZE;
d9e54076
PZ
4498
4499 if (copy_from_user(&buf, ubuf, cnt))
4500 return -EFAULT;
4501
4502 buf[cnt] = 0;
4503
4504 /* strip trailing whitespace. */
4505 for (i = cnt - 1; i > 0 && isspace(buf[i]); i--)
4506 buf[i] = 0;
4507
607e2ea1 4508 err = tracing_set_tracer(tr, buf);
e6e7a65a
FW
4509 if (err)
4510 return err;
d9e54076 4511
cf8517cf 4512 *ppos += ret;
bc0c38d1 4513
c2931e05 4514 return ret;
bc0c38d1
SR
4515}
4516
4517static ssize_t
6508fa76
SF
4518tracing_nsecs_read(unsigned long *ptr, char __user *ubuf,
4519 size_t cnt, loff_t *ppos)
bc0c38d1 4520{
bc0c38d1
SR
4521 char buf[64];
4522 int r;
4523
cffae437 4524 r = snprintf(buf, sizeof(buf), "%ld\n",
bc0c38d1 4525 *ptr == (unsigned long)-1 ? -1 : nsecs_to_usecs(*ptr));
cffae437
SR
4526 if (r > sizeof(buf))
4527 r = sizeof(buf);
4bf39a94 4528 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
bc0c38d1
SR
4529}
4530
4531static ssize_t
6508fa76
SF
4532tracing_nsecs_write(unsigned long *ptr, const char __user *ubuf,
4533 size_t cnt, loff_t *ppos)
bc0c38d1 4534{
5e39841c 4535 unsigned long val;
c6caeeb1 4536 int ret;
bc0c38d1 4537
22fe9b54
PH
4538 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
4539 if (ret)
c6caeeb1 4540 return ret;
bc0c38d1
SR
4541
4542 *ptr = val * 1000;
4543
4544 return cnt;
4545}
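/*
 * A minimal usage sketch: values are written in microseconds and stored
 * in nanoseconds (*ptr = val * 1000 above), so
 *
 *	# echo 100 > tracing_thresh
 *
 * stores 100000, and the read side converts back with nsecs_to_usecs().
 */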
4546
6508fa76
SF
4547static ssize_t
4548tracing_thresh_read(struct file *filp, char __user *ubuf,
4549 size_t cnt, loff_t *ppos)
4550{
4551 return tracing_nsecs_read(&tracing_thresh, ubuf, cnt, ppos);
4552}
4553
4554static ssize_t
4555tracing_thresh_write(struct file *filp, const char __user *ubuf,
4556 size_t cnt, loff_t *ppos)
4557{
4558 struct trace_array *tr = filp->private_data;
4559 int ret;
4560
4561 mutex_lock(&trace_types_lock);
4562 ret = tracing_nsecs_write(&tracing_thresh, ubuf, cnt, ppos);
4563 if (ret < 0)
4564 goto out;
4565
4566 if (tr->current_trace->update_thresh) {
4567 ret = tr->current_trace->update_thresh(tr);
4568 if (ret < 0)
4569 goto out;
4570 }
4571
4572 ret = cnt;
4573out:
4574 mutex_unlock(&trace_types_lock);
4575
4576 return ret;
4577}
4578
e428abbb
CG
4579#ifdef CONFIG_TRACER_MAX_TRACE
4580
6508fa76
SF
4581static ssize_t
4582tracing_max_lat_read(struct file *filp, char __user *ubuf,
4583 size_t cnt, loff_t *ppos)
4584{
4585 return tracing_nsecs_read(filp->private_data, ubuf, cnt, ppos);
4586}
4587
4588static ssize_t
4589tracing_max_lat_write(struct file *filp, const char __user *ubuf,
4590 size_t cnt, loff_t *ppos)
4591{
4592 return tracing_nsecs_write(filp->private_data, ubuf, cnt, ppos);
4593}
4594
e428abbb
CG
4595#endif
4596
b3806b43
SR
4597static int tracing_open_pipe(struct inode *inode, struct file *filp)
4598{
15544209 4599 struct trace_array *tr = inode->i_private;
b3806b43 4600 struct trace_iterator *iter;
b04cc6b1 4601 int ret = 0;
b3806b43
SR
4602
4603 if (tracing_disabled)
4604 return -ENODEV;
4605
7b85af63
SRRH
4606 if (trace_array_get(tr) < 0)
4607 return -ENODEV;
4608
b04cc6b1
FW
4609 mutex_lock(&trace_types_lock);
4610
b3806b43
SR
4611 /* create a buffer to store the information to pass to userspace */
4612 iter = kzalloc(sizeof(*iter), GFP_KERNEL);
b04cc6b1
FW
4613 if (!iter) {
4614 ret = -ENOMEM;
f77d09a3 4615 __trace_array_put(tr);
b04cc6b1
FW
4616 goto out;
4617 }
b3806b43 4618
3a161d99 4619 trace_seq_init(&iter->seq);
d716ff71 4620 iter->trace = tr->current_trace;
d7350c3f 4621
4462344e 4622 if (!alloc_cpumask_var(&iter->started, GFP_KERNEL)) {
b04cc6b1 4623 ret = -ENOMEM;
d7350c3f 4624 goto fail;
4462344e
RR
4625 }
4626
a309720c 4627 /* trace pipe does not show start of buffer */
4462344e 4628 cpumask_setall(iter->started);
a309720c 4629
983f938a 4630 if (tr->trace_flags & TRACE_ITER_LATENCY_FMT)
112f38a7
SR
4631 iter->iter_flags |= TRACE_FILE_LAT_FMT;
4632
8be0709f 4633 /* Output in nanoseconds only if we are using a clock in nanoseconds. */
58e8eedf 4634 if (trace_clocks[tr->clock_id].in_ns)
8be0709f
DS
4635 iter->iter_flags |= TRACE_FILE_TIME_IN_NS;
4636
15544209
ON
4637 iter->tr = tr;
4638 iter->trace_buffer = &tr->trace_buffer;
4639 iter->cpu_file = tracing_get_cpu(inode);
d7350c3f 4640 mutex_init(&iter->mutex);
b3806b43
SR
4641 filp->private_data = iter;
4642
107bad8b
SR
4643 if (iter->trace->pipe_open)
4644 iter->trace->pipe_open(iter);
107bad8b 4645
b444786f 4646 nonseekable_open(inode, filp);
cf6ab6d9
SRRH
4647
4648 tr->current_trace->ref++;
b04cc6b1
FW
4649out:
4650 mutex_unlock(&trace_types_lock);
4651 return ret;
d7350c3f
FW
4652
4653fail:
4654 /* iter->trace points at tr->current_trace; it is not ours to free */
4655 kfree(iter);
7b85af63 4656 __trace_array_put(tr);
d7350c3f
FW
4657 mutex_unlock(&trace_types_lock);
4658 return ret;
b3806b43
SR
4659}
4660
4661static int tracing_release_pipe(struct inode *inode, struct file *file)
4662{
4663 struct trace_iterator *iter = file->private_data;
15544209 4664 struct trace_array *tr = inode->i_private;
b3806b43 4665
b04cc6b1
FW
4666 mutex_lock(&trace_types_lock);
4667
cf6ab6d9
SRRH
4668 tr->current_trace->ref--;
4669
29bf4a5e 4670 if (iter->trace->pipe_close)
c521efd1
SR
4671 iter->trace->pipe_close(iter);
4672
b04cc6b1
FW
4673 mutex_unlock(&trace_types_lock);
4674
4462344e 4675 free_cpumask_var(iter->started);
d7350c3f 4676 mutex_destroy(&iter->mutex);
b3806b43 4677 kfree(iter);
b3806b43 4678
7b85af63
SRRH
4679 trace_array_put(tr);
4680
b3806b43
SR
4681 return 0;
4682}
4683
2a2cc8f7 4684static unsigned int
cc60cdc9 4685trace_poll(struct trace_iterator *iter, struct file *filp, poll_table *poll_table)
2a2cc8f7 4686{
983f938a
SRRH
4687 struct trace_array *tr = iter->tr;
4688
15693458
SRRH
4689 /* Iterators are static, they should be filled or empty */
4690 if (trace_buffer_iter(iter, iter->cpu_file))
4691 return POLLIN | POLLRDNORM;
2a2cc8f7 4692
983f938a 4693 if (tr->trace_flags & TRACE_ITER_BLOCK)
2a2cc8f7
SSP
4694 /*
4695 * Always select as readable when in blocking mode
4696 */
4697 return POLLIN | POLLRDNORM;
15693458 4698 else
12883efb 4699 return ring_buffer_poll_wait(iter->trace_buffer->buffer, iter->cpu_file,
15693458 4700 filp, poll_table);
2a2cc8f7 4701}
2a2cc8f7 4702
cc60cdc9
SR
4703static unsigned int
4704tracing_poll_pipe(struct file *filp, poll_table *poll_table)
4705{
4706 struct trace_iterator *iter = filp->private_data;
4707
4708 return trace_poll(iter, filp, poll_table);
2a2cc8f7
SSP
4709}
4710
d716ff71 4711/* Must be called with iter->mutex held. */
ff98781b 4712static int tracing_wait_pipe(struct file *filp)
b3806b43
SR
4713{
4714 struct trace_iterator *iter = filp->private_data;
8b8b3683 4715 int ret;
b3806b43 4716
b3806b43 4717 while (trace_empty(iter)) {
2dc8f095 4718
107bad8b 4719 if ((filp->f_flags & O_NONBLOCK)) {
ff98781b 4720 return -EAGAIN;
107bad8b 4721 }
2dc8f095 4722
b3806b43 4723 /*
250bfd3d 4724 * We block until we read something, unless tracing gets disabled
b3806b43
SR
4725 * after we have already read something. We still block if tracing
4726 * is disabled but we have never read anything: this allows a user
4727 * to cat this file and then enable tracing. Once we have read
4728 * something, we give an EOF when tracing is disabled again.
4729 *
4730 * iter->pos will be 0 if we haven't read anything.
4731 */
10246fa3 4732 if (!tracing_is_on() && iter->pos)
b3806b43 4733 break;
f4874261
SRRH
4734
4735 mutex_unlock(&iter->mutex);
4736
e30f53aa 4737 ret = wait_on_pipe(iter, false);
f4874261
SRRH
4738
4739 mutex_lock(&iter->mutex);
4740
8b8b3683
SRRH
4741 if (ret)
4742 return ret;
b3806b43
SR
4743 }
4744
ff98781b
EGM
4745 return 1;
4746}
4747
4748/*
4749 * Consumer reader.
4750 */
4751static ssize_t
4752tracing_read_pipe(struct file *filp, char __user *ubuf,
4753 size_t cnt, loff_t *ppos)
4754{
4755 struct trace_iterator *iter = filp->private_data;
4756 ssize_t sret;
4757
4758 /* return any leftover data */
4759 sret = trace_seq_to_user(&iter->seq, ubuf, cnt);
4760 if (sret != -EBUSY)
4761 return sret;
4762
f9520750 4763 trace_seq_init(&iter->seq);
ff98781b 4764
d7350c3f
FW
4765 /*
4766 * Avoid more than one consumer on a single file descriptor
4767 * This is just a matter of traces coherency, the ring buffer itself
4768 * is protected.
4769 */
4770 mutex_lock(&iter->mutex);
ff98781b
EGM
4771 if (iter->trace->read) {
4772 sret = iter->trace->read(iter, filp, ubuf, cnt, ppos);
4773 if (sret)
4774 goto out;
4775 }
4776
4777waitagain:
4778 sret = tracing_wait_pipe(filp);
4779 if (sret <= 0)
4780 goto out;
4781
b3806b43 4782 /* stop when tracing is finished */
ff98781b
EGM
4783 if (trace_empty(iter)) {
4784 sret = 0;
107bad8b 4785 goto out;
ff98781b 4786 }
b3806b43
SR
4787
4788 if (cnt >= PAGE_SIZE)
4789 cnt = PAGE_SIZE - 1;
4790
53d0aa77 4791 /* reset all but tr, trace, and overruns */
53d0aa77
SR
4792 memset(&iter->seq, 0,
4793 sizeof(struct trace_iterator) -
4794 offsetof(struct trace_iterator, seq));
ed5467da 4795 cpumask_clear(iter->started);
4823ed7e 4796 iter->pos = -1;
b3806b43 4797
4f535968 4798 trace_event_read_lock();
7e53bd42 4799 trace_access_lock(iter->cpu_file);
955b61e5 4800 while (trace_find_next_entry_inc(iter) != NULL) {
2c4f035f 4801 enum print_line_t ret;
5ac48378 4802 int save_len = iter->seq.seq.len;
088b1e42 4803
f9896bf3 4804 ret = print_trace_line(iter);
2c4f035f 4805 if (ret == TRACE_TYPE_PARTIAL_LINE) {
088b1e42 4806 /* don't print partial lines */
5ac48378 4807 iter->seq.seq.len = save_len;
b3806b43 4808 break;
088b1e42 4809 }
b91facc3
FW
4810 if (ret != TRACE_TYPE_NO_CONSUME)
4811 trace_consume(iter);
b3806b43 4812
5ac48378 4813 if (trace_seq_used(&iter->seq) >= cnt)
b3806b43 4814 break;
ee5e51f5
JO
4815
4816 /*
4817 * Setting the full flag means we reached the trace_seq buffer
4818 * size and we should leave by partial output condition above.
4819 * One of the trace_seq_* functions is not used properly.
4820 */
4821 WARN_ONCE(iter->seq.full, "full flag set for trace type %d",
4822 iter->ent->type);
b3806b43 4823 }
7e53bd42 4824 trace_access_unlock(iter->cpu_file);
4f535968 4825 trace_event_read_unlock();
b3806b43 4826
b3806b43 4827 /* Now copy what we have to the user */
6c6c2796 4828 sret = trace_seq_to_user(&iter->seq, ubuf, cnt);
5ac48378 4829 if (iter->seq.seq.readpos >= trace_seq_used(&iter->seq))
f9520750 4830 trace_seq_init(&iter->seq);
9ff4b974
PP
4831
4832 /*
25985edc 4833 * If there was nothing to send to user, in spite of consuming trace
9ff4b974
PP
4834 * entries, go back to wait for more entries.
4835 */
6c6c2796 4836 if (sret == -EBUSY)
9ff4b974 4837 goto waitagain;
b3806b43 4838
107bad8b 4839out:
d7350c3f 4840 mutex_unlock(&iter->mutex);
107bad8b 4841
6c6c2796 4842 return sret;
b3806b43
SR
4843}
4844
3c56819b
EGM
4845static void tracing_spd_release_pipe(struct splice_pipe_desc *spd,
4846 unsigned int idx)
4847{
4848 __free_page(spd->pages[idx]);
4849}
4850
28dfef8f 4851static const struct pipe_buf_operations tracing_pipe_buf_ops = {
34cd4998 4852 .can_merge = 0,
34cd4998 4853 .confirm = generic_pipe_buf_confirm,
92fdd98c 4854 .release = generic_pipe_buf_release,
34cd4998
SR
4855 .steal = generic_pipe_buf_steal,
4856 .get = generic_pipe_buf_get,
3c56819b
EGM
4857};
4858
34cd4998 4859static size_t
fa7c7f6e 4860tracing_fill_pipe_page(size_t rem, struct trace_iterator *iter)
34cd4998
SR
4861{
4862 size_t count;
74f06bb7 4863 int save_len;
34cd4998
SR
4864 int ret;
4865
4866 /* Seq buffer is page-sized, exactly what we need. */
4867 for (;;) {
74f06bb7 4868 save_len = iter->seq.seq.len;
34cd4998 4869 ret = print_trace_line(iter);
74f06bb7
SRRH
4870
4871 if (trace_seq_has_overflowed(&iter->seq)) {
4872 iter->seq.seq.len = save_len;
34cd4998
SR
4873 break;
4874 }
74f06bb7
SRRH
4875
4876 /*
4877 * This should not be hit, because it should only
4878 * be set if the iter->seq overflowed. But check it
4879 * anyway to be safe.
4880 */
34cd4998 4881 if (ret == TRACE_TYPE_PARTIAL_LINE) {
74f06bb7
SRRH
4882 iter->seq.seq.len = save_len;
4883 break;
4884 }
4885
5ac48378 4886 count = trace_seq_used(&iter->seq) - save_len;
74f06bb7
SRRH
4887 if (rem < count) {
4888 rem = 0;
4889 iter->seq.seq.len = save_len;
34cd4998
SR
4890 break;
4891 }
4892
74e7ff8c
LJ
4893 if (ret != TRACE_TYPE_NO_CONSUME)
4894 trace_consume(iter);
34cd4998 4895 rem -= count;
955b61e5 4896 if (!trace_find_next_entry_inc(iter)) {
34cd4998
SR
4897 rem = 0;
4898 iter->ent = NULL;
4899 break;
4900 }
4901 }
4902
4903 return rem;
4904}
4905
3c56819b
EGM
4906static ssize_t tracing_splice_read_pipe(struct file *filp,
4907 loff_t *ppos,
4908 struct pipe_inode_info *pipe,
4909 size_t len,
4910 unsigned int flags)
4911{
35f3d14d
JA
4912 struct page *pages_def[PIPE_DEF_BUFFERS];
4913 struct partial_page partial_def[PIPE_DEF_BUFFERS];
3c56819b
EGM
4914 struct trace_iterator *iter = filp->private_data;
4915 struct splice_pipe_desc spd = {
35f3d14d
JA
4916 .pages = pages_def,
4917 .partial = partial_def,
34cd4998 4918 .nr_pages = 0, /* This gets updated below. */
047fe360 4919 .nr_pages_max = PIPE_DEF_BUFFERS,
34cd4998
SR
4920 .flags = flags,
4921 .ops = &tracing_pipe_buf_ops,
4922 .spd_release = tracing_spd_release_pipe,
3c56819b
EGM
4923 };
4924 ssize_t ret;
34cd4998 4925 size_t rem;
3c56819b
EGM
4926 unsigned int i;
4927
35f3d14d
JA
4928 if (splice_grow_spd(pipe, &spd))
4929 return -ENOMEM;
4930
d7350c3f 4931 mutex_lock(&iter->mutex);
3c56819b
EGM
4932
4933 if (iter->trace->splice_read) {
4934 ret = iter->trace->splice_read(iter, filp,
4935 ppos, pipe, len, flags);
4936 if (ret)
34cd4998 4937 goto out_err;
3c56819b
EGM
4938 }
4939
4940 ret = tracing_wait_pipe(filp);
4941 if (ret <= 0)
34cd4998 4942 goto out_err;
3c56819b 4943
955b61e5 4944 if (!iter->ent && !trace_find_next_entry_inc(iter)) {
3c56819b 4945 ret = -EFAULT;
34cd4998 4946 goto out_err;
3c56819b
EGM
4947 }
4948
4f535968 4949 trace_event_read_lock();
7e53bd42 4950 trace_access_lock(iter->cpu_file);
4f535968 4951
3c56819b 4952 /* Fill as many pages as possible. */
a786c06d 4953 for (i = 0, rem = len; i < spd.nr_pages_max && rem; i++) {
35f3d14d
JA
4954 spd.pages[i] = alloc_page(GFP_KERNEL);
4955 if (!spd.pages[i])
34cd4998 4956 break;
3c56819b 4957
fa7c7f6e 4958 rem = tracing_fill_pipe_page(rem, iter);
3c56819b
EGM
4959
4960 /* Copy the data into the page, so we can start over. */
4961 ret = trace_seq_to_buffer(&iter->seq,
35f3d14d 4962 page_address(spd.pages[i]),
5ac48378 4963 trace_seq_used(&iter->seq));
3c56819b 4964 if (ret < 0) {
35f3d14d 4965 __free_page(spd.pages[i]);
3c56819b
EGM
4966 break;
4967 }
35f3d14d 4968 spd.partial[i].offset = 0;
5ac48378 4969 spd.partial[i].len = trace_seq_used(&iter->seq);
3c56819b 4970
f9520750 4971 trace_seq_init(&iter->seq);
3c56819b
EGM
4972 }
4973
7e53bd42 4974 trace_access_unlock(iter->cpu_file);
4f535968 4975 trace_event_read_unlock();
d7350c3f 4976 mutex_unlock(&iter->mutex);
3c56819b
EGM
4977
4978 spd.nr_pages = i;
4979
a29054d9
SRRH
4980 if (i)
4981 ret = splice_to_pipe(pipe, &spd);
4982 else
4983 ret = 0;
35f3d14d 4984out:
047fe360 4985 splice_shrink_spd(&spd);
35f3d14d 4986 return ret;
3c56819b 4987
34cd4998 4988out_err:
d7350c3f 4989 mutex_unlock(&iter->mutex);
35f3d14d 4990 goto out;
3c56819b
EGM
4991}
4992
a98a3c3f
SR
4993static ssize_t
4994tracing_entries_read(struct file *filp, char __user *ubuf,
4995 size_t cnt, loff_t *ppos)
4996{
0bc392ee
ON
4997 struct inode *inode = file_inode(filp);
4998 struct trace_array *tr = inode->i_private;
4999 int cpu = tracing_get_cpu(inode);
438ced17
VN
5000 char buf[64];
5001 int r = 0;
5002 ssize_t ret;
a98a3c3f 5003
db526ca3 5004 mutex_lock(&trace_types_lock);
438ced17 5005
0bc392ee 5006 if (cpu == RING_BUFFER_ALL_CPUS) {
438ced17
VN
5007 int cpu, buf_size_same;
5008 unsigned long size;
5009
5010 size = 0;
5011 buf_size_same = 1;
5012 /* check if all cpu sizes are same */
5013 for_each_tracing_cpu(cpu) {
5014 /* fill in the size from first enabled cpu */
5015 if (size == 0)
12883efb
SRRH
5016 size = per_cpu_ptr(tr->trace_buffer.data, cpu)->entries;
5017 if (size != per_cpu_ptr(tr->trace_buffer.data, cpu)->entries) {
438ced17
VN
5018 buf_size_same = 0;
5019 break;
5020 }
5021 }
5022
5023 if (buf_size_same) {
5024 if (!ring_buffer_expanded)
5025 r = sprintf(buf, "%lu (expanded: %lu)\n",
5026 size >> 10,
5027 trace_buf_size >> 10);
5028 else
5029 r = sprintf(buf, "%lu\n", size >> 10);
5030 } else
5031 r = sprintf(buf, "X\n");
5032 } else
0bc392ee 5033 r = sprintf(buf, "%lu\n", per_cpu_ptr(tr->trace_buffer.data, cpu)->entries >> 10);
438ced17 5034
db526ca3
SR
5035 mutex_unlock(&trace_types_lock);
5036
438ced17
VN
5037 ret = simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
5038 return ret;
a98a3c3f
SR
5039}
5040
5041static ssize_t
5042tracing_entries_write(struct file *filp, const char __user *ubuf,
5043 size_t cnt, loff_t *ppos)
5044{
0bc392ee
ON
5045 struct inode *inode = file_inode(filp);
5046 struct trace_array *tr = inode->i_private;
a98a3c3f 5047 unsigned long val;
4f271a2a 5048 int ret;
a98a3c3f 5049
22fe9b54
PH
5050 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
5051 if (ret)
c6caeeb1 5052 return ret;
a98a3c3f
SR
5053
5054 /* must have at least 1 entry */
5055 if (!val)
5056 return -EINVAL;
5057
1696b2b0
SR
5058 /* value is in KB */
5059 val <<= 10;
0bc392ee 5060 ret = tracing_resize_ring_buffer(tr, val, tracing_get_cpu(inode));
4f271a2a
VN
5061 if (ret < 0)
5062 return ret;
a98a3c3f 5063
cf8517cf 5064 *ppos += cnt;
a98a3c3f 5065
4f271a2a
VN
5066 return cnt;
5067}
bf5e6519 5068
f81ab074
VN
5069static ssize_t
5070tracing_total_entries_read(struct file *filp, char __user *ubuf,
5071 size_t cnt, loff_t *ppos)
5072{
5073 struct trace_array *tr = filp->private_data;
5074 char buf[64];
5075 int r, cpu;
5076 unsigned long size = 0, expanded_size = 0;
5077
5078 mutex_lock(&trace_types_lock);
5079 for_each_tracing_cpu(cpu) {
12883efb 5080 size += per_cpu_ptr(tr->trace_buffer.data, cpu)->entries >> 10;
f81ab074
VN
5081 if (!ring_buffer_expanded)
5082 expanded_size += trace_buf_size >> 10;
5083 }
5084 if (ring_buffer_expanded)
5085 r = sprintf(buf, "%lu\n", size);
5086 else
5087 r = sprintf(buf, "%lu (expanded: %lu)\n", size, expanded_size);
5088 mutex_unlock(&trace_types_lock);
5089
5090 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
5091}
5092
4f271a2a
VN
5093static ssize_t
5094tracing_free_buffer_write(struct file *filp, const char __user *ubuf,
5095 size_t cnt, loff_t *ppos)
5096{
5097 /*
5098 * There is no need to read what the user has written; this function
5099 * just makes sure that there is no error when "echo" is used.
5100 */
5101
5102 *ppos += cnt;
a98a3c3f
SR
5103
5104 return cnt;
5105}
5106
4f271a2a
VN
5107static int
5108tracing_free_buffer_release(struct inode *inode, struct file *filp)
5109{
2b6080f2
SR
5110 struct trace_array *tr = inode->i_private;
5111
cf30cf67 5112 /* disable tracing? */
983f938a 5113 if (tr->trace_flags & TRACE_ITER_STOP_ON_FREE)
711e1243 5114 tracer_tracing_off(tr);
4f271a2a 5115 /* resize the ring buffer to 0 */
2b6080f2 5116 tracing_resize_ring_buffer(tr, 0, RING_BUFFER_ALL_CPUS);
4f271a2a 5117
7b85af63
SRRH
5118 trace_array_put(tr);
5119
4f271a2a
VN
5120 return 0;
5121}
5122
5bf9a1ee
PP
5123static ssize_t
5124tracing_mark_write(struct file *filp, const char __user *ubuf,
5125 size_t cnt, loff_t *fpos)
5126{
d696b58c 5127 unsigned long addr = (unsigned long)ubuf;
2d71619c 5128 struct trace_array *tr = filp->private_data;
d696b58c
SR
5129 struct ring_buffer_event *event;
5130 struct ring_buffer *buffer;
5131 struct print_entry *entry;
5132 unsigned long irq_flags;
5133 struct page *pages[2];
6edb2a8a 5134 void *map_page[2];
d696b58c
SR
5135 int nr_pages = 1;
5136 ssize_t written;
d696b58c
SR
5137 int offset;
5138 int size;
5139 int len;
5140 int ret;
6edb2a8a 5141 int i;
5bf9a1ee 5142
c76f0694 5143 if (tracing_disabled)
5bf9a1ee
PP
5144 return -EINVAL;
5145
983f938a 5146 if (!(tr->trace_flags & TRACE_ITER_MARKERS))
5224c3a3
MSB
5147 return -EINVAL;
5148
5bf9a1ee
PP
5149 if (cnt > TRACE_BUF_SIZE)
5150 cnt = TRACE_BUF_SIZE;
5151
d696b58c
SR
5152 /*
5153 * Userspace is injecting traces into the kernel trace buffer.
5154 * We want to be as non-intrusive as possible.
5155 * To do so, we do not want to allocate any special buffers
5156 * or take any locks, but instead write the userspace data
5157 * straight into the ring buffer.
5158 *
5159 * First we need to pin the userspace buffer into memory,
5160 * which it most likely already is, because userspace just referenced it.
5161 * But there's no guarantee that it is. By using get_user_pages_fast()
5162 * and kmap_atomic/kunmap_atomic() we can get access to the
5163 * pages directly. We then write the data directly into the
5164 * ring buffer.
5165 */
5166 BUILD_BUG_ON(TRACE_BUF_SIZE >= PAGE_SIZE);
5bf9a1ee 5167
d696b58c
SR
5168 /* check if we cross pages */
5169 if ((addr & PAGE_MASK) != ((addr + cnt) & PAGE_MASK))
5170 nr_pages = 2;
5171
5172 offset = addr & (PAGE_SIZE - 1);
5173 addr &= PAGE_MASK;
5174
5175 ret = get_user_pages_fast(addr, nr_pages, 0, pages);
5176 if (ret < nr_pages) {
5177 while (--ret >= 0)
5178 put_page(pages[ret]);
5179 written = -EFAULT;
5180 goto out;
5bf9a1ee 5181 }
d696b58c 5182
6edb2a8a
SR
5183 for (i = 0; i < nr_pages; i++)
5184 map_page[i] = kmap_atomic(pages[i]);
d696b58c
SR
5185
5186 local_save_flags(irq_flags);
5187 size = sizeof(*entry) + cnt + 2; /* possible \n added */
2d71619c 5188 buffer = tr->trace_buffer.buffer;
d696b58c
SR
5189 event = trace_buffer_lock_reserve(buffer, TRACE_PRINT, size,
5190 irq_flags, preempt_count());
5191 if (!event) {
5192 /* Ring buffer disabled, return as if not open for write */
5193 written = -EBADF;
5194 goto out_unlock;
5bf9a1ee 5195 }
d696b58c
SR
5196
5197 entry = ring_buffer_event_data(event);
5198 entry->ip = _THIS_IP_;
5199
5200 if (nr_pages == 2) {
5201 len = PAGE_SIZE - offset;
6edb2a8a
SR
5202 memcpy(&entry->buf, map_page[0] + offset, len);
5203 memcpy(&entry->buf[len], map_page[1], cnt - len);
c13d2f7c 5204 } else
6edb2a8a 5205 memcpy(&entry->buf, map_page[0] + offset, cnt);
5bf9a1ee 5206
d696b58c
SR
5207 if (entry->buf[cnt - 1] != '\n') {
5208 entry->buf[cnt] = '\n';
5209 entry->buf[cnt + 1] = '\0';
5210 } else
5211 entry->buf[cnt] = '\0';
5212
7ffbd48d 5213 __buffer_unlock_commit(buffer, event);
5bf9a1ee 5214
d696b58c 5215 written = cnt;
5bf9a1ee 5216
d696b58c 5217 *fpos += written;
1aa54bca 5218
d696b58c 5219 out_unlock:
7215853e 5220 for (i = nr_pages - 1; i >= 0; i--) {
6edb2a8a
SR
5221 kunmap_atomic(map_page[i]);
5222 put_page(pages[i]);
5223 }
d696b58c 5224 out:
1aa54bca 5225 return written;
5bf9a1ee
PP
5226}
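/*
 * A minimal sketch of the userspace side of trace_marker, assuming
 * debugfs is mounted at /sys/kernel/debug:
 *
 *	int fd = open("/sys/kernel/debug/tracing/trace_marker", O_WRONLY);
 *	if (fd >= 0) {
 *		write(fd, "hello from userspace\n", 21);
 *		close(fd);
 *	}
 *
 * The message lands in the ring buffer as a TRACE_PRINT entry via the
 * page-pinning path above.
 */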
5227
13f16d20 5228static int tracing_clock_show(struct seq_file *m, void *v)
5079f326 5229{
2b6080f2 5230 struct trace_array *tr = m->private;
5079f326
Z
5231 int i;
5232
5233 for (i = 0; i < ARRAY_SIZE(trace_clocks); i++)
13f16d20 5234 seq_printf(m,
5079f326 5235 "%s%s%s%s", i ? " " : "",
2b6080f2
SR
5236 i == tr->clock_id ? "[" : "", trace_clocks[i].name,
5237 i == tr->clock_id ? "]" : "");
13f16d20 5238 seq_putc(m, '\n');
5079f326 5239
13f16d20 5240 return 0;
5079f326
Z
5241}
5242
e1e232ca 5243static int tracing_set_clock(struct trace_array *tr, const char *clockstr)
5079f326 5244{
5079f326
Z
5245 int i;
5246
5079f326
Z
5247 for (i = 0; i < ARRAY_SIZE(trace_clocks); i++) {
5248 if (strcmp(trace_clocks[i].name, clockstr) == 0)
5249 break;
5250 }
5251 if (i == ARRAY_SIZE(trace_clocks))
5252 return -EINVAL;
5253
5079f326
Z
5254 mutex_lock(&trace_types_lock);
5255
2b6080f2
SR
5256 tr->clock_id = i;
5257
12883efb 5258 ring_buffer_set_clock(tr->trace_buffer.buffer, trace_clocks[i].func);
5079f326 5259
60303ed3
DS
5260 /*
5261 * New clock may not be consistent with the previous clock.
5262 * Reset the buffer so that it doesn't have incomparable timestamps.
5263 */
9457158b 5264 tracing_reset_online_cpus(&tr->trace_buffer);
12883efb
SRRH
5265
5266#ifdef CONFIG_TRACER_MAX_TRACE
5267 if (tr->flags & TRACE_ARRAY_FL_GLOBAL && tr->max_buffer.buffer)
5268 ring_buffer_set_clock(tr->max_buffer.buffer, trace_clocks[i].func);
9457158b 5269 tracing_reset_online_cpus(&tr->max_buffer);
12883efb 5270#endif
60303ed3 5271
5079f326
Z
5272 mutex_unlock(&trace_types_lock);
5273
e1e232ca
SR
5274 return 0;
5275}
5276
5277static ssize_t tracing_clock_write(struct file *filp, const char __user *ubuf,
5278 size_t cnt, loff_t *fpos)
5279{
5280 struct seq_file *m = filp->private_data;
5281 struct trace_array *tr = m->private;
5282 char buf[64];
5283 const char *clockstr;
5284 int ret;
5285
5286 if (cnt >= sizeof(buf))
5287 return -EINVAL;
5288
5289 if (copy_from_user(&buf, ubuf, cnt))
5290 return -EFAULT;
5291
5292 buf[cnt] = 0;
5293
5294 clockstr = strstrip(buf);
5295
5296 ret = tracing_set_clock(tr, clockstr);
5297 if (ret)
5298 return ret;
5299
5079f326
Z
5300 *fpos += cnt;
5301
5302 return cnt;
5303}
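/*
 * A minimal usage sketch: switch to the cross-CPU ordered clock listed
 * by tracing_clock_show() above:
 *
 *	# echo global > trace_clock
 *
 * Note that tracing_set_clock() resets the buffers on every switch, so
 * existing trace data is lost.
 */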
5304
13f16d20
LZ
5305static int tracing_clock_open(struct inode *inode, struct file *file)
5306{
7b85af63
SRRH
5307 struct trace_array *tr = inode->i_private;
5308 int ret;
5309
13f16d20
LZ
5310 if (tracing_disabled)
5311 return -ENODEV;
2b6080f2 5312
7b85af63
SRRH
5313 if (trace_array_get(tr))
5314 return -ENODEV;
5315
5316 ret = single_open(file, tracing_clock_show, inode->i_private);
5317 if (ret < 0)
5318 trace_array_put(tr);
5319
5320 return ret;
13f16d20
LZ
5321}
5322
6de58e62
SRRH
5323struct ftrace_buffer_info {
5324 struct trace_iterator iter;
5325 void *spare;
5326 unsigned int read;
5327};
5328
debdd57f
HT
5329#ifdef CONFIG_TRACER_SNAPSHOT
5330static int tracing_snapshot_open(struct inode *inode, struct file *file)
5331{
6484c71c 5332 struct trace_array *tr = inode->i_private;
debdd57f 5333 struct trace_iterator *iter;
2b6080f2 5334 struct seq_file *m;
debdd57f
HT
5335 int ret = 0;
5336
ff451961
SRRH
5337 if (trace_array_get(tr) < 0)
5338 return -ENODEV;
5339
debdd57f 5340 if (file->f_mode & FMODE_READ) {
6484c71c 5341 iter = __tracing_open(inode, file, true);
debdd57f
HT
5342 if (IS_ERR(iter))
5343 ret = PTR_ERR(iter);
2b6080f2
SR
5344 } else {
5345 /* Writes still need the seq_file to hold the private data */
f77d09a3 5346 ret = -ENOMEM;
2b6080f2
SR
5347 m = kzalloc(sizeof(*m), GFP_KERNEL);
5348 if (!m)
f77d09a3 5349 goto out;
2b6080f2
SR
5350 iter = kzalloc(sizeof(*iter), GFP_KERNEL);
5351 if (!iter) {
5352 kfree(m);
f77d09a3 5353 goto out;
2b6080f2 5354 }
f77d09a3
AL
5355 ret = 0;
5356
ff451961 5357 iter->tr = tr;
6484c71c
ON
5358 iter->trace_buffer = &tr->max_buffer;
5359 iter->cpu_file = tracing_get_cpu(inode);
2b6080f2
SR
5360 m->private = iter;
5361 file->private_data = m;
debdd57f 5362 }
f77d09a3 5363out:
ff451961
SRRH
5364 if (ret < 0)
5365 trace_array_put(tr);
5366
debdd57f
HT
5367 return ret;
5368}
5369
5370static ssize_t
5371tracing_snapshot_write(struct file *filp, const char __user *ubuf, size_t cnt,
5372 loff_t *ppos)
5373{
2b6080f2
SR
5374 struct seq_file *m = filp->private_data;
5375 struct trace_iterator *iter = m->private;
5376 struct trace_array *tr = iter->tr;
debdd57f
HT
5377 unsigned long val;
5378 int ret;
5379
5380 ret = tracing_update_buffers();
5381 if (ret < 0)
5382 return ret;
5383
5384 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
5385 if (ret)
5386 return ret;
5387
5388 mutex_lock(&trace_types_lock);
5389
2b6080f2 5390 if (tr->current_trace->use_max_tr) {
debdd57f
HT
5391 ret = -EBUSY;
5392 goto out;
5393 }
5394
5395 switch (val) {
5396 case 0:
f1affcaa
SRRH
5397 if (iter->cpu_file != RING_BUFFER_ALL_CPUS) {
5398 ret = -EINVAL;
5399 break;
debdd57f 5400 }
3209cff4
SRRH
5401 if (tr->allocated_snapshot)
5402 free_snapshot(tr);
debdd57f
HT
5403 break;
5404 case 1:
f1affcaa
SRRH
5405/* Only allow per-cpu swap if the ring buffer supports it */
5406#ifndef CONFIG_RING_BUFFER_ALLOW_SWAP
5407 if (iter->cpu_file != RING_BUFFER_ALL_CPUS) {
5408 ret = -EINVAL;
5409 break;
5410 }
5411#endif
45ad21ca 5412 if (!tr->allocated_snapshot) {
3209cff4 5413 ret = alloc_snapshot(tr);
debdd57f
HT
5414 if (ret < 0)
5415 break;
debdd57f 5416 }
debdd57f
HT
5417 local_irq_disable();
5418 /* Now, we're going to swap */
f1affcaa 5419 if (iter->cpu_file == RING_BUFFER_ALL_CPUS)
ce9bae55 5420 update_max_tr(tr, current, smp_processor_id());
f1affcaa 5421 else
ce9bae55 5422 update_max_tr_single(tr, current, iter->cpu_file);
debdd57f
HT
5423 local_irq_enable();
5424 break;
5425 default:
45ad21ca 5426 if (tr->allocated_snapshot) {
f1affcaa
SRRH
5427 if (iter->cpu_file == RING_BUFFER_ALL_CPUS)
5428 tracing_reset_online_cpus(&tr->max_buffer);
5429 else
5430 tracing_reset(&tr->max_buffer, iter->cpu_file);
5431 }
debdd57f
HT
5432 break;
5433 }
5434
5435 if (ret >= 0) {
5436 *ppos += cnt;
5437 ret = cnt;
5438 }
5439out:
5440 mutex_unlock(&trace_types_lock);
5441 return ret;
5442}
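A hedged usage sketch of the value semantics implemented above: writing "1" allocates the snapshot if needed and swaps the buffers, "0" frees it, and any other value clears it. The tracefs path is an assumption.

#include <fcntl.h>
#include <stdio.h>
#include <unistd.h>

static int snapshot_ctl(const char *val)
{
	int fd = open("/sys/kernel/debug/tracing/snapshot", O_WRONLY);
	int ret;

	if (fd < 0)
		return -1;
	ret = write(fd, val, 1) == 1 ? 0 : -1;
	close(fd);
	return ret;
}

int main(void)
{
	if (snapshot_ctl("1"))		/* allocate (if needed) and swap */
		perror("snapshot");
	/* ... read the snapshot file to inspect the frozen trace ... */
	snapshot_ctl("0");		/* free the snapshot buffer again */
	return 0;
}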
2b6080f2
SR
5443
5444static int tracing_snapshot_release(struct inode *inode, struct file *file)
5445{
5446 struct seq_file *m = file->private_data;
ff451961
SRRH
5447 int ret;
5448
5449 ret = tracing_release(inode, file);
2b6080f2
SR
5450
5451 if (file->f_mode & FMODE_READ)
ff451961 5452 return ret;
2b6080f2
SR
5453
5454 /* If write only, the seq_file is just a stub */
5455 if (m)
5456 kfree(m->private);
5457 kfree(m);
5458
5459 return 0;
5460}
5461
6de58e62
SRRH
5462static int tracing_buffers_open(struct inode *inode, struct file *filp);
5463static ssize_t tracing_buffers_read(struct file *filp, char __user *ubuf,
5464 size_t count, loff_t *ppos);
5465static int tracing_buffers_release(struct inode *inode, struct file *file);
5466static ssize_t tracing_buffers_splice_read(struct file *file, loff_t *ppos,
5467 struct pipe_inode_info *pipe, size_t len, unsigned int flags);
5468
5469static int snapshot_raw_open(struct inode *inode, struct file *filp)
5470{
5471 struct ftrace_buffer_info *info;
5472 int ret;
5473
5474 ret = tracing_buffers_open(inode, filp);
5475 if (ret < 0)
5476 return ret;
5477
5478 info = filp->private_data;
5479
5480 if (info->iter.trace->use_max_tr) {
5481 tracing_buffers_release(inode, filp);
5482 return -EBUSY;
5483 }
5484
5485 info->iter.snapshot = true;
5486 info->iter.trace_buffer = &info->iter.tr->max_buffer;
5487
5488 return ret;
5489}
5490
debdd57f
HT
5491#endif /* CONFIG_TRACER_SNAPSHOT */
5492
5493
6508fa76
SF
5494static const struct file_operations tracing_thresh_fops = {
5495 .open = tracing_open_generic,
5496 .read = tracing_thresh_read,
5497 .write = tracing_thresh_write,
5498 .llseek = generic_file_llseek,
5499};
5500
e428abbb 5501#ifdef CONFIG_TRACER_MAX_TRACE
5e2336a0 5502static const struct file_operations tracing_max_lat_fops = {
4bf39a94
IM
5503 .open = tracing_open_generic,
5504 .read = tracing_max_lat_read,
5505 .write = tracing_max_lat_write,
b444786f 5506 .llseek = generic_file_llseek,
bc0c38d1 5507};
e428abbb 5508#endif
bc0c38d1 5509
5e2336a0 5510static const struct file_operations set_tracer_fops = {
4bf39a94
IM
5511 .open = tracing_open_generic,
5512 .read = tracing_set_trace_read,
5513 .write = tracing_set_trace_write,
b444786f 5514 .llseek = generic_file_llseek,
bc0c38d1
SR
5515};
5516
5e2336a0 5517static const struct file_operations tracing_pipe_fops = {
4bf39a94 5518 .open = tracing_open_pipe,
2a2cc8f7 5519 .poll = tracing_poll_pipe,
4bf39a94 5520 .read = tracing_read_pipe,
3c56819b 5521 .splice_read = tracing_splice_read_pipe,
4bf39a94 5522 .release = tracing_release_pipe,
b444786f 5523 .llseek = no_llseek,
b3806b43
SR
5524};
5525
5e2336a0 5526static const struct file_operations tracing_entries_fops = {
0bc392ee 5527 .open = tracing_open_generic_tr,
a98a3c3f
SR
5528 .read = tracing_entries_read,
5529 .write = tracing_entries_write,
b444786f 5530 .llseek = generic_file_llseek,
0bc392ee 5531 .release = tracing_release_generic_tr,
a98a3c3f
SR
5532};
5533
f81ab074 5534static const struct file_operations tracing_total_entries_fops = {
7b85af63 5535 .open = tracing_open_generic_tr,
f81ab074
VN
5536 .read = tracing_total_entries_read,
5537 .llseek = generic_file_llseek,
7b85af63 5538 .release = tracing_release_generic_tr,
f81ab074
VN
5539};
5540
4f271a2a 5541static const struct file_operations tracing_free_buffer_fops = {
7b85af63 5542 .open = tracing_open_generic_tr,
4f271a2a
VN
5543 .write = tracing_free_buffer_write,
5544 .release = tracing_free_buffer_release,
5545};
5546
5e2336a0 5547static const struct file_operations tracing_mark_fops = {
7b85af63 5548 .open = tracing_open_generic_tr,
5bf9a1ee 5549 .write = tracing_mark_write,
b444786f 5550 .llseek = generic_file_llseek,
7b85af63 5551 .release = tracing_release_generic_tr,
5bf9a1ee
PP
5552};
5553
5079f326 5554static const struct file_operations trace_clock_fops = {
13f16d20
LZ
5555 .open = tracing_clock_open,
5556 .read = seq_read,
5557 .llseek = seq_lseek,
7b85af63 5558 .release = tracing_single_release_tr,
5079f326
Z
5559 .write = tracing_clock_write,
5560};
5561
debdd57f
HT
5562#ifdef CONFIG_TRACER_SNAPSHOT
5563static const struct file_operations snapshot_fops = {
5564 .open = tracing_snapshot_open,
5565 .read = seq_read,
5566 .write = tracing_snapshot_write,
098c879e 5567 .llseek = tracing_lseek,
2b6080f2 5568 .release = tracing_snapshot_release,
debdd57f 5569};
debdd57f 5570
6de58e62
SRRH
5571static const struct file_operations snapshot_raw_fops = {
5572 .open = snapshot_raw_open,
5573 .read = tracing_buffers_read,
5574 .release = tracing_buffers_release,
5575 .splice_read = tracing_buffers_splice_read,
5576 .llseek = no_llseek,
2cadf913
SR
5577};
5578
6de58e62
SRRH
5579#endif /* CONFIG_TRACER_SNAPSHOT */
5580
2cadf913
SR
5581static int tracing_buffers_open(struct inode *inode, struct file *filp)
5582{
46ef2be0 5583 struct trace_array *tr = inode->i_private;
2cadf913 5584 struct ftrace_buffer_info *info;
7b85af63 5585 int ret;
2cadf913
SR
5586
5587 if (tracing_disabled)
5588 return -ENODEV;
5589
7b85af63
SRRH
5590 if (trace_array_get(tr) < 0)
5591 return -ENODEV;
5592
2cadf913 5593 info = kzalloc(sizeof(*info), GFP_KERNEL);
7b85af63
SRRH
5594 if (!info) {
5595 trace_array_put(tr);
2cadf913 5596 return -ENOMEM;
7b85af63 5597 }
2cadf913 5598
a695cb58
SRRH
5599 mutex_lock(&trace_types_lock);
5600
cc60cdc9 5601 info->iter.tr = tr;
46ef2be0 5602 info->iter.cpu_file = tracing_get_cpu(inode);
b627344f 5603 info->iter.trace = tr->current_trace;
12883efb 5604 info->iter.trace_buffer = &tr->trace_buffer;
cc60cdc9 5605 info->spare = NULL;
2cadf913 5606 /* Force reading ring buffer for first read */
cc60cdc9 5607 info->read = (unsigned int)-1;
2cadf913
SR
5608
5609 filp->private_data = info;
5610
cf6ab6d9
SRRH
5611 tr->current_trace->ref++;
5612
a695cb58
SRRH
5613 mutex_unlock(&trace_types_lock);
5614
7b85af63
SRRH
5615 ret = nonseekable_open(inode, filp);
5616 if (ret < 0)
5617 trace_array_put(tr);
5618
5619 return ret;
2cadf913
SR
5620}
5621
cc60cdc9
SR
5622static unsigned int
5623tracing_buffers_poll(struct file *filp, poll_table *poll_table)
5624{
5625 struct ftrace_buffer_info *info = filp->private_data;
5626 struct trace_iterator *iter = &info->iter;
5627
5628 return trace_poll(iter, filp, poll_table);
5629}
5630
2cadf913
SR
5631static ssize_t
5632tracing_buffers_read(struct file *filp, char __user *ubuf,
5633 size_t count, loff_t *ppos)
5634{
5635 struct ftrace_buffer_info *info = filp->private_data;
cc60cdc9 5636 struct trace_iterator *iter = &info->iter;
2cadf913 5637 ssize_t ret;
6de58e62 5638 ssize_t size;
2cadf913 5639
2dc5d12b
SR
5640 if (!count)
5641 return 0;
5642
6de58e62 5643#ifdef CONFIG_TRACER_MAX_TRACE
d716ff71
SRRH
5644 if (iter->snapshot && iter->tr->current_trace->use_max_tr)
5645 return -EBUSY;
6de58e62
SRRH
5646#endif
5647
ddd538f3 5648 if (!info->spare)
12883efb
SRRH
5649 info->spare = ring_buffer_alloc_read_page(iter->trace_buffer->buffer,
5650 iter->cpu_file);
ddd538f3 5651 if (!info->spare)
d716ff71 5652 return -ENOMEM;
ddd538f3 5653
2cadf913
SR
5654 /* Do we have previous read data to read? */
5655 if (info->read < PAGE_SIZE)
5656 goto read;
5657
b627344f 5658 again:
cc60cdc9 5659 trace_access_lock(iter->cpu_file);
12883efb 5660 ret = ring_buffer_read_page(iter->trace_buffer->buffer,
2cadf913
SR
5661 &info->spare,
5662 count,
cc60cdc9
SR
5663 iter->cpu_file, 0);
5664 trace_access_unlock(iter->cpu_file);
2cadf913 5665
b627344f
SR
5666 if (ret < 0) {
5667 if (trace_empty(iter)) {
d716ff71
SRRH
5668 if ((filp->f_flags & O_NONBLOCK))
5669 return -EAGAIN;
5670
e30f53aa 5671 ret = wait_on_pipe(iter, false);
d716ff71
SRRH
5672 if (ret)
5673 return ret;
5674
b627344f
SR
5675 goto again;
5676 }
d716ff71 5677 return 0;
b627344f 5678 }
436fc280 5679
436fc280 5680 info->read = 0;
b627344f 5681 read:
2cadf913
SR
5682 size = PAGE_SIZE - info->read;
5683 if (size > count)
5684 size = count;
5685
5686 ret = copy_to_user(ubuf, info->spare + info->read, size);
d716ff71
SRRH
5687 if (ret == size)
5688 return -EFAULT;
5689
2dc5d12b
SR
5690 size -= ret;
5691
2cadf913
SR
5692 *ppos += size;
5693 info->read += size;
5694
5695 return size;
5696}
5697
5698static int tracing_buffers_release(struct inode *inode, struct file *file)
5699{
5700 struct ftrace_buffer_info *info = file->private_data;
cc60cdc9 5701 struct trace_iterator *iter = &info->iter;
2cadf913 5702
a695cb58
SRRH
5703 mutex_lock(&trace_types_lock);
5704
cf6ab6d9
SRRH
5705 iter->tr->current_trace->ref--;
5706
ff451961 5707 __trace_array_put(iter->tr);
2cadf913 5708
ddd538f3 5709 if (info->spare)
12883efb 5710 ring_buffer_free_read_page(iter->trace_buffer->buffer, info->spare);
2cadf913
SR
5711 kfree(info);
5712
a695cb58
SRRH
5713 mutex_unlock(&trace_types_lock);
5714
2cadf913
SR
5715 return 0;
5716}
5717
5718struct buffer_ref {
5719 struct ring_buffer *buffer;
5720 void *page;
5721 int ref;
5722};
5723
5724static void buffer_pipe_buf_release(struct pipe_inode_info *pipe,
5725 struct pipe_buffer *buf)
5726{
5727 struct buffer_ref *ref = (struct buffer_ref *)buf->private;
5728
5729 if (--ref->ref)
5730 return;
5731
5732 ring_buffer_free_read_page(ref->buffer, ref->page);
5733 kfree(ref);
5734 buf->private = 0;
5735}
5736
2cadf913
SR
5737static void buffer_pipe_buf_get(struct pipe_inode_info *pipe,
5738 struct pipe_buffer *buf)
5739{
5740 struct buffer_ref *ref = (struct buffer_ref *)buf->private;
5741
5742 ref->ref++;
5743}
5744
5745/* Pipe buffer operations for a buffer. */
28dfef8f 5746static const struct pipe_buf_operations buffer_pipe_buf_ops = {
2cadf913 5747 .can_merge = 0,
2cadf913
SR
5748 .confirm = generic_pipe_buf_confirm,
5749 .release = buffer_pipe_buf_release,
d55cb6cf 5750 .steal = generic_pipe_buf_steal,
2cadf913
SR
5751 .get = buffer_pipe_buf_get,
5752};
5753
5754/*
5755 * Callback from splice_to_pipe(), if we need to release some pages
 5756 * at the end of the spd in case we errored out in filling the pipe.
5757 */
5758static void buffer_spd_release(struct splice_pipe_desc *spd, unsigned int i)
5759{
5760 struct buffer_ref *ref =
5761 (struct buffer_ref *)spd->partial[i].private;
5762
5763 if (--ref->ref)
5764 return;
5765
5766 ring_buffer_free_read_page(ref->buffer, ref->page);
5767 kfree(ref);
5768 spd->partial[i].private = 0;
5769}
5770
5771static ssize_t
5772tracing_buffers_splice_read(struct file *file, loff_t *ppos,
5773 struct pipe_inode_info *pipe, size_t len,
5774 unsigned int flags)
5775{
5776 struct ftrace_buffer_info *info = file->private_data;
cc60cdc9 5777 struct trace_iterator *iter = &info->iter;
35f3d14d
JA
5778 struct partial_page partial_def[PIPE_DEF_BUFFERS];
5779 struct page *pages_def[PIPE_DEF_BUFFERS];
2cadf913 5780 struct splice_pipe_desc spd = {
35f3d14d
JA
5781 .pages = pages_def,
5782 .partial = partial_def,
047fe360 5783 .nr_pages_max = PIPE_DEF_BUFFERS,
2cadf913
SR
5784 .flags = flags,
5785 .ops = &buffer_pipe_buf_ops,
5786 .spd_release = buffer_spd_release,
5787 };
5788 struct buffer_ref *ref;
93459c6c 5789 int entries, size, i;
07906da7 5790 ssize_t ret = 0;
2cadf913 5791
6de58e62 5792#ifdef CONFIG_TRACER_MAX_TRACE
d716ff71
SRRH
5793 if (iter->snapshot && iter->tr->current_trace->use_max_tr)
5794 return -EBUSY;
6de58e62
SRRH
5795#endif
5796
d716ff71
SRRH
5797 if (splice_grow_spd(pipe, &spd))
5798 return -ENOMEM;
35f3d14d 5799
d716ff71
SRRH
5800 if (*ppos & (PAGE_SIZE - 1))
5801 return -EINVAL;
93cfb3c9
LJ
5802
5803 if (len & (PAGE_SIZE - 1)) {
d716ff71
SRRH
5804 if (len < PAGE_SIZE)
5805 return -EINVAL;
93cfb3c9
LJ
5806 len &= PAGE_MASK;
5807 }
5808
cc60cdc9
SR
5809 again:
5810 trace_access_lock(iter->cpu_file);
12883efb 5811 entries = ring_buffer_entries_cpu(iter->trace_buffer->buffer, iter->cpu_file);
93459c6c 5812
a786c06d 5813 for (i = 0; i < spd.nr_pages_max && len && entries; i++, len -= PAGE_SIZE) {
2cadf913
SR
5814 struct page *page;
5815 int r;
5816
5817 ref = kzalloc(sizeof(*ref), GFP_KERNEL);
07906da7
RV
5818 if (!ref) {
5819 ret = -ENOMEM;
2cadf913 5820 break;
07906da7 5821 }
2cadf913 5822
7267fa68 5823 ref->ref = 1;
12883efb 5824 ref->buffer = iter->trace_buffer->buffer;
cc60cdc9 5825 ref->page = ring_buffer_alloc_read_page(ref->buffer, iter->cpu_file);
2cadf913 5826 if (!ref->page) {
07906da7 5827 ret = -ENOMEM;
2cadf913
SR
5828 kfree(ref);
5829 break;
5830 }
5831
5832 r = ring_buffer_read_page(ref->buffer, &ref->page,
cc60cdc9 5833 len, iter->cpu_file, 1);
2cadf913 5834 if (r < 0) {
7ea59064 5835 ring_buffer_free_read_page(ref->buffer, ref->page);
2cadf913
SR
5836 kfree(ref);
5837 break;
5838 }
5839
5840 /*
 5841 * Zero out any leftover data; this is going to
 5842 * user land.
5843 */
5844 size = ring_buffer_page_len(ref->page);
5845 if (size < PAGE_SIZE)
5846 memset(ref->page + size, 0, PAGE_SIZE - size);
5847
5848 page = virt_to_page(ref->page);
5849
5850 spd.pages[i] = page;
5851 spd.partial[i].len = PAGE_SIZE;
5852 spd.partial[i].offset = 0;
5853 spd.partial[i].private = (unsigned long)ref;
5854 spd.nr_pages++;
93cfb3c9 5855 *ppos += PAGE_SIZE;
93459c6c 5856
12883efb 5857 entries = ring_buffer_entries_cpu(iter->trace_buffer->buffer, iter->cpu_file);
2cadf913
SR
5858 }
5859
cc60cdc9 5860 trace_access_unlock(iter->cpu_file);
2cadf913
SR
5861 spd.nr_pages = i;
5862
5863 /* did we read anything? */
5864 if (!spd.nr_pages) {
07906da7 5865 if (ret)
d716ff71
SRRH
5866 return ret;
5867
5868 if ((file->f_flags & O_NONBLOCK) || (flags & SPLICE_F_NONBLOCK))
5869 return -EAGAIN;
07906da7 5870
e30f53aa 5871 ret = wait_on_pipe(iter, true);
8b8b3683 5872 if (ret)
d716ff71 5873 return ret;
e30f53aa 5874
cc60cdc9 5875 goto again;
2cadf913
SR
5876 }
5877
5878 ret = splice_to_pipe(pipe, &spd);
047fe360 5879 splice_shrink_spd(&spd);
6de58e62 5880
2cadf913
SR
5881 return ret;
5882}
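A hedged user-space sketch of consuming binary pages through the splice path above: splice from a per-cpu trace_pipe_raw file into a pipe, then from the pipe into an output file, one page at a time. The paths and the 4096-byte page size are assumptions.

#define _GNU_SOURCE
#include <fcntl.h>
#include <stdio.h>
#include <unistd.h>

int main(void)
{
	int pfd[2];
	int in = open("/sys/kernel/debug/tracing/per_cpu/cpu0/trace_pipe_raw",
		      O_RDONLY);
	int out = open("trace.dat", O_WRONLY | O_CREAT | O_TRUNC, 0644);
	ssize_t n;

	if (in < 0 || out < 0 || pipe(pfd) < 0) {
		perror("setup");
		return 1;
	}
	/* len must be page aligned; see the PAGE_SIZE checks above. */
	while ((n = splice(in, NULL, pfd[1], NULL, 4096,
			   SPLICE_F_NONBLOCK)) > 0)
		splice(pfd[0], NULL, out, NULL, n, 0);
	return 0;
}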
5883
5884static const struct file_operations tracing_buffers_fops = {
5885 .open = tracing_buffers_open,
5886 .read = tracing_buffers_read,
cc60cdc9 5887 .poll = tracing_buffers_poll,
2cadf913
SR
5888 .release = tracing_buffers_release,
5889 .splice_read = tracing_buffers_splice_read,
5890 .llseek = no_llseek,
5891};
5892
c8d77183
SR
5893static ssize_t
5894tracing_stats_read(struct file *filp, char __user *ubuf,
5895 size_t count, loff_t *ppos)
5896{
4d3435b8
ON
5897 struct inode *inode = file_inode(filp);
5898 struct trace_array *tr = inode->i_private;
12883efb 5899 struct trace_buffer *trace_buf = &tr->trace_buffer;
4d3435b8 5900 int cpu = tracing_get_cpu(inode);
c8d77183
SR
5901 struct trace_seq *s;
5902 unsigned long cnt;
c64e148a
VN
5903 unsigned long long t;
5904 unsigned long usec_rem;
c8d77183 5905
e4f2d10f 5906 s = kmalloc(sizeof(*s), GFP_KERNEL);
c8d77183 5907 if (!s)
a646365c 5908 return -ENOMEM;
c8d77183
SR
5909
5910 trace_seq_init(s);
5911
12883efb 5912 cnt = ring_buffer_entries_cpu(trace_buf->buffer, cpu);
c8d77183
SR
5913 trace_seq_printf(s, "entries: %ld\n", cnt);
5914
12883efb 5915 cnt = ring_buffer_overrun_cpu(trace_buf->buffer, cpu);
c8d77183
SR
5916 trace_seq_printf(s, "overrun: %ld\n", cnt);
5917
12883efb 5918 cnt = ring_buffer_commit_overrun_cpu(trace_buf->buffer, cpu);
c8d77183
SR
5919 trace_seq_printf(s, "commit overrun: %ld\n", cnt);
5920
12883efb 5921 cnt = ring_buffer_bytes_cpu(trace_buf->buffer, cpu);
c64e148a
VN
5922 trace_seq_printf(s, "bytes: %ld\n", cnt);
5923
58e8eedf 5924 if (trace_clocks[tr->clock_id].in_ns) {
11043d8b 5925 /* local or global for trace_clock */
12883efb 5926 t = ns2usecs(ring_buffer_oldest_event_ts(trace_buf->buffer, cpu));
11043d8b
YY
5927 usec_rem = do_div(t, USEC_PER_SEC);
5928 trace_seq_printf(s, "oldest event ts: %5llu.%06lu\n",
5929 t, usec_rem);
5930
12883efb 5931 t = ns2usecs(ring_buffer_time_stamp(trace_buf->buffer, cpu));
11043d8b
YY
5932 usec_rem = do_div(t, USEC_PER_SEC);
5933 trace_seq_printf(s, "now ts: %5llu.%06lu\n", t, usec_rem);
5934 } else {
5935 /* counter or tsc mode for trace_clock */
5936 trace_seq_printf(s, "oldest event ts: %llu\n",
12883efb 5937 ring_buffer_oldest_event_ts(trace_buf->buffer, cpu));
c64e148a 5938
11043d8b 5939 trace_seq_printf(s, "now ts: %llu\n",
12883efb 5940 ring_buffer_time_stamp(trace_buf->buffer, cpu));
11043d8b 5941 }
c64e148a 5942
12883efb 5943 cnt = ring_buffer_dropped_events_cpu(trace_buf->buffer, cpu);
884bfe89
SP
5944 trace_seq_printf(s, "dropped events: %ld\n", cnt);
5945
12883efb 5946 cnt = ring_buffer_read_events_cpu(trace_buf->buffer, cpu);
ad964704
SRRH
5947 trace_seq_printf(s, "read events: %ld\n", cnt);
5948
5ac48378
SRRH
5949 count = simple_read_from_buffer(ubuf, count, ppos,
5950 s->buffer, trace_seq_used(s));
c8d77183
SR
5951
5952 kfree(s);
5953
5954 return count;
5955}
5956
5957static const struct file_operations tracing_stats_fops = {
4d3435b8 5958 .open = tracing_open_generic_tr,
c8d77183 5959 .read = tracing_stats_read,
b444786f 5960 .llseek = generic_file_llseek,
4d3435b8 5961 .release = tracing_release_generic_tr,
c8d77183
SR
5962};
5963
bc0c38d1
SR
5964#ifdef CONFIG_DYNAMIC_FTRACE
5965
b807c3d0
SR
5966int __weak ftrace_arch_read_dyn_info(char *buf, int size)
5967{
5968 return 0;
5969}
5970
bc0c38d1 5971static ssize_t
b807c3d0 5972tracing_read_dyn_info(struct file *filp, char __user *ubuf,
bc0c38d1
SR
5973 size_t cnt, loff_t *ppos)
5974{
a26a2a27
SR
5975 static char ftrace_dyn_info_buffer[1024];
5976 static DEFINE_MUTEX(dyn_info_mutex);
bc0c38d1 5977 unsigned long *p = filp->private_data;
b807c3d0 5978 char *buf = ftrace_dyn_info_buffer;
a26a2a27 5979 int size = ARRAY_SIZE(ftrace_dyn_info_buffer);
bc0c38d1
SR
5980 int r;
5981
b807c3d0
SR
5982 mutex_lock(&dyn_info_mutex);
5983 r = sprintf(buf, "%ld ", *p);
4bf39a94 5984
a26a2a27 5985 r += ftrace_arch_read_dyn_info(buf+r, (size-1)-r);
b807c3d0
SR
5986 buf[r++] = '\n';
5987
5988 r = simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
5989
5990 mutex_unlock(&dyn_info_mutex);
5991
5992 return r;
bc0c38d1
SR
5993}
5994
5e2336a0 5995static const struct file_operations tracing_dyn_info_fops = {
4bf39a94 5996 .open = tracing_open_generic,
b807c3d0 5997 .read = tracing_read_dyn_info,
b444786f 5998 .llseek = generic_file_llseek,
bc0c38d1 5999};
77fd5c15 6000#endif /* CONFIG_DYNAMIC_FTRACE */
bc0c38d1 6001
77fd5c15
SRRH
6002#if defined(CONFIG_TRACER_SNAPSHOT) && defined(CONFIG_DYNAMIC_FTRACE)
6003static void
6004ftrace_snapshot(unsigned long ip, unsigned long parent_ip, void **data)
6005{
6006 tracing_snapshot();
6007}
bc0c38d1 6008
77fd5c15
SRRH
6009static void
6010ftrace_count_snapshot(unsigned long ip, unsigned long parent_ip, void **data)
bc0c38d1 6011{
77fd5c15
SRRH
 6012 unsigned long *count = (unsigned long *)data;
6013
6014 if (!*count)
6015 return;
bc0c38d1 6016
77fd5c15
SRRH
6017 if (*count != -1)
6018 (*count)--;
6019
6020 tracing_snapshot();
6021}
6022
6023static int
6024ftrace_snapshot_print(struct seq_file *m, unsigned long ip,
6025 struct ftrace_probe_ops *ops, void *data)
6026{
6027 long count = (long)data;
6028
6029 seq_printf(m, "%ps:", (void *)ip);
6030
fa6f0cc7 6031 seq_puts(m, "snapshot");
77fd5c15
SRRH
6032
6033 if (count == -1)
fa6f0cc7 6034 seq_puts(m, ":unlimited\n");
77fd5c15
SRRH
6035 else
6036 seq_printf(m, ":count=%ld\n", count);
6037
6038 return 0;
6039}
6040
6041static struct ftrace_probe_ops snapshot_probe_ops = {
6042 .func = ftrace_snapshot,
6043 .print = ftrace_snapshot_print,
6044};
6045
6046static struct ftrace_probe_ops snapshot_count_probe_ops = {
6047 .func = ftrace_count_snapshot,
6048 .print = ftrace_snapshot_print,
6049};
6050
6051static int
6052ftrace_trace_snapshot_callback(struct ftrace_hash *hash,
6053 char *glob, char *cmd, char *param, int enable)
6054{
6055 struct ftrace_probe_ops *ops;
6056 void *count = (void *)-1;
6057 char *number;
6058 int ret;
6059
6060 /* hash funcs only work with set_ftrace_filter */
6061 if (!enable)
6062 return -EINVAL;
6063
6064 ops = param ? &snapshot_count_probe_ops : &snapshot_probe_ops;
6065
6066 if (glob[0] == '!') {
6067 unregister_ftrace_function_probe_func(glob+1, ops);
6068 return 0;
6069 }
6070
6071 if (!param)
6072 goto out_reg;
6073
6074 number = strsep(&param, ":");
6075
6076 if (!strlen(number))
6077 goto out_reg;
6078
6079 /*
6080 * We use the callback data field (which is a pointer)
6081 * as our counter.
6082 */
6083 ret = kstrtoul(number, 0, (unsigned long *)&count);
6084 if (ret)
6085 return ret;
6086
6087 out_reg:
6088 ret = register_ftrace_function_probe(glob, ops, count);
6089
6090 if (ret >= 0)
6091 alloc_snapshot(&global_trace);
6092
6093 return ret < 0 ? ret : 0;
6094}
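For illustration, a sketch of arming the "snapshot" command that ftrace_trace_snapshot_callback() parses; the tracefs path and kfree as the traced function are assumptions. Writing the same string prefixed with '!' unregisters the probe.

#include <fcntl.h>
#include <stdio.h>
#include <string.h>
#include <unistd.h>

int main(void)
{
	static const char cmd[] = "kfree:snapshot:5"; /* snapshot on first 5 hits */
	int fd = open("/sys/kernel/debug/tracing/set_ftrace_filter", O_WRONLY);

	if (fd < 0) {
		perror("open");
		return 1;
	}
	if (write(fd, cmd, strlen(cmd)) < 0)
		perror("write");
	close(fd);
	return 0;
}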
6095
6096static struct ftrace_func_command ftrace_snapshot_cmd = {
6097 .name = "snapshot",
6098 .func = ftrace_trace_snapshot_callback,
6099};
6100
38de93ab 6101static __init int register_snapshot_cmd(void)
77fd5c15
SRRH
6102{
6103 return register_ftrace_command(&ftrace_snapshot_cmd);
6104}
6105#else
38de93ab 6106static inline __init int register_snapshot_cmd(void) { return 0; }
77fd5c15 6107#endif /* defined(CONFIG_TRACER_SNAPSHOT) && defined(CONFIG_DYNAMIC_FTRACE) */
bc0c38d1 6108
7eeafbca 6109static struct dentry *tracing_get_dentry(struct trace_array *tr)
bc0c38d1 6110{
8434dc93
SRRH
6111 if (WARN_ON(!tr->dir))
6112 return ERR_PTR(-ENODEV);
6113
6114 /* Top directory uses NULL as the parent */
6115 if (tr->flags & TRACE_ARRAY_FL_GLOBAL)
6116 return NULL;
6117
6118 /* All sub buffers have a descriptor */
2b6080f2 6119 return tr->dir;
bc0c38d1
SR
6120}
6121
2b6080f2 6122static struct dentry *tracing_dentry_percpu(struct trace_array *tr, int cpu)
b04cc6b1 6123{
b04cc6b1
FW
6124 struct dentry *d_tracer;
6125
2b6080f2
SR
6126 if (tr->percpu_dir)
6127 return tr->percpu_dir;
b04cc6b1 6128
7eeafbca 6129 d_tracer = tracing_get_dentry(tr);
14a5ae40 6130 if (IS_ERR(d_tracer))
b04cc6b1
FW
6131 return NULL;
6132
8434dc93 6133 tr->percpu_dir = tracefs_create_dir("per_cpu", d_tracer);
b04cc6b1 6134
2b6080f2 6135 WARN_ONCE(!tr->percpu_dir,
8434dc93 6136 "Could not create tracefs directory 'per_cpu/%d'\n", cpu);
b04cc6b1 6137
2b6080f2 6138 return tr->percpu_dir;
b04cc6b1
FW
6139}
6140
649e9c70
ON
6141static struct dentry *
6142trace_create_cpu_file(const char *name, umode_t mode, struct dentry *parent,
6143 void *data, long cpu, const struct file_operations *fops)
6144{
6145 struct dentry *ret = trace_create_file(name, mode, parent, data, fops);
6146
6147 if (ret) /* See tracing_get_cpu() */
7682c918 6148 d_inode(ret)->i_cdev = (void *)(cpu + 1);
649e9c70
ON
6149 return ret;
6150}
6151
2b6080f2 6152static void
8434dc93 6153tracing_init_tracefs_percpu(struct trace_array *tr, long cpu)
b04cc6b1 6154{
2b6080f2 6155 struct dentry *d_percpu = tracing_dentry_percpu(tr, cpu);
5452af66 6156 struct dentry *d_cpu;
dd49a38c 6157 char cpu_dir[30]; /* 30 characters should be more than enough */
b04cc6b1 6158
0a3d7ce7
NK
6159 if (!d_percpu)
6160 return;
6161
dd49a38c 6162 snprintf(cpu_dir, 30, "cpu%ld", cpu);
8434dc93 6163 d_cpu = tracefs_create_dir(cpu_dir, d_percpu);
8656e7a2 6164 if (!d_cpu) {
a395d6a7 6165 pr_warn("Could not create tracefs '%s' entry\n", cpu_dir);
8656e7a2
FW
6166 return;
6167 }
b04cc6b1 6168
8656e7a2 6169 /* per cpu trace_pipe */
649e9c70 6170 trace_create_cpu_file("trace_pipe", 0444, d_cpu,
15544209 6171 tr, cpu, &tracing_pipe_fops);
b04cc6b1
FW
6172
6173 /* per cpu trace */
649e9c70 6174 trace_create_cpu_file("trace", 0644, d_cpu,
6484c71c 6175 tr, cpu, &tracing_fops);
7f96f93f 6176
649e9c70 6177 trace_create_cpu_file("trace_pipe_raw", 0444, d_cpu,
46ef2be0 6178 tr, cpu, &tracing_buffers_fops);
7f96f93f 6179
649e9c70 6180 trace_create_cpu_file("stats", 0444, d_cpu,
4d3435b8 6181 tr, cpu, &tracing_stats_fops);
438ced17 6182
649e9c70 6183 trace_create_cpu_file("buffer_size_kb", 0444, d_cpu,
0bc392ee 6184 tr, cpu, &tracing_entries_fops);
f1affcaa
SRRH
6185
6186#ifdef CONFIG_TRACER_SNAPSHOT
649e9c70 6187 trace_create_cpu_file("snapshot", 0644, d_cpu,
6484c71c 6188 tr, cpu, &snapshot_fops);
6de58e62 6189
649e9c70 6190 trace_create_cpu_file("snapshot_raw", 0444, d_cpu,
46ef2be0 6191 tr, cpu, &snapshot_raw_fops);
f1affcaa 6192#endif
b04cc6b1
FW
6193}
6194
60a11774
SR
6195#ifdef CONFIG_FTRACE_SELFTEST
6196/* Let selftest have access to static functions in this file */
6197#include "trace_selftest.c"
6198#endif
6199
577b785f
SR
6200static ssize_t
6201trace_options_read(struct file *filp, char __user *ubuf, size_t cnt,
6202 loff_t *ppos)
6203{
6204 struct trace_option_dentry *topt = filp->private_data;
6205 char *buf;
6206
6207 if (topt->flags->val & topt->opt->bit)
6208 buf = "1\n";
6209 else
6210 buf = "0\n";
6211
6212 return simple_read_from_buffer(ubuf, cnt, ppos, buf, 2);
6213}
6214
6215static ssize_t
6216trace_options_write(struct file *filp, const char __user *ubuf, size_t cnt,
6217 loff_t *ppos)
6218{
6219 struct trace_option_dentry *topt = filp->private_data;
6220 unsigned long val;
577b785f
SR
6221 int ret;
6222
22fe9b54
PH
6223 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
6224 if (ret)
577b785f
SR
6225 return ret;
6226
8d18eaaf
LZ
6227 if (val != 0 && val != 1)
6228 return -EINVAL;
577b785f 6229
8d18eaaf 6230 if (!!(topt->flags->val & topt->opt->bit) != val) {
577b785f 6231 mutex_lock(&trace_types_lock);
8c1a49ae 6232 ret = __set_tracer_option(topt->tr, topt->flags,
c757bea9 6233 topt->opt, !val);
577b785f
SR
6234 mutex_unlock(&trace_types_lock);
6235 if (ret)
6236 return ret;
577b785f
SR
6237 }
6238
6239 *ppos += cnt;
6240
6241 return cnt;
6242}
6243
6244
6245static const struct file_operations trace_options_fops = {
6246 .open = tracing_open_generic,
6247 .read = trace_options_read,
6248 .write = trace_options_write,
b444786f 6249 .llseek = generic_file_llseek,
577b785f
SR
6250};
6251
9a38a885
SRRH
6252/*
 6253 * In order to pass in both the trace_array descriptor and the index
6254 * to the flag that the trace option file represents, the trace_array
6255 * has a character array of trace_flags_index[], which holds the index
6256 * of the bit for the flag it represents. index[0] == 0, index[1] == 1, etc.
6257 * The address of this character array is passed to the flag option file
6258 * read/write callbacks.
6259 *
6260 * In order to extract both the index and the trace_array descriptor,
6261 * get_tr_index() uses the following algorithm.
6262 *
6263 * idx = *ptr;
6264 *
 6265 * Since each entry's value equals its own offset (remember
 6266 * index[1] == 1), the dereferenced value is also the flag index.
 6267 *
 6268 * Then, to get the trace_array descriptor, subtracting that index
 6269 * from ptr takes us back to the start of the index array.
6270 *
6271 * ptr - idx == &index[0]
6272 *
6273 * Then a simple container_of() from that pointer gets us to the
6274 * trace_array descriptor.
6275 */
6276static void get_tr_index(void *data, struct trace_array **ptr,
6277 unsigned int *pindex)
6278{
6279 *pindex = *(unsigned char *)data;
6280
6281 *ptr = container_of(data - *pindex, struct trace_array,
6282 trace_flags_index);
6283}
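A stand-alone demonstration of the pointer trick described above, with a toy struct in place of trace_array and container_of() expanded by hand so it compiles in user space (a sketch, not kernel code):

#include <stddef.h>
#include <stdio.h>

struct toy_array {
	int		flags;
	unsigned char	flags_index[8];
};

int main(void)
{
	struct toy_array ta;
	struct toy_array *tr;
	unsigned int idx, i;
	void *data;

	for (i = 0; i < 8; i++)
		ta.flags_index[i] = i;		/* index[i] == i */

	data = &ta.flags_index[3];		/* what the option file carries */

	idx = *(unsigned char *)data;		/* recover the flag index: 3 */
	/* back to &flags_index[0], then to the containing struct */
	tr = (struct toy_array *)((char *)data - idx -
				  offsetof(struct toy_array, flags_index));

	printf("idx=%u, recovered tr: %s\n", idx, tr == &ta ? "ok" : "bad");
	return 0;
}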
6284
a8259075
SR
6285static ssize_t
6286trace_options_core_read(struct file *filp, char __user *ubuf, size_t cnt,
6287 loff_t *ppos)
6288{
9a38a885
SRRH
6289 void *tr_index = filp->private_data;
6290 struct trace_array *tr;
6291 unsigned int index;
a8259075
SR
6292 char *buf;
6293
9a38a885
SRRH
6294 get_tr_index(tr_index, &tr, &index);
6295
6296 if (tr->trace_flags & (1 << index))
a8259075
SR
6297 buf = "1\n";
6298 else
6299 buf = "0\n";
6300
6301 return simple_read_from_buffer(ubuf, cnt, ppos, buf, 2);
6302}
6303
6304static ssize_t
6305trace_options_core_write(struct file *filp, const char __user *ubuf, size_t cnt,
6306 loff_t *ppos)
6307{
9a38a885
SRRH
6308 void *tr_index = filp->private_data;
6309 struct trace_array *tr;
6310 unsigned int index;
a8259075
SR
6311 unsigned long val;
6312 int ret;
6313
9a38a885
SRRH
6314 get_tr_index(tr_index, &tr, &index);
6315
22fe9b54
PH
6316 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
6317 if (ret)
a8259075
SR
6318 return ret;
6319
f2d84b65 6320 if (val != 0 && val != 1)
a8259075 6321 return -EINVAL;
69d34da2
SRRH
6322
6323 mutex_lock(&trace_types_lock);
2b6080f2 6324 ret = set_tracer_flag(tr, 1 << index, val);
69d34da2 6325 mutex_unlock(&trace_types_lock);
a8259075 6326
613f04a0
SRRH
6327 if (ret < 0)
6328 return ret;
6329
a8259075
SR
6330 *ppos += cnt;
6331
6332 return cnt;
6333}
6334
a8259075
SR
6335static const struct file_operations trace_options_core_fops = {
6336 .open = tracing_open_generic,
6337 .read = trace_options_core_read,
6338 .write = trace_options_core_write,
b444786f 6339 .llseek = generic_file_llseek,
a8259075
SR
6340};
6341
5452af66 6342struct dentry *trace_create_file(const char *name,
f4ae40a6 6343 umode_t mode,
5452af66
FW
6344 struct dentry *parent,
6345 void *data,
6346 const struct file_operations *fops)
6347{
6348 struct dentry *ret;
6349
8434dc93 6350 ret = tracefs_create_file(name, mode, parent, data, fops);
5452af66 6351 if (!ret)
a395d6a7 6352 pr_warn("Could not create tracefs '%s' entry\n", name);
5452af66
FW
6353
6354 return ret;
6355}
6356
6357
2b6080f2 6358static struct dentry *trace_options_init_dentry(struct trace_array *tr)
a8259075
SR
6359{
6360 struct dentry *d_tracer;
a8259075 6361
2b6080f2
SR
6362 if (tr->options)
6363 return tr->options;
a8259075 6364
7eeafbca 6365 d_tracer = tracing_get_dentry(tr);
14a5ae40 6366 if (IS_ERR(d_tracer))
a8259075
SR
6367 return NULL;
6368
8434dc93 6369 tr->options = tracefs_create_dir("options", d_tracer);
2b6080f2 6370 if (!tr->options) {
a395d6a7 6371 pr_warn("Could not create tracefs directory 'options'\n");
a8259075
SR
6372 return NULL;
6373 }
6374
2b6080f2 6375 return tr->options;
a8259075
SR
6376}
6377
577b785f 6378static void
2b6080f2
SR
6379create_trace_option_file(struct trace_array *tr,
6380 struct trace_option_dentry *topt,
577b785f
SR
6381 struct tracer_flags *flags,
6382 struct tracer_opt *opt)
6383{
6384 struct dentry *t_options;
577b785f 6385
2b6080f2 6386 t_options = trace_options_init_dentry(tr);
577b785f
SR
6387 if (!t_options)
6388 return;
6389
6390 topt->flags = flags;
6391 topt->opt = opt;
2b6080f2 6392 topt->tr = tr;
577b785f 6393
5452af66 6394 topt->entry = trace_create_file(opt->name, 0644, t_options, topt,
577b785f
SR
6395 &trace_options_fops);
6396
577b785f
SR
6397}
6398
37aea98b 6399static void
2b6080f2 6400create_trace_option_files(struct trace_array *tr, struct tracer *tracer)
577b785f
SR
6401{
6402 struct trace_option_dentry *topts;
37aea98b 6403 struct trace_options *tr_topts;
577b785f
SR
6404 struct tracer_flags *flags;
6405 struct tracer_opt *opts;
6406 int cnt;
37aea98b 6407 int i;
577b785f
SR
6408
6409 if (!tracer)
37aea98b 6410 return;
577b785f
SR
6411
6412 flags = tracer->flags;
6413
6414 if (!flags || !flags->opts)
37aea98b
SRRH
6415 return;
6416
6417 /*
6418 * If this is an instance, only create flags for tracers
6419 * the instance may have.
6420 */
6421 if (!trace_ok_for_array(tracer, tr))
6422 return;
6423
6424 for (i = 0; i < tr->nr_topts; i++) {
d39cdd20
CH
 6425 /* Make sure there are no duplicate flags. */
6426 if (WARN_ON_ONCE(tr->topts[i].tracer->flags == tracer->flags))
37aea98b
SRRH
6427 return;
6428 }
577b785f
SR
6429
6430 opts = flags->opts;
6431
6432 for (cnt = 0; opts[cnt].name; cnt++)
6433 ;
6434
0cfe8245 6435 topts = kcalloc(cnt + 1, sizeof(*topts), GFP_KERNEL);
577b785f 6436 if (!topts)
37aea98b
SRRH
6437 return;
6438
6439 tr_topts = krealloc(tr->topts, sizeof(*tr->topts) * (tr->nr_topts + 1),
6440 GFP_KERNEL);
6441 if (!tr_topts) {
6442 kfree(topts);
6443 return;
6444 }
6445
6446 tr->topts = tr_topts;
6447 tr->topts[tr->nr_topts].tracer = tracer;
6448 tr->topts[tr->nr_topts].topts = topts;
6449 tr->nr_topts++;
577b785f 6450
41d9c0be 6451 for (cnt = 0; opts[cnt].name; cnt++) {
2b6080f2 6452 create_trace_option_file(tr, &topts[cnt], flags,
577b785f 6453 &opts[cnt]);
41d9c0be
SRRH
6454 WARN_ONCE(topts[cnt].entry == NULL,
6455 "Failed to create trace option: %s",
6456 opts[cnt].name);
6457 }
577b785f
SR
6458}
6459
a8259075 6460static struct dentry *
2b6080f2
SR
6461create_trace_option_core_file(struct trace_array *tr,
6462 const char *option, long index)
a8259075
SR
6463{
6464 struct dentry *t_options;
a8259075 6465
2b6080f2 6466 t_options = trace_options_init_dentry(tr);
a8259075
SR
6467 if (!t_options)
6468 return NULL;
6469
9a38a885
SRRH
6470 return trace_create_file(option, 0644, t_options,
6471 (void *)&tr->trace_flags_index[index],
6472 &trace_options_core_fops);
a8259075
SR
6473}
6474
16270145 6475static void create_trace_options_dir(struct trace_array *tr)
a8259075
SR
6476{
6477 struct dentry *t_options;
16270145 6478 bool top_level = tr == &global_trace;
a8259075
SR
6479 int i;
6480
2b6080f2 6481 t_options = trace_options_init_dentry(tr);
a8259075
SR
6482 if (!t_options)
6483 return;
6484
16270145
SRRH
6485 for (i = 0; trace_options[i]; i++) {
6486 if (top_level ||
6487 !((1 << i) & TOP_LEVEL_TRACE_FLAGS))
6488 create_trace_option_core_file(tr, trace_options[i], i);
6489 }
a8259075
SR
6490}
6491
499e5470
SR
6492static ssize_t
6493rb_simple_read(struct file *filp, char __user *ubuf,
6494 size_t cnt, loff_t *ppos)
6495{
348f0fc2 6496 struct trace_array *tr = filp->private_data;
499e5470
SR
6497 char buf[64];
6498 int r;
6499
10246fa3 6500 r = tracer_tracing_is_on(tr);
499e5470
SR
6501 r = sprintf(buf, "%d\n", r);
6502
6503 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
6504}
6505
6506static ssize_t
6507rb_simple_write(struct file *filp, const char __user *ubuf,
6508 size_t cnt, loff_t *ppos)
6509{
348f0fc2 6510 struct trace_array *tr = filp->private_data;
12883efb 6511 struct ring_buffer *buffer = tr->trace_buffer.buffer;
499e5470
SR
6512 unsigned long val;
6513 int ret;
6514
6515 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
6516 if (ret)
6517 return ret;
6518
6519 if (buffer) {
2df8f8a6
SR
6520 mutex_lock(&trace_types_lock);
6521 if (val) {
10246fa3 6522 tracer_tracing_on(tr);
2b6080f2
SR
6523 if (tr->current_trace->start)
6524 tr->current_trace->start(tr);
2df8f8a6 6525 } else {
10246fa3 6526 tracer_tracing_off(tr);
2b6080f2
SR
6527 if (tr->current_trace->stop)
6528 tr->current_trace->stop(tr);
2df8f8a6
SR
6529 }
6530 mutex_unlock(&trace_types_lock);
499e5470
SR
6531 }
6532
6533 (*ppos)++;
6534
6535 return cnt;
6536}
6537
6538static const struct file_operations rb_simple_fops = {
7b85af63 6539 .open = tracing_open_generic_tr,
499e5470
SR
6540 .read = rb_simple_read,
6541 .write = rb_simple_write,
7b85af63 6542 .release = tracing_release_generic_tr,
499e5470
SR
6543 .llseek = default_llseek,
6544};
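A minimal sketch of toggling the ring buffer through the tracing_on file served by rb_simple_fops; the path is an assumption.

#include <fcntl.h>
#include <stdio.h>
#include <unistd.h>

int main(void)
{
	int fd = open("/sys/kernel/debug/tracing/tracing_on", O_RDWR);
	char c;

	if (fd < 0) {
		perror("open");
		return 1;
	}
	write(fd, "0", 1);	/* stop recording; tracer->stop() runs */
	pread(fd, &c, 1, 0);	/* rb_simple_read() now reports '0' */
	write(fd, "1", 1);	/* resume recording */
	close(fd);
	return 0;
}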
6545
277ba044
SR
6546struct dentry *trace_instance_dir;
6547
6548static void
8434dc93 6549init_tracer_tracefs(struct trace_array *tr, struct dentry *d_tracer);
277ba044 6550
55034cd6
SRRH
6551static int
6552allocate_trace_buffer(struct trace_array *tr, struct trace_buffer *buf, int size)
277ba044
SR
6553{
6554 enum ring_buffer_flags rb_flags;
737223fb 6555
983f938a 6556 rb_flags = tr->trace_flags & TRACE_ITER_OVERWRITE ? RB_FL_OVERWRITE : 0;
737223fb 6557
dced341b
SRRH
6558 buf->tr = tr;
6559
55034cd6
SRRH
6560 buf->buffer = ring_buffer_alloc(size, rb_flags);
6561 if (!buf->buffer)
6562 return -ENOMEM;
737223fb 6563
55034cd6
SRRH
6564 buf->data = alloc_percpu(struct trace_array_cpu);
6565 if (!buf->data) {
6566 ring_buffer_free(buf->buffer);
6567 return -ENOMEM;
6568 }
737223fb 6569
737223fb
SRRH
6570 /* Allocate the first page for all buffers */
6571 set_buffer_entries(&tr->trace_buffer,
6572 ring_buffer_size(tr->trace_buffer.buffer, 0));
6573
55034cd6
SRRH
6574 return 0;
6575}
737223fb 6576
55034cd6
SRRH
6577static int allocate_trace_buffers(struct trace_array *tr, int size)
6578{
6579 int ret;
737223fb 6580
55034cd6
SRRH
6581 ret = allocate_trace_buffer(tr, &tr->trace_buffer, size);
6582 if (ret)
6583 return ret;
737223fb 6584
55034cd6
SRRH
6585#ifdef CONFIG_TRACER_MAX_TRACE
6586 ret = allocate_trace_buffer(tr, &tr->max_buffer,
6587 allocate_snapshot ? size : 1);
6588 if (WARN_ON(ret)) {
737223fb 6589 ring_buffer_free(tr->trace_buffer.buffer);
55034cd6
SRRH
6590 free_percpu(tr->trace_buffer.data);
6591 return -ENOMEM;
6592 }
6593 tr->allocated_snapshot = allocate_snapshot;
737223fb 6594
55034cd6
SRRH
6595 /*
6596 * Only the top level trace array gets its snapshot allocated
6597 * from the kernel command line.
6598 */
6599 allocate_snapshot = false;
737223fb 6600#endif
55034cd6 6601 return 0;
737223fb
SRRH
6602}
6603
f0b70cc4
SRRH
6604static void free_trace_buffer(struct trace_buffer *buf)
6605{
6606 if (buf->buffer) {
6607 ring_buffer_free(buf->buffer);
6608 buf->buffer = NULL;
6609 free_percpu(buf->data);
6610 buf->data = NULL;
6611 }
6612}
6613
23aaa3c1
SRRH
6614static void free_trace_buffers(struct trace_array *tr)
6615{
6616 if (!tr)
6617 return;
6618
f0b70cc4 6619 free_trace_buffer(&tr->trace_buffer);
23aaa3c1
SRRH
6620
6621#ifdef CONFIG_TRACER_MAX_TRACE
f0b70cc4 6622 free_trace_buffer(&tr->max_buffer);
23aaa3c1
SRRH
6623#endif
6624}
6625
9a38a885
SRRH
6626static void init_trace_flags_index(struct trace_array *tr)
6627{
6628 int i;
6629
6630 /* Used by the trace options files */
6631 for (i = 0; i < TRACE_FLAGS_MAX_SIZE; i++)
6632 tr->trace_flags_index[i] = i;
6633}
6634
37aea98b
SRRH
6635static void __update_tracer_options(struct trace_array *tr)
6636{
6637 struct tracer *t;
6638
6639 for (t = trace_types; t; t = t->next)
6640 add_tracer_options(tr, t);
6641}
6642
6643static void update_tracer_options(struct trace_array *tr)
6644{
6645 mutex_lock(&trace_types_lock);
6646 __update_tracer_options(tr);
6647 mutex_unlock(&trace_types_lock);
6648}
6649
eae47358 6650static int instance_mkdir(const char *name)
737223fb 6651{
277ba044
SR
6652 struct trace_array *tr;
6653 int ret;
277ba044
SR
6654
6655 mutex_lock(&trace_types_lock);
6656
6657 ret = -EEXIST;
6658 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
6659 if (tr->name && strcmp(tr->name, name) == 0)
6660 goto out_unlock;
6661 }
6662
6663 ret = -ENOMEM;
6664 tr = kzalloc(sizeof(*tr), GFP_KERNEL);
6665 if (!tr)
6666 goto out_unlock;
6667
6668 tr->name = kstrdup(name, GFP_KERNEL);
6669 if (!tr->name)
6670 goto out_free_tr;
6671
ccfe9e42
AL
6672 if (!alloc_cpumask_var(&tr->tracing_cpumask, GFP_KERNEL))
6673 goto out_free_tr;
6674
983f938a
SRRH
6675 tr->trace_flags = global_trace.trace_flags;
6676
ccfe9e42
AL
6677 cpumask_copy(tr->tracing_cpumask, cpu_all_mask);
6678
277ba044
SR
6679 raw_spin_lock_init(&tr->start_lock);
6680
0b9b12c1
SRRH
6681 tr->max_lock = (arch_spinlock_t)__ARCH_SPIN_LOCK_UNLOCKED;
6682
277ba044
SR
6683 tr->current_trace = &nop_trace;
6684
6685 INIT_LIST_HEAD(&tr->systems);
6686 INIT_LIST_HEAD(&tr->events);
6687
737223fb 6688 if (allocate_trace_buffers(tr, trace_buf_size) < 0)
277ba044
SR
6689 goto out_free_tr;
6690
8434dc93 6691 tr->dir = tracefs_create_dir(name, trace_instance_dir);
277ba044
SR
6692 if (!tr->dir)
6693 goto out_free_tr;
6694
6695 ret = event_trace_add_tracer(tr->dir, tr);
609e85a7 6696 if (ret) {
8434dc93 6697 tracefs_remove_recursive(tr->dir);
277ba044 6698 goto out_free_tr;
609e85a7 6699 }
277ba044 6700
8434dc93 6701 init_tracer_tracefs(tr, tr->dir);
9a38a885 6702 init_trace_flags_index(tr);
37aea98b 6703 __update_tracer_options(tr);
277ba044
SR
6704
6705 list_add(&tr->list, &ftrace_trace_arrays);
6706
6707 mutex_unlock(&trace_types_lock);
6708
6709 return 0;
6710
6711 out_free_tr:
23aaa3c1 6712 free_trace_buffers(tr);
ccfe9e42 6713 free_cpumask_var(tr->tracing_cpumask);
277ba044
SR
6714 kfree(tr->name);
6715 kfree(tr);
6716
6717 out_unlock:
6718 mutex_unlock(&trace_types_lock);
6719
6720 return ret;
6721
6722}
6723
eae47358 6724static int instance_rmdir(const char *name)
0c8916c3
SR
6725{
6726 struct trace_array *tr;
6727 int found = 0;
6728 int ret;
37aea98b 6729 int i;
0c8916c3
SR
6730
6731 mutex_lock(&trace_types_lock);
6732
6733 ret = -ENODEV;
6734 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
6735 if (tr->name && strcmp(tr->name, name) == 0) {
6736 found = 1;
6737 break;
6738 }
6739 }
6740 if (!found)
6741 goto out_unlock;
6742
a695cb58 6743 ret = -EBUSY;
cf6ab6d9 6744 if (tr->ref || (tr->current_trace && tr->current_trace->ref))
a695cb58
SRRH
6745 goto out_unlock;
6746
0c8916c3
SR
6747 list_del(&tr->list);
6748
6b450d25 6749 tracing_set_nop(tr);
0c8916c3 6750 event_trace_del_tracer(tr);
591dffda 6751 ftrace_destroy_function_files(tr);
681a4a2f 6752 tracefs_remove_recursive(tr->dir);
a9fcaaac 6753 free_trace_buffers(tr);
0c8916c3 6754
37aea98b
SRRH
6755 for (i = 0; i < tr->nr_topts; i++) {
6756 kfree(tr->topts[i].topts);
6757 }
6758 kfree(tr->topts);
6759
0c8916c3
SR
6760 kfree(tr->name);
6761 kfree(tr);
6762
6763 ret = 0;
6764
6765 out_unlock:
6766 mutex_unlock(&trace_types_lock);
6767
6768 return ret;
6769}
6770
277ba044
SR
6771static __init void create_trace_instances(struct dentry *d_tracer)
6772{
eae47358
SRRH
6773 trace_instance_dir = tracefs_create_instance_dir("instances", d_tracer,
6774 instance_mkdir,
6775 instance_rmdir);
277ba044
SR
6776 if (WARN_ON(!trace_instance_dir))
6777 return;
277ba044
SR
6778}
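Instances are then managed with plain mkdir(2)/rmdir(2), which tracefs routes to instance_mkdir()/instance_rmdir() above. A sketch, with the path as an assumption:

#include <stdio.h>
#include <sys/stat.h>
#include <unistd.h>

int main(void)
{
	const char *dir = "/sys/kernel/debug/tracing/instances/demo";

	if (mkdir(dir, 0755) < 0)	/* allocates a new trace_array */
		perror("mkdir");
	/* ... demo/ now has its own trace, trace_pipe, events/, ... */
	if (rmdir(dir) < 0)		/* fails with -EBUSY while in use */
		perror("rmdir");
	return 0;
}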
6779
2b6080f2 6780static void
8434dc93 6781init_tracer_tracefs(struct trace_array *tr, struct dentry *d_tracer)
2b6080f2 6782{
121aaee7 6783 int cpu;
2b6080f2 6784
607e2ea1
SRRH
6785 trace_create_file("available_tracers", 0444, d_tracer,
6786 tr, &show_traces_fops);
6787
6788 trace_create_file("current_tracer", 0644, d_tracer,
6789 tr, &set_tracer_fops);
6790
ccfe9e42
AL
6791 trace_create_file("tracing_cpumask", 0644, d_tracer,
6792 tr, &tracing_cpumask_fops);
6793
2b6080f2
SR
6794 trace_create_file("trace_options", 0644, d_tracer,
6795 tr, &tracing_iter_fops);
6796
6797 trace_create_file("trace", 0644, d_tracer,
6484c71c 6798 tr, &tracing_fops);
2b6080f2
SR
6799
6800 trace_create_file("trace_pipe", 0444, d_tracer,
15544209 6801 tr, &tracing_pipe_fops);
2b6080f2
SR
6802
6803 trace_create_file("buffer_size_kb", 0644, d_tracer,
0bc392ee 6804 tr, &tracing_entries_fops);
2b6080f2
SR
6805
6806 trace_create_file("buffer_total_size_kb", 0444, d_tracer,
6807 tr, &tracing_total_entries_fops);
6808
238ae93d 6809 trace_create_file("free_buffer", 0200, d_tracer,
2b6080f2
SR
6810 tr, &tracing_free_buffer_fops);
6811
6812 trace_create_file("trace_marker", 0220, d_tracer,
6813 tr, &tracing_mark_fops);
6814
6815 trace_create_file("trace_clock", 0644, d_tracer, tr,
6816 &trace_clock_fops);
6817
6818 trace_create_file("tracing_on", 0644, d_tracer,
6484c71c 6819 tr, &rb_simple_fops);
ce9bae55 6820
16270145
SRRH
6821 create_trace_options_dir(tr);
6822
6d9b3fa5
SRRH
6823#ifdef CONFIG_TRACER_MAX_TRACE
6824 trace_create_file("tracing_max_latency", 0644, d_tracer,
6825 &tr->max_latency, &tracing_max_lat_fops);
6826#endif
6827
591dffda
SRRH
6828 if (ftrace_create_function_files(tr, d_tracer))
6829 WARN(1, "Could not allocate function filter files");
6830
ce9bae55
SRRH
6831#ifdef CONFIG_TRACER_SNAPSHOT
6832 trace_create_file("snapshot", 0644, d_tracer,
6484c71c 6833 tr, &snapshot_fops);
ce9bae55 6834#endif
121aaee7
SRRH
6835
6836 for_each_tracing_cpu(cpu)
8434dc93 6837 tracing_init_tracefs_percpu(tr, cpu);
121aaee7 6838
2b6080f2
SR
6839}
6840
f76180bc
SRRH
 6841static struct vfsmount *trace_automount(void *ignore)
6842{
6843 struct vfsmount *mnt;
6844 struct file_system_type *type;
6845
6846 /*
6847 * To maintain backward compatibility for tools that mount
6848 * debugfs to get to the tracing facility, tracefs is automatically
6849 * mounted to the debugfs/tracing directory.
6850 */
6851 type = get_fs_type("tracefs");
6852 if (!type)
6853 return NULL;
6854 mnt = vfs_kern_mount(type, 0, "tracefs", NULL);
6855 put_filesystem(type);
6856 if (IS_ERR(mnt))
6857 return NULL;
6858 mntget(mnt);
6859
6860 return mnt;
6861}
6862
7eeafbca
SRRH
6863/**
6864 * tracing_init_dentry - initialize top level trace array
6865 *
6866 * This is called when creating files or directories in the tracing
6867 * directory. It is called via fs_initcall() by any of the boot up code
6868 * and expects to return the dentry of the top level tracing directory.
6869 */
6870struct dentry *tracing_init_dentry(void)
6871{
6872 struct trace_array *tr = &global_trace;
6873
f76180bc 6874 /* The top level trace array uses NULL as parent */
7eeafbca 6875 if (tr->dir)
f76180bc 6876 return NULL;
7eeafbca 6877
8b129199
JW
6878 if (WARN_ON(!tracefs_initialized()) ||
6879 (IS_ENABLED(CONFIG_DEBUG_FS) &&
6880 WARN_ON(!debugfs_initialized())))
7eeafbca
SRRH
6881 return ERR_PTR(-ENODEV);
6882
f76180bc
SRRH
6883 /*
6884 * As there may still be users that expect the tracing
6885 * files to exist in debugfs/tracing, we must automount
6886 * the tracefs file system there, so older tools still
 6887 * work with the newer kernel.
6888 */
6889 tr->dir = debugfs_create_automount("tracing", NULL,
6890 trace_automount, NULL);
7eeafbca
SRRH
6891 if (!tr->dir) {
6892 pr_warn_once("Could not create debugfs directory 'tracing'\n");
6893 return ERR_PTR(-ENOMEM);
6894 }
6895
8434dc93 6896 return NULL;
7eeafbca
SRRH
6897}
6898
0c564a53
SRRH
6899extern struct trace_enum_map *__start_ftrace_enum_maps[];
6900extern struct trace_enum_map *__stop_ftrace_enum_maps[];
6901
6902static void __init trace_enum_init(void)
6903{
3673b8e4
SRRH
6904 int len;
6905
6906 len = __stop_ftrace_enum_maps - __start_ftrace_enum_maps;
9828413d 6907 trace_insert_enum_map(NULL, __start_ftrace_enum_maps, len);
3673b8e4
SRRH
6908}
6909
6910#ifdef CONFIG_MODULES
6911static void trace_module_add_enums(struct module *mod)
6912{
6913 if (!mod->num_trace_enums)
6914 return;
6915
6916 /*
 6917 * Modules with bad taint do not have events created, so do
 6918 * not bother with enums either.
6919 */
6920 if (trace_module_has_bad_taint(mod))
6921 return;
6922
9828413d 6923 trace_insert_enum_map(mod, mod->trace_enums, mod->num_trace_enums);
3673b8e4
SRRH
6924}
6925
9828413d
SRRH
6926#ifdef CONFIG_TRACE_ENUM_MAP_FILE
6927static void trace_module_remove_enums(struct module *mod)
6928{
6929 union trace_enum_map_item *map;
6930 union trace_enum_map_item **last = &trace_enum_maps;
6931
6932 if (!mod->num_trace_enums)
6933 return;
6934
6935 mutex_lock(&trace_enum_mutex);
6936
6937 map = trace_enum_maps;
6938
6939 while (map) {
6940 if (map->head.mod == mod)
6941 break;
6942 map = trace_enum_jmp_to_tail(map);
6943 last = &map->tail.next;
6944 map = map->tail.next;
6945 }
6946 if (!map)
6947 goto out;
6948
6949 *last = trace_enum_jmp_to_tail(map)->tail.next;
6950 kfree(map);
6951 out:
6952 mutex_unlock(&trace_enum_mutex);
6953}
6954#else
6955static inline void trace_module_remove_enums(struct module *mod) { }
6956#endif /* CONFIG_TRACE_ENUM_MAP_FILE */
6957
3673b8e4
SRRH
6958static int trace_module_notify(struct notifier_block *self,
6959 unsigned long val, void *data)
6960{
6961 struct module *mod = data;
6962
6963 switch (val) {
6964 case MODULE_STATE_COMING:
6965 trace_module_add_enums(mod);
6966 break;
9828413d
SRRH
6967 case MODULE_STATE_GOING:
6968 trace_module_remove_enums(mod);
6969 break;
3673b8e4
SRRH
6970 }
6971
6972 return 0;
0c564a53
SRRH
6973}
6974
3673b8e4
SRRH
6975static struct notifier_block trace_module_nb = {
6976 .notifier_call = trace_module_notify,
6977 .priority = 0,
6978};
9828413d 6979#endif /* CONFIG_MODULES */
3673b8e4 6980
8434dc93 6981static __init int tracer_init_tracefs(void)
bc0c38d1
SR
6982{
6983 struct dentry *d_tracer;
bc0c38d1 6984
7e53bd42
LJ
6985 trace_access_lock_init();
6986
bc0c38d1 6987 d_tracer = tracing_init_dentry();
14a5ae40 6988 if (IS_ERR(d_tracer))
ed6f1c99 6989 return 0;
bc0c38d1 6990
8434dc93 6991 init_tracer_tracefs(&global_trace, d_tracer);
bc0c38d1 6992
5452af66 6993 trace_create_file("tracing_thresh", 0644, d_tracer,
6508fa76 6994 &global_trace, &tracing_thresh_fops);
a8259075 6995
339ae5d3 6996 trace_create_file("README", 0444, d_tracer,
5452af66
FW
6997 NULL, &tracing_readme_fops);
6998
69abe6a5
AP
6999 trace_create_file("saved_cmdlines", 0444, d_tracer,
7000 NULL, &tracing_saved_cmdlines_fops);
5bf9a1ee 7001
939c7a4f
YY
7002 trace_create_file("saved_cmdlines_size", 0644, d_tracer,
7003 NULL, &tracing_saved_cmdlines_size_fops);
7004
0c564a53
SRRH
7005 trace_enum_init();
7006
9828413d
SRRH
7007 trace_create_enum_file(d_tracer);
7008
3673b8e4
SRRH
7009#ifdef CONFIG_MODULES
7010 register_module_notifier(&trace_module_nb);
7011#endif
7012
bc0c38d1 7013#ifdef CONFIG_DYNAMIC_FTRACE
5452af66
FW
7014 trace_create_file("dyn_ftrace_total_info", 0444, d_tracer,
7015 &ftrace_update_tot_cnt, &tracing_dyn_info_fops);
bc0c38d1 7016#endif
b04cc6b1 7017
277ba044 7018 create_trace_instances(d_tracer);
5452af66 7019
37aea98b 7020 update_tracer_options(&global_trace);
09d23a1d 7021
b5ad384e 7022 return 0;
bc0c38d1
SR
7023}
7024
3f5a54e3
SR
7025static int trace_panic_handler(struct notifier_block *this,
7026 unsigned long event, void *unused)
7027{
944ac425 7028 if (ftrace_dump_on_oops)
cecbca96 7029 ftrace_dump(ftrace_dump_on_oops);
3f5a54e3
SR
7030 return NOTIFY_OK;
7031}
7032
7033static struct notifier_block trace_panic_notifier = {
7034 .notifier_call = trace_panic_handler,
7035 .next = NULL,
7036 .priority = 150 /* priority: INT_MAX >= x >= 0 */
7037};
7038
7039static int trace_die_handler(struct notifier_block *self,
7040 unsigned long val,
7041 void *data)
7042{
7043 switch (val) {
7044 case DIE_OOPS:
944ac425 7045 if (ftrace_dump_on_oops)
cecbca96 7046 ftrace_dump(ftrace_dump_on_oops);
3f5a54e3
SR
7047 break;
7048 default:
7049 break;
7050 }
7051 return NOTIFY_OK;
7052}
7053
7054static struct notifier_block trace_die_notifier = {
7055 .notifier_call = trace_die_handler,
7056 .priority = 200
7057};
7058
7059/*
 7060 * printk is set to a max of 1024; we really don't need it that big.
7061 * Nothing should be printing 1000 characters anyway.
7062 */
7063#define TRACE_MAX_PRINT 1000
7064
7065/*
7066 * Define here KERN_TRACE so that we have one place to modify
7067 * it if we decide to change what log level the ftrace dump
7068 * should be at.
7069 */
428aee14 7070#define KERN_TRACE KERN_EMERG
3f5a54e3 7071
955b61e5 7072void
3f5a54e3
SR
7073trace_printk_seq(struct trace_seq *s)
7074{
7075 /* Probably should print a warning here. */
3a161d99
SRRH
7076 if (s->seq.len >= TRACE_MAX_PRINT)
7077 s->seq.len = TRACE_MAX_PRINT;
3f5a54e3 7078
820b75f6
SRRH
7079 /*
7080 * More paranoid code. Although the buffer size is set to
7081 * PAGE_SIZE, and TRACE_MAX_PRINT is 1000, this is just
7082 * an extra layer of protection.
7083 */
7084 if (WARN_ON_ONCE(s->seq.len >= s->seq.size))
7085 s->seq.len = s->seq.size - 1;
3f5a54e3
SR
7086
7087 /* should be zero ended, but we are paranoid. */
3a161d99 7088 s->buffer[s->seq.len] = 0;
3f5a54e3
SR
7089
7090 printk(KERN_TRACE "%s", s->buffer);
7091
f9520750 7092 trace_seq_init(s);
3f5a54e3
SR
7093}
7094
955b61e5
JW
7095void trace_init_global_iter(struct trace_iterator *iter)
7096{
7097 iter->tr = &global_trace;
2b6080f2 7098 iter->trace = iter->tr->current_trace;
ae3b5093 7099 iter->cpu_file = RING_BUFFER_ALL_CPUS;
12883efb 7100 iter->trace_buffer = &global_trace.trace_buffer;
b2f974d6
CS
7101
7102 if (iter->trace && iter->trace->open)
7103 iter->trace->open(iter);
7104
7105 /* Annotate start of buffers if we had overruns */
7106 if (ring_buffer_overruns(iter->trace_buffer->buffer))
7107 iter->iter_flags |= TRACE_FILE_ANNOTATE;
7108
7109 /* Output in nanoseconds only if we are using a clock in nanoseconds. */
7110 if (trace_clocks[iter->tr->clock_id].in_ns)
7111 iter->iter_flags |= TRACE_FILE_TIME_IN_NS;
955b61e5
JW
7112}
7113
7fe70b57 7114void ftrace_dump(enum ftrace_dump_mode oops_dump_mode)
3f5a54e3 7115{
3f5a54e3
SR
7116 /* use static because iter can be a bit big for the stack */
7117 static struct trace_iterator iter;
7fe70b57 7118 static atomic_t dump_running;
983f938a 7119 struct trace_array *tr = &global_trace;
cf586b61 7120 unsigned int old_userobj;
d769041f
SR
7121 unsigned long flags;
7122 int cnt = 0, cpu;
3f5a54e3 7123
7fe70b57
SRRH
7124 /* Only allow one dump user at a time. */
7125 if (atomic_inc_return(&dump_running) != 1) {
7126 atomic_dec(&dump_running);
7127 return;
7128 }
3f5a54e3 7129
7fe70b57
SRRH
7130 /*
7131 * Always turn off tracing when we dump.
7132 * We don't need to show trace output of what happens
7133 * between multiple crashes.
7134 *
7135 * If the user does a sysrq-z, then they can re-enable
7136 * tracing with echo 1 > tracing_on.
7137 */
0ee6b6cf 7138 tracing_off();
cf586b61 7139
7fe70b57 7140 local_irq_save(flags);
3f5a54e3 7141
38dbe0b1 7142 /* Simulate the iterator */
955b61e5
JW
7143 trace_init_global_iter(&iter);
7144
d769041f 7145 for_each_tracing_cpu(cpu) {
5e2d5ef8 7146 atomic_inc(&per_cpu_ptr(iter.trace_buffer->data, cpu)->disabled);
d769041f
SR
7147 }
7148
983f938a 7149 old_userobj = tr->trace_flags & TRACE_ITER_SYM_USEROBJ;
cf586b61 7150
b54d3de9 7151 /* don't look at user memory in panic mode */
983f938a 7152 tr->trace_flags &= ~TRACE_ITER_SYM_USEROBJ;
b54d3de9 7153
cecbca96
FW
7154 switch (oops_dump_mode) {
7155 case DUMP_ALL:
ae3b5093 7156 iter.cpu_file = RING_BUFFER_ALL_CPUS;
cecbca96
FW
7157 break;
7158 case DUMP_ORIG:
7159 iter.cpu_file = raw_smp_processor_id();
7160 break;
7161 case DUMP_NONE:
7162 goto out_enable;
7163 default:
7164 printk(KERN_TRACE "Bad dumping mode, switching to all CPUs dump\n");
ae3b5093 7165 iter.cpu_file = RING_BUFFER_ALL_CPUS;
cecbca96
FW
7166 }
7167
7168 printk(KERN_TRACE "Dumping ftrace buffer:\n");
3f5a54e3 7169
7fe70b57
SRRH
7170 /* Did function tracer already get disabled? */
7171 if (ftrace_is_dead()) {
7172 printk("# WARNING: FUNCTION TRACING IS CORRUPTED\n");
7173 printk("# MAY BE MISSING FUNCTION EVENTS\n");
7174 }
7175
3f5a54e3
SR
7176 /*
 7177 * We need to stop all tracing on all CPUs to read
 7178 * the next buffer. This is a bit expensive, but is
 7179 * not done often. We fill in all that we can read,
7180 * and then release the locks again.
7181 */
7182
3f5a54e3
SR
	while (!trace_empty(&iter)) {

		if (!cnt)
			printk(KERN_TRACE "---------------------------------\n");

		cnt++;

		/* reset all but tr, trace, and overruns */
		memset(&iter.seq, 0,
		       sizeof(struct trace_iterator) -
		       offsetof(struct trace_iterator, seq));
		iter.iter_flags |= TRACE_FILE_LAT_FMT;
		iter.pos = -1;

		if (trace_find_next_entry_inc(&iter) != NULL) {
			int ret;

			ret = print_trace_line(&iter);
			if (ret != TRACE_TYPE_NO_CONSUME)
				trace_consume(&iter);
		}
		touch_nmi_watchdog();

		trace_printk_seq(&iter.seq);
	}

	if (!cnt)
		printk(KERN_TRACE "   (ftrace buffer empty)\n");
	else
		printk(KERN_TRACE "---------------------------------\n");

 out_enable:
	tr->trace_flags |= old_userobj;

	for_each_tracing_cpu(cpu) {
		atomic_dec(&per_cpu_ptr(iter.trace_buffer->data, cpu)->disabled);
	}
	atomic_dec(&dump_running);
	local_irq_restore(flags);
}
EXPORT_SYMBOL_GPL(ftrace_dump);

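/*
 * Illustrative sketch, not part of the original file: because
 * ftrace_dump() is exported GPL, a module can dump the ring buffer
 * from its own fatal-error path. example_fatal_path() is a
 * hypothetical name; DUMP_ALL and DUMP_ORIG are the real
 * enum ftrace_dump_mode values handled in the switch above. The same
 * dump can also be requested automatically on an oops via the
 * ftrace_dump_on_oops kernel boot parameter.
 */
static void example_fatal_path(void)
{
	/* DUMP_ORIG would restrict output to the calling CPU's buffer */
	ftrace_dump(DUMP_ALL);
}
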
__init static int tracer_alloc_buffers(void)
{
	int ring_buf_size;
	int ret = -ENOMEM;

	/*
	 * Make sure we don't accidentally add more trace options
	 * than we have bits for.
	 */
	BUILD_BUG_ON(TRACE_ITER_LAST_BIT > TRACE_FLAGS_MAX_SIZE);

	if (!alloc_cpumask_var(&tracing_buffer_mask, GFP_KERNEL))
		goto out;

	if (!alloc_cpumask_var(&global_trace.tracing_cpumask, GFP_KERNEL))
		goto out_free_buffer_mask;

	/* Only allocate trace_printk buffers if a trace_printk exists */
	if (__stop___trace_bprintk_fmt != __start___trace_bprintk_fmt)
		/* Must be called before global_trace.buffer is allocated */
		trace_printk_init_buffers();

	/* To save memory, keep the ring buffer size to its minimum */
	if (ring_buffer_expanded)
		ring_buf_size = trace_buf_size;
	else
		ring_buf_size = 1;

	cpumask_copy(tracing_buffer_mask, cpu_possible_mask);
	cpumask_copy(global_trace.tracing_cpumask, cpu_all_mask);

	raw_spin_lock_init(&global_trace.start_lock);

	/* Used for event triggers */
	temp_buffer = ring_buffer_alloc(PAGE_SIZE, RB_FL_OVERWRITE);
	if (!temp_buffer)
		goto out_free_cpumask;

	if (trace_create_savedcmd() < 0)
		goto out_free_temp_buffer;

	/* TODO: make the number of buffers hot pluggable with CPUs */
	if (allocate_trace_buffers(&global_trace, ring_buf_size) < 0) {
		printk(KERN_ERR "tracer: failed to allocate ring buffer!\n");
		WARN_ON(1);
		goto out_free_savedcmd;
	}

	if (global_trace.buffer_disabled)
		tracing_off();

	if (trace_boot_clock) {
		ret = tracing_set_clock(&global_trace, trace_boot_clock);
		if (ret < 0)
			pr_warn("Trace clock %s not defined, going back to default\n",
				trace_boot_clock);
	}

	/*
	 * register_tracer() might reference current_trace, so it
	 * needs to be set before we register anything. This is
	 * just a bootstrap of current_trace anyway.
	 */
	global_trace.current_trace = &nop_trace;

	global_trace.max_lock = (arch_spinlock_t)__ARCH_SPIN_LOCK_UNLOCKED;

	ftrace_init_global_array_ops(&global_trace);

	init_trace_flags_index(&global_trace);

	register_tracer(&nop_trace);

	/* All seems OK, enable tracing */
	tracing_disabled = 0;

	atomic_notifier_chain_register(&panic_notifier_list,
				       &trace_panic_notifier);

	register_die_notifier(&trace_die_notifier);

	global_trace.flags = TRACE_ARRAY_FL_GLOBAL;

	INIT_LIST_HEAD(&global_trace.systems);
	INIT_LIST_HEAD(&global_trace.events);
	list_add(&global_trace.list, &ftrace_trace_arrays);

	apply_trace_boot_options();

	register_snapshot_cmd();

	return 0;

out_free_savedcmd:
	free_saved_cmdlines_buffer(savedcmd);
out_free_temp_buffer:
	ring_buffer_free(temp_buffer);
out_free_cpumask:
	free_cpumask_var(global_trace.tracing_cpumask);
out_free_buffer_mask:
	free_cpumask_var(tracing_buffer_mask);
out:
	return ret;
}
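
/*
 * Illustrative note, not part of the original file: the minimum-size
 * trick above keeps the global buffer at one page until something
 * expands it, typically the documented trace_buf_size= boot parameter
 * (e.g. trace_buf_size=1048576) or a later write to
 * /sys/kernel/debug/tracing/buffer_size_kb. Code that needs a
 * full-size buffer can call tracing_update_buffers() first, which
 * expands the buffer only if ring_buffer_expanded is still unset; a
 * hedged sketch with a hypothetical helper name:
 */
static int example_enable_my_event(void)
{
	int ret;

	/* expand the ring buffer to trace_buf_size if still minimal */
	ret = tracing_update_buffers();
	if (ret < 0)
		return ret;

	/* ... enable the event here ... */
	return 0;
}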

void __init trace_init(void)
{
	if (tracepoint_printk) {
		tracepoint_print_iter =
			kmalloc(sizeof(*tracepoint_print_iter), GFP_KERNEL);
		if (WARN_ON(!tracepoint_print_iter))
			tracepoint_printk = 0;
	}
	tracer_alloc_buffers();
	trace_event_init();
}

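/*
 * Illustrative note, not part of the original file: tracepoint_printk
 * is normally switched on from the kernel command line via the
 * documented tp_printk boot parameter, so the allocation above only
 * runs when the user asked for trace events to be piped to printk,
 * e.g.:
 *
 *	linux ... trace_event=sched_switch tp_printk
 */
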
__init static int clear_boot_tracer(void)
{
	/*
	 * The name of the default tracer set at boot lives in an init
	 * section. This function is called at late_initcall time; if
	 * the boot tracer was never registered by then, clear the
	 * pointer out, to prevent a later registration from accessing
	 * the buffer that is about to be freed.
	 */
	if (!default_bootup_tracer)
		return 0;

	printk(KERN_INFO "ftrace bootup tracer '%s' not registered.\n",
	       default_bootup_tracer);
	default_bootup_tracer = NULL;

	return 0;
}

fs_initcall(tracer_init_tracefs);
late_initcall(clear_boot_tracer);
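
/*
 * Illustrative note, not part of the original file:
 * default_bootup_tracer is set by the documented ftrace= boot
 * parameter, so the warning in clear_boot_tracer() fires when e.g.
 *
 *	linux ... ftrace=function
 *
 * names a tracer that was never registered (not built in, say), and
 * the stale init-section pointer must be dropped before it is freed.
 */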