]> git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blame - kernel/trace/trace.c
tracing: Make tracing_init_dentry_tr() static
[mirror_ubuntu-jammy-kernel.git] / kernel / trace / trace.c
CommitLineData
bc0c38d1
SR
1/*
2 * ring buffer based function tracer
3 *
2b6080f2 4 * Copyright (C) 2007-2012 Steven Rostedt <srostedt@redhat.com>
bc0c38d1
SR
5 * Copyright (C) 2008 Ingo Molnar <mingo@redhat.com>
6 *
7 * Originally taken from the RT patch by:
8 * Arnaldo Carvalho de Melo <acme@redhat.com>
9 *
10 * Based on code from the latency_tracer, that is:
11 * Copyright (C) 2004-2006 Ingo Molnar
6d49e352 12 * Copyright (C) 2004 Nadia Yvette Chambers
bc0c38d1 13 */
2cadf913 14#include <linux/ring_buffer.h>
273b281f 15#include <generated/utsrelease.h>
2cadf913
SR
16#include <linux/stacktrace.h>
17#include <linux/writeback.h>
bc0c38d1
SR
18#include <linux/kallsyms.h>
19#include <linux/seq_file.h>
3f5a54e3 20#include <linux/notifier.h>
2cadf913 21#include <linux/irqflags.h>
bc0c38d1 22#include <linux/debugfs.h>
4c11d7ae 23#include <linux/pagemap.h>
bc0c38d1
SR
24#include <linux/hardirq.h>
25#include <linux/linkage.h>
26#include <linux/uaccess.h>
2cadf913 27#include <linux/kprobes.h>
bc0c38d1
SR
28#include <linux/ftrace.h>
29#include <linux/module.h>
30#include <linux/percpu.h>
2cadf913 31#include <linux/splice.h>
3f5a54e3 32#include <linux/kdebug.h>
5f0c6c03 33#include <linux/string.h>
7e53bd42 34#include <linux/rwsem.h>
5a0e3ad6 35#include <linux/slab.h>
bc0c38d1
SR
36#include <linux/ctype.h>
37#include <linux/init.h>
2a2cc8f7 38#include <linux/poll.h>
b892e5c8 39#include <linux/nmi.h>
bc0c38d1 40#include <linux/fs.h>
8bd75c77 41#include <linux/sched/rt.h>
86387f7e 42
bc0c38d1 43#include "trace.h"
f0868d1e 44#include "trace_output.h"
bc0c38d1 45
73c5162a
SR
46/*
47 * On boot up, the ring buffer is set to the minimum size, so that
48 * we do not waste memory on systems that are not using tracing.
49 */
55034cd6 50bool ring_buffer_expanded;
73c5162a 51
8e1b82e0
FW
52/*
53 * We need to change this state when a selftest is running.
ff32504f
FW
54 * A selftest will lurk into the ring-buffer to count the
55 * entries inserted during the selftest although some concurrent
5e1607a0 56 * insertions into the ring-buffer such as trace_printk could occur
ff32504f
FW
57 * at the same time, giving false positive or negative results.
58 */
8e1b82e0 59static bool __read_mostly tracing_selftest_running;
ff32504f 60
b2821ae6
SR
61/*
62 * If a tracer is running, we do not want to run SELFTEST.
63 */
020e5f85 64bool __read_mostly tracing_selftest_disabled;
b2821ae6 65
0daa2302
SRRH
66/* Pipe tracepoints to printk */
67struct trace_iterator *tracepoint_print_iter;
68int tracepoint_printk;
69
adf9f195
FW
70/* For tracers that don't implement custom flags */
/* Option table with a single zero-initialized entry and nothing else. */
71static struct tracer_opt dummy_tracer_opt[] = {
72 { }
73};
74
/* Flags descriptor with no bits set; its option list is dummy_tracer_opt. */
75static struct tracer_flags dummy_tracer_flags = {
76 .val = 0,
77 .opts = dummy_tracer_opt
78};
79
8c1a49ae
SRRH
80static int
81dummy_set_flag(struct trace_array *tr, u32 old_flags, u32 bit, int set)
adf9f195
FW
82{
83 return 0;
84}
0f048701 85
7ffbd48d
SR
86/*
87 * To prevent the comm cache from being overwritten when no
88 * tracing is active, only save the comm when a trace event
89 * occurred.
90 */
91static DEFINE_PER_CPU(bool, trace_cmdline_save);
92
0f048701
SR
93/*
94 * Kill all tracing for good (never come back).
95 * It is initialized to 1 but will turn to zero if the initialization
96 * of the tracer is successful. But that is the only place that sets
97 * this back to zero.
98 */
4fd27358 99static int tracing_disabled = 1;
0f048701 100
9288f99a 101DEFINE_PER_CPU(int, ftrace_cpu_disabled);
d769041f 102
955b61e5 103cpumask_var_t __read_mostly tracing_buffer_mask;
ab46428c 104
944ac425
SR
105/*
106 * ftrace_dump_on_oops - variable to dump ftrace buffer on oops
107 *
108 * If there is an oops (or kernel panic) and the ftrace_dump_on_oops
109 * is set, then ftrace_dump is called. This will output the contents
110 * of the ftrace buffers to the console. This is very useful for
111 * capturing traces that lead to crashes and outputting them to a
112 * serial console.
113 *
114 * It is default off, but you can enable it with either specifying
115 * "ftrace_dump_on_oops" in the kernel command line, or setting
cecbca96
FW
116 * /proc/sys/kernel/ftrace_dump_on_oops
117 * Set 1 if you want to dump buffers of all CPUs
118 * Set 2 if you want to dump the buffer of the CPU that triggered oops
944ac425 119 */
cecbca96
FW
120
121enum ftrace_dump_mode ftrace_dump_on_oops;
944ac425 122
de7edd31
SRRH
123/* When set, tracing will stop when a WARN*() is hit */
124int __disable_trace_on_warning;
125
607e2ea1 126static int tracing_set_tracer(struct trace_array *tr, const char *buf);
b2821ae6 127
ee6c2c1b
LZ
128#define MAX_TRACER_SIZE 100
129static char bootup_tracer_buf[MAX_TRACER_SIZE] __initdata;
b2821ae6 130static char *default_bootup_tracer;
d9e54076 131
55034cd6
SRRH
132static bool allocate_snapshot;
133
1beee96b 134static int __init set_cmdline_ftrace(char *str)
d9e54076 135{
67012ab1 136 strlcpy(bootup_tracer_buf, str, MAX_TRACER_SIZE);
b2821ae6 137 default_bootup_tracer = bootup_tracer_buf;
73c5162a 138 /* We are using ftrace early, expand it */
55034cd6 139 ring_buffer_expanded = true;
d9e54076
PZ
140 return 1;
141}
1beee96b 142__setup("ftrace=", set_cmdline_ftrace);
d9e54076 143
944ac425
SR
144static int __init set_ftrace_dump_on_oops(char *str)
145{
cecbca96
FW
146 if (*str++ != '=' || !*str) {
147 ftrace_dump_on_oops = DUMP_ALL;
148 return 1;
149 }
150
151 if (!strcmp("orig_cpu", str)) {
152 ftrace_dump_on_oops = DUMP_ORIG;
153 return 1;
154 }
155
156 return 0;
944ac425
SR
157}
158__setup("ftrace_dump_on_oops", set_ftrace_dump_on_oops);
60a11774 159
de7edd31
SRRH
160static int __init stop_trace_on_warning(char *str)
161{
933ff9f2
LCG
162 if ((strcmp(str, "=0") != 0 && strcmp(str, "=off") != 0))
163 __disable_trace_on_warning = 1;
de7edd31
SRRH
164 return 1;
165}
933ff9f2 166__setup("traceoff_on_warning", stop_trace_on_warning);
de7edd31 167
3209cff4 168static int __init boot_alloc_snapshot(char *str)
55034cd6
SRRH
169{
170 allocate_snapshot = true;
171 /* We also need the main ring buffer expanded */
172 ring_buffer_expanded = true;
173 return 1;
174}
3209cff4 175__setup("alloc_snapshot", boot_alloc_snapshot);
55034cd6 176
7bcfaf54
SR
177
178static char trace_boot_options_buf[MAX_TRACER_SIZE] __initdata;
179static char *trace_boot_options __initdata;
180
181static int __init set_trace_boot_options(char *str)
182{
67012ab1 183 strlcpy(trace_boot_options_buf, str, MAX_TRACER_SIZE);
7bcfaf54
SR
184 trace_boot_options = trace_boot_options_buf;
185 return 0;
186}
187__setup("trace_options=", set_trace_boot_options);
188
e1e232ca
SR
189static char trace_boot_clock_buf[MAX_TRACER_SIZE] __initdata;
190static char *trace_boot_clock __initdata;
191
192static int __init set_trace_boot_clock(char *str)
193{
194 strlcpy(trace_boot_clock_buf, str, MAX_TRACER_SIZE);
195 trace_boot_clock = trace_boot_clock_buf;
196 return 0;
197}
198__setup("trace_clock=", set_trace_boot_clock);
199
0daa2302
SRRH
200static int __init set_tracepoint_printk(char *str)
201{
202 if ((strcmp(str, "=0") != 0 && strcmp(str, "=off") != 0))
203 tracepoint_printk = 1;
204 return 1;
205}
206__setup("tp_printk", set_tracepoint_printk);
de7edd31 207
cf8e3474 208unsigned long long ns2usecs(cycle_t nsec)
bc0c38d1
SR
209{
210 nsec += 500;
211 do_div(nsec, 1000);
212 return nsec;
213}
214
4fcdae83
SR
215/*
216 * The global_trace is the descriptor that holds the tracing
217 * buffers for the live tracing. For each CPU, it contains
218 * a link list of pages that will store trace entries. The
219 * page descriptor of the pages in the memory is used to hold
220 * the link list by linking the lru item in the page descriptor
221 * to each of the pages in the buffer per CPU.
222 *
223 * For each active CPU there is a data field that holds the
224 * pages for the buffer for that CPU. Each CPU has the same number
225 * of pages allocated for its buffer.
226 */
bc0c38d1
SR
227static struct trace_array global_trace;
228
ae63b31e 229LIST_HEAD(ftrace_trace_arrays);
bc0c38d1 230
ff451961
SRRH
231int trace_array_get(struct trace_array *this_tr)
232{
233 struct trace_array *tr;
234 int ret = -ENODEV;
235
236 mutex_lock(&trace_types_lock);
237 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
238 if (tr == this_tr) {
239 tr->ref++;
240 ret = 0;
241 break;
242 }
243 }
244 mutex_unlock(&trace_types_lock);
245
246 return ret;
247}
248
249static void __trace_array_put(struct trace_array *this_tr)
250{
251 WARN_ON(!this_tr->ref);
252 this_tr->ref--;
253}
254
255void trace_array_put(struct trace_array *this_tr)
256{
257 mutex_lock(&trace_types_lock);
258 __trace_array_put(this_tr);
259 mutex_unlock(&trace_types_lock);
260}
261
f306cc82
TZ
262int filter_check_discard(struct ftrace_event_file *file, void *rec,
263 struct ring_buffer *buffer,
264 struct ring_buffer_event *event)
eb02ce01 265{
f306cc82
TZ
266 if (unlikely(file->flags & FTRACE_EVENT_FL_FILTERED) &&
267 !filter_match_preds(file->filter, rec)) {
268 ring_buffer_discard_commit(buffer, event);
269 return 1;
270 }
271
272 return 0;
273}
274EXPORT_SYMBOL_GPL(filter_check_discard);
275
276int call_filter_check_discard(struct ftrace_event_call *call, void *rec,
277 struct ring_buffer *buffer,
278 struct ring_buffer_event *event)
279{
280 if (unlikely(call->flags & TRACE_EVENT_FL_FILTERED) &&
281 !filter_match_preds(call->filter, rec)) {
282 ring_buffer_discard_commit(buffer, event);
283 return 1;
284 }
285
286 return 0;
eb02ce01 287}
f306cc82 288EXPORT_SYMBOL_GPL(call_filter_check_discard);
eb02ce01 289
ad1438a0 290static cycle_t buffer_ftrace_now(struct trace_buffer *buf, int cpu)
37886f6a
SR
291{
292 u64 ts;
293
294 /* Early boot up does not have a buffer yet */
9457158b 295 if (!buf->buffer)
37886f6a
SR
296 return trace_clock_local();
297
9457158b
AL
298 ts = ring_buffer_time_stamp(buf->buffer, cpu);
299 ring_buffer_normalize_time_stamp(buf->buffer, cpu, &ts);
37886f6a
SR
300
301 return ts;
302}
bc0c38d1 303
9457158b
AL
304cycle_t ftrace_now(int cpu)
305{
306 return buffer_ftrace_now(&global_trace.trace_buffer, cpu);
307}
308
10246fa3
SRRH
309/**
310 * tracing_is_enabled - Show if global_trace has been disabled
311 *
312 * Shows if the global trace has been enabled or not. It uses the
313 * mirror flag "buffer_disabled" to be used in fast paths such as for
314 * the irqsoff tracer. But it may be inaccurate due to races. If you
315 * need to know the accurate state, use tracing_is_on() which is a little
316 * slower, but accurate.
317 */
9036990d
SR
318int tracing_is_enabled(void)
319{
10246fa3
SRRH
320 /*
321 * For quick access (irqsoff uses this in fast path), just
322 * return the mirror variable of the state of the ring buffer.
323 * It's a little racy, but we don't really care.
324 */
325 smp_rmb();
326 return !global_trace.buffer_disabled;
9036990d
SR
327}
328
4fcdae83 329/*
3928a8a2
SR
330 * trace_buf_size is the size in bytes that is allocated
331 * for a buffer. Note, the number of bytes is always rounded
332 * to page size.
3f5a54e3
SR
333 *
334 * This number is purposely set to a low number of 16384.
335 * If the dump on oops happens, it will be much appreciated
336 * to not have to wait for all that output. Anyway this can be
337 * boot time and run time configurable.
4fcdae83 338 */
3928a8a2 339#define TRACE_BUF_SIZE_DEFAULT 1441792UL /* 16384 * 88 (sizeof(entry)) */
3f5a54e3 340
3928a8a2 341static unsigned long trace_buf_size = TRACE_BUF_SIZE_DEFAULT;
bc0c38d1 342
4fcdae83 343/* trace_types holds a link list of available tracers. */
bc0c38d1 344static struct tracer *trace_types __read_mostly;
4fcdae83 345
4fcdae83
SR
346/*
347 * trace_types_lock is used to protect the trace_types list.
4fcdae83 348 */
a8227415 349DEFINE_MUTEX(trace_types_lock);
4fcdae83 350
7e53bd42
LJ
351/*
352 * serialize the access of the ring buffer
353 *
354 * ring buffer serializes readers, but it is low level protection.
355 * The validity of the events (those returned by ring_buffer_peek(), etc.)
356 * is not protected by the ring buffer.
357 *
358 * The content of events may become garbage if we allow other processes to
359 * consume these events concurrently:
360 * A) the page of the consumed events may become a normal page
361 * (not reader page) in ring buffer, and this page will be rewritten
362 * by the events producer.
363 * B) The page of the consumed events may become a page for splice_read,
364 * and this page will be returned to system.
365 *
366 * These primitives allow multi process access to different cpu ring buffer
367 * concurrently.
368 *
369 * These primitives don't distinguish read-only and read-consume access.
370 * Multi read-only access are also serialized.
371 */
372
373#ifdef CONFIG_SMP
374static DECLARE_RWSEM(all_cpu_access_lock);
375static DEFINE_PER_CPU(struct mutex, cpu_access_lock);
376
377static inline void trace_access_lock(int cpu)
378{
ae3b5093 379 if (cpu == RING_BUFFER_ALL_CPUS) {
7e53bd42
LJ
380 /* gain it for accessing the whole ring buffer. */
381 down_write(&all_cpu_access_lock);
382 } else {
383 /* gain it for accessing a cpu ring buffer. */
384
ae3b5093 385 /* Firstly block other trace_access_lock(RING_BUFFER_ALL_CPUS). */
7e53bd42
LJ
386 down_read(&all_cpu_access_lock);
387
388 /* Secondly block other access to this @cpu ring buffer. */
389 mutex_lock(&per_cpu(cpu_access_lock, cpu));
390 }
391}
392
393static inline void trace_access_unlock(int cpu)
394{
ae3b5093 395 if (cpu == RING_BUFFER_ALL_CPUS) {
7e53bd42
LJ
396 up_write(&all_cpu_access_lock);
397 } else {
398 mutex_unlock(&per_cpu(cpu_access_lock, cpu));
399 up_read(&all_cpu_access_lock);
400 }
401}
402
403static inline void trace_access_lock_init(void)
404{
405 int cpu;
406
407 for_each_possible_cpu(cpu)
408 mutex_init(&per_cpu(cpu_access_lock, cpu));
409}
410
411#else
412
413static DEFINE_MUTEX(access_lock);
414
415static inline void trace_access_lock(int cpu)
416{
417 (void)cpu;
418 mutex_lock(&access_lock);
419}
420
421static inline void trace_access_unlock(int cpu)
422{
423 (void)cpu;
424 mutex_unlock(&access_lock);
425}
426
/* !CONFIG_SMP: access_lock is statically defined, nothing to set up. */
static inline void trace_access_lock_init(void)
{
}
430
431#endif
432
ee6bce52 433/* trace_flags holds trace_options default values */
12ef7d44 434unsigned long trace_flags = TRACE_ITER_PRINT_PARENT | TRACE_ITER_PRINTK |
a2a16d6a 435 TRACE_ITER_ANNOTATE | TRACE_ITER_CONTEXT_INFO | TRACE_ITER_SLEEP_TIME |
77271ce4 436 TRACE_ITER_GRAPH_TIME | TRACE_ITER_RECORD_CMD | TRACE_ITER_OVERWRITE |
328df475 437 TRACE_ITER_IRQ_INFO | TRACE_ITER_MARKERS | TRACE_ITER_FUNCTION;
e7e2ee89 438
5280bcef 439static void tracer_tracing_on(struct trace_array *tr)
10246fa3
SRRH
440{
441 if (tr->trace_buffer.buffer)
442 ring_buffer_record_on(tr->trace_buffer.buffer);
443 /*
444 * This flag is looked at when buffers haven't been allocated
445 * yet, or by some tracers (like irqsoff), that just want to
446 * know if the ring buffer has been disabled, but it can handle
447 * races of where it gets disabled but we still do a record.
448 * As the check is in the fast path of the tracers, it is more
449 * important to be fast than accurate.
450 */
451 tr->buffer_disabled = 0;
452 /* Make the flag seen by readers */
453 smp_wmb();
454}
455
499e5470
SR
456/**
457 * tracing_on - enable tracing buffers
458 *
459 * This function enables tracing buffers that may have been
460 * disabled with tracing_off.
461 */
462void tracing_on(void)
463{
10246fa3 464 tracer_tracing_on(&global_trace);
499e5470
SR
465}
466EXPORT_SYMBOL_GPL(tracing_on);
467
09ae7234
SRRH
468/**
469 * __trace_puts - write a constant string into the trace buffer.
470 * @ip: The address of the caller
471 * @str: The constant string to write
472 * @size: The size of the string.
473 */
474int __trace_puts(unsigned long ip, const char *str, int size)
475{
476 struct ring_buffer_event *event;
477 struct ring_buffer *buffer;
478 struct print_entry *entry;
479 unsigned long irq_flags;
480 int alloc;
8abfb872
J
481 int pc;
482
f0160a5a
J
483 if (!(trace_flags & TRACE_ITER_PRINTK))
484 return 0;
485
8abfb872 486 pc = preempt_count();
09ae7234 487
3132e107
SRRH
488 if (unlikely(tracing_selftest_running || tracing_disabled))
489 return 0;
490
09ae7234
SRRH
491 alloc = sizeof(*entry) + size + 2; /* possible \n added */
492
493 local_save_flags(irq_flags);
494 buffer = global_trace.trace_buffer.buffer;
495 event = trace_buffer_lock_reserve(buffer, TRACE_PRINT, alloc,
8abfb872 496 irq_flags, pc);
09ae7234
SRRH
497 if (!event)
498 return 0;
499
500 entry = ring_buffer_event_data(event);
501 entry->ip = ip;
502
503 memcpy(&entry->buf, str, size);
504
505 /* Add a newline if necessary */
506 if (entry->buf[size - 1] != '\n') {
507 entry->buf[size] = '\n';
508 entry->buf[size + 1] = '\0';
509 } else
510 entry->buf[size] = '\0';
511
512 __buffer_unlock_commit(buffer, event);
8abfb872 513 ftrace_trace_stack(buffer, irq_flags, 4, pc);
09ae7234
SRRH
514
515 return size;
516}
517EXPORT_SYMBOL_GPL(__trace_puts);
518
519/**
520 * __trace_bputs - write the pointer to a constant string into trace buffer
521 * @ip: The address of the caller
522 * @str: The constant string to write to the buffer to
523 */
524int __trace_bputs(unsigned long ip, const char *str)
525{
526 struct ring_buffer_event *event;
527 struct ring_buffer *buffer;
528 struct bputs_entry *entry;
529 unsigned long irq_flags;
530 int size = sizeof(struct bputs_entry);
8abfb872
J
531 int pc;
532
f0160a5a
J
533 if (!(trace_flags & TRACE_ITER_PRINTK))
534 return 0;
535
8abfb872 536 pc = preempt_count();
09ae7234 537
3132e107
SRRH
538 if (unlikely(tracing_selftest_running || tracing_disabled))
539 return 0;
540
09ae7234
SRRH
541 local_save_flags(irq_flags);
542 buffer = global_trace.trace_buffer.buffer;
543 event = trace_buffer_lock_reserve(buffer, TRACE_BPUTS, size,
8abfb872 544 irq_flags, pc);
09ae7234
SRRH
545 if (!event)
546 return 0;
547
548 entry = ring_buffer_event_data(event);
549 entry->ip = ip;
550 entry->str = str;
551
552 __buffer_unlock_commit(buffer, event);
8abfb872 553 ftrace_trace_stack(buffer, irq_flags, 4, pc);
09ae7234
SRRH
554
555 return 1;
556}
557EXPORT_SYMBOL_GPL(__trace_bputs);
558
ad909e21
SRRH
559#ifdef CONFIG_TRACER_SNAPSHOT
560/**
561 * tracing_snapshot - take a snapshot of the current buffer.
562 *
563 * This causes a swap between the snapshot buffer and the current live
564 * tracing buffer. You can use this to take snapshots of the live
565 * trace when some condition is triggered, but continue to trace.
566 *
567 * Note, make sure to allocate the snapshot with either
568 * a tracing_snapshot_alloc(), or by doing it manually
569 * with: echo 1 > /sys/kernel/debug/tracing/snapshot
570 *
571 * If the snapshot buffer is not allocated, it will stop tracing.
572 * Basically making a permanent snapshot.
573 */
574void tracing_snapshot(void)
575{
576 struct trace_array *tr = &global_trace;
577 struct tracer *tracer = tr->current_trace;
578 unsigned long flags;
579
1b22e382
SRRH
580 if (in_nmi()) {
581 internal_trace_puts("*** SNAPSHOT CALLED FROM NMI CONTEXT ***\n");
582 internal_trace_puts("*** snapshot is being ignored ***\n");
583 return;
584 }
585
ad909e21 586 if (!tr->allocated_snapshot) {
ca268da6
SRRH
587 internal_trace_puts("*** SNAPSHOT NOT ALLOCATED ***\n");
588 internal_trace_puts("*** stopping trace here! ***\n");
ad909e21
SRRH
589 tracing_off();
590 return;
591 }
592
593 /* Note, snapshot can not be used when the tracer uses it */
594 if (tracer->use_max_tr) {
ca268da6
SRRH
595 internal_trace_puts("*** LATENCY TRACER ACTIVE ***\n");
596 internal_trace_puts("*** Can not use snapshot (sorry) ***\n");
ad909e21
SRRH
597 return;
598 }
599
600 local_irq_save(flags);
601 update_max_tr(tr, current, smp_processor_id());
602 local_irq_restore(flags);
603}
1b22e382 604EXPORT_SYMBOL_GPL(tracing_snapshot);
ad909e21
SRRH
605
606static int resize_buffer_duplicate_size(struct trace_buffer *trace_buf,
607 struct trace_buffer *size_buf, int cpu_id);
3209cff4
SRRH
608static void set_buffer_entries(struct trace_buffer *buf, unsigned long val);
609
610static int alloc_snapshot(struct trace_array *tr)
611{
612 int ret;
613
614 if (!tr->allocated_snapshot) {
615
616 /* allocate spare buffer */
617 ret = resize_buffer_duplicate_size(&tr->max_buffer,
618 &tr->trace_buffer, RING_BUFFER_ALL_CPUS);
619 if (ret < 0)
620 return ret;
621
622 tr->allocated_snapshot = true;
623 }
624
625 return 0;
626}
627
ad1438a0 628static void free_snapshot(struct trace_array *tr)
3209cff4
SRRH
629{
630 /*
631 * We don't free the ring buffer. instead, resize it because
632 * The max_tr ring buffer has some state (e.g. ring->clock) and
633 * we want preserve it.
634 */
635 ring_buffer_resize(tr->max_buffer.buffer, 1, RING_BUFFER_ALL_CPUS);
636 set_buffer_entries(&tr->max_buffer, 1);
637 tracing_reset_online_cpus(&tr->max_buffer);
638 tr->allocated_snapshot = false;
639}
ad909e21 640
93e31ffb
TZ
641/**
642 * tracing_alloc_snapshot - allocate snapshot buffer.
643 *
644 * This only allocates the snapshot buffer if it isn't already
645 * allocated - it doesn't also take a snapshot.
646 *
647 * This is meant to be used in cases where the snapshot buffer needs
648 * to be set up for events that can't sleep but need to be able to
649 * trigger a snapshot.
650 */
651int tracing_alloc_snapshot(void)
652{
653 struct trace_array *tr = &global_trace;
654 int ret;
655
656 ret = alloc_snapshot(tr);
657 WARN_ON(ret < 0);
658
659 return ret;
660}
661EXPORT_SYMBOL_GPL(tracing_alloc_snapshot);
662
ad909e21
SRRH
663/**
664 * tracing_snapshot_alloc - allocate and take a snapshot of the current buffer.
665 *
666 * This is similar to tracing_snapshot(), but it will allocate the
667 * snapshot buffer if it isn't already allocated. Use this only
668 * where it is safe to sleep, as the allocation may sleep.
669 *
670 * This causes a swap between the snapshot buffer and the current live
671 * tracing buffer. You can use this to take snapshots of the live
672 * trace when some condition is triggered, but continue to trace.
673 */
void tracing_snapshot_alloc(void)
{
	/* No snapshot is taken when the buffer could not be allocated */
	if (tracing_alloc_snapshot() < 0)
		return;

	tracing_snapshot();
}
1b22e382 684EXPORT_SYMBOL_GPL(tracing_snapshot_alloc);
ad909e21
SRRH
685#else
/* !CONFIG_TRACER_SNAPSHOT stub: only emits a one-time warning. */
void tracing_snapshot(void)
{
	WARN_ONCE(1, "Snapshot feature not enabled, but internal snapshot used");
}
1b22e382 690EXPORT_SYMBOL_GPL(tracing_snapshot);
93e31ffb
TZ
691int tracing_alloc_snapshot(void)
692{
693 WARN_ONCE(1, "Snapshot feature not enabled, but snapshot allocation used");
694 return -ENODEV;
695}
696EXPORT_SYMBOL_GPL(tracing_alloc_snapshot);
ad909e21
SRRH
/* !CONFIG_TRACER_SNAPSHOT stub. */
void tracing_snapshot_alloc(void)
{
	/* The tracing_snapshot() stub issues the warning */
	tracing_snapshot();
}
1b22e382 702EXPORT_SYMBOL_GPL(tracing_snapshot_alloc);
ad909e21
SRRH
703#endif /* CONFIG_TRACER_SNAPSHOT */
704
5280bcef 705static void tracer_tracing_off(struct trace_array *tr)
10246fa3
SRRH
706{
707 if (tr->trace_buffer.buffer)
708 ring_buffer_record_off(tr->trace_buffer.buffer);
709 /*
710 * This flag is looked at when buffers haven't been allocated
711 * yet, or by some tracers (like irqsoff), that just want to
712 * know if the ring buffer has been disabled, but it can handle
713 * races of where it gets disabled but we still do a record.
714 * As the check is in the fast path of the tracers, it is more
715 * important to be fast than accurate.
716 */
717 tr->buffer_disabled = 1;
718 /* Make the flag seen by readers */
719 smp_wmb();
720}
721
499e5470
SR
722/**
723 * tracing_off - turn off tracing buffers
724 *
725 * This function stops the tracing buffers from recording data.
726 * It does not disable any overhead the tracers themselves may
727 * be causing. This function simply causes all recording to
728 * the ring buffers to fail.
729 */
730void tracing_off(void)
731{
10246fa3 732 tracer_tracing_off(&global_trace);
499e5470
SR
733}
734EXPORT_SYMBOL_GPL(tracing_off);
735
de7edd31
SRRH
736void disable_trace_on_warning(void)
737{
738 if (__disable_trace_on_warning)
739 tracing_off();
740}
741
10246fa3
SRRH
742/**
743 * tracer_tracing_is_on - show real state of ring buffer enabled
744 * @tr : the trace array to know if ring buffer is enabled
745 *
746 * Shows real state of the ring buffer if it is enabled or not.
747 */
5280bcef 748static int tracer_tracing_is_on(struct trace_array *tr)
10246fa3
SRRH
749{
750 if (tr->trace_buffer.buffer)
751 return ring_buffer_record_is_on(tr->trace_buffer.buffer);
752 return !tr->buffer_disabled;
753}
754
499e5470
SR
755/**
756 * tracing_is_on - show state of ring buffers enabled
757 */
758int tracing_is_on(void)
759{
10246fa3 760 return tracer_tracing_is_on(&global_trace);
499e5470
SR
761}
762EXPORT_SYMBOL_GPL(tracing_is_on);
763
3928a8a2 764static int __init set_buf_size(char *str)
bc0c38d1 765{
3928a8a2 766 unsigned long buf_size;
c6caeeb1 767
bc0c38d1
SR
768 if (!str)
769 return 0;
9d612bef 770 buf_size = memparse(str, &str);
c6caeeb1 771 /* nr_entries can not be zero */
9d612bef 772 if (buf_size == 0)
c6caeeb1 773 return 0;
3928a8a2 774 trace_buf_size = buf_size;
bc0c38d1
SR
775 return 1;
776}
3928a8a2 777__setup("trace_buf_size=", set_buf_size);
bc0c38d1 778
0e950173
TB
779static int __init set_tracing_thresh(char *str)
780{
87abb3b1 781 unsigned long threshold;
0e950173
TB
782 int ret;
783
784 if (!str)
785 return 0;
bcd83ea6 786 ret = kstrtoul(str, 0, &threshold);
0e950173
TB
787 if (ret < 0)
788 return 0;
87abb3b1 789 tracing_thresh = threshold * 1000;
0e950173
TB
790 return 1;
791}
792__setup("tracing_thresh=", set_tracing_thresh);
793
57f50be1
SR
/* Convert nanoseconds to microseconds, truncating any remainder. */
unsigned long nsecs_to_usecs(unsigned long nsecs)
{
	const unsigned long nsecs_per_usec = 1000;

	return nsecs / nsecs_per_usec;
}
798
4fcdae83 799/* These must match the bit positions in trace_iterator_flags */
bc0c38d1
SR
/*
 * Names of the trace options. The entries are positional, so new names
 * must not be inserted in the middle without updating the matching flag
 * bits as well.
 */
800static const char *trace_options[] = {
801 "print-parent",
802 "sym-offset",
803 "sym-addr",
804 "verbose",
f9896bf3 805 "raw",
5e3ca0ec 806 "hex",
cb0f12aa 807 "bin",
2a2cc8f7 808 "block",
86387f7e 809 "stacktrace",
5e1607a0 810 "trace_printk",
b2a866f9 811 "ftrace_preempt",
9f029e83 812 "branch",
12ef7d44 813 "annotate",
02b67518 814 "userstacktrace",
b54d3de9 815 "sym-userobj",
66896a85 816 "printk-msg-only",
c4a8e8be 817 "context-info",
c032ef64 818 "latency-format",
be6f164a 819 "sleep-time",
a2a16d6a 820 "graph-time",
e870e9a1 821 "record-cmd",
750912fa 822 "overwrite",
cf30cf67 823 "disable_on_free",
77271ce4 824 "irq-info",
5224c3a3 825 "markers",
328df475 826 "function-trace",
bc0c38d1
SR
/* NULL marks the end of the list */
827 NULL
828};
829
5079f326
Z
/*
 * Table of selectable trace clocks: the function that reads the clock,
 * the name it is known by, and whether it counts in nanoseconds.
 * ARCH_TRACE_CLOCKS appends entries defined outside this file.
 */
830static struct {
831 u64 (*func)(void);
832 const char *name;
8be0709f 833 int in_ns; /* is this clock in nanoseconds? */
5079f326 834} trace_clocks[] = {
1b3e5c09
TG
835 { trace_clock_local, "local", 1 },
836 { trace_clock_global, "global", 1 },
837 { trace_clock_counter, "counter", 0 },
e7fda6c4 838 { trace_clock_jiffies, "uptime", 0 },
1b3e5c09
TG
839 { trace_clock, "perf", 1 },
840 { ktime_get_mono_fast_ns, "mono", 1 },
8cbd9cc6 841 ARCH_TRACE_CLOCKS
5079f326
Z
842};
843
b63f39ea 844/*
845 * trace_parser_get_init - gets the buffer for trace parser
846 */
847int trace_parser_get_init(struct trace_parser *parser, int size)
848{
849 memset(parser, 0, sizeof(*parser));
850
851 parser->buffer = kmalloc(size, GFP_KERNEL);
852 if (!parser->buffer)
853 return 1;
854
855 parser->size = size;
856 return 0;
857}
858
859/*
860 * trace_parser_put - frees the buffer for trace parser
861 */
862void trace_parser_put(struct trace_parser *parser)
863{
864 kfree(parser->buffer);
865}
866
867/*
868 * trace_get_user - reads the user input string separated by space
869 * (matched by isspace(ch))
870 *
871 * For each string found the 'struct trace_parser' is updated,
872 * and the function returns.
873 *
874 * Returns number of bytes read.
875 *
876 * See kernel/trace/trace.h for 'struct trace_parser' details.
877 */
878int trace_get_user(struct trace_parser *parser, const char __user *ubuf,
879 size_t cnt, loff_t *ppos)
880{
881 char ch;
882 size_t read = 0;
883 ssize_t ret;
884
885 if (!*ppos)
886 trace_parser_clear(parser);
887
888 ret = get_user(ch, ubuf++);
889 if (ret)
890 goto out;
891
892 read++;
893 cnt--;
894
895 /*
896 * The parser is not finished with the last write,
897 * continue reading the user input without skipping spaces.
898 */
899 if (!parser->cont) {
900 /* skip white space */
901 while (cnt && isspace(ch)) {
902 ret = get_user(ch, ubuf++);
903 if (ret)
904 goto out;
905 read++;
906 cnt--;
907 }
908
909 /* only spaces were written */
910 if (isspace(ch)) {
911 *ppos += read;
912 ret = read;
913 goto out;
914 }
915
916 parser->idx = 0;
917 }
918
919 /* read the non-space input */
920 while (cnt && !isspace(ch)) {
3c235a33 921 if (parser->idx < parser->size - 1)
b63f39ea 922 parser->buffer[parser->idx++] = ch;
923 else {
924 ret = -EINVAL;
925 goto out;
926 }
927 ret = get_user(ch, ubuf++);
928 if (ret)
929 goto out;
930 read++;
931 cnt--;
932 }
933
934 /* We either got finished input or we have to wait for another call. */
935 if (isspace(ch)) {
936 parser->buffer[parser->idx] = 0;
937 parser->cont = false;
057db848 938 } else if (parser->idx < parser->size - 1) {
b63f39ea 939 parser->cont = true;
940 parser->buffer[parser->idx++] = ch;
057db848
SR
941 } else {
942 ret = -EINVAL;
943 goto out;
b63f39ea 944 }
945
946 *ppos += read;
947 ret = read;
948
949out:
950 return ret;
951}
952
3a161d99 953/* TODO add a seq_buf_to_buffer() */
b8b94265 954static ssize_t trace_seq_to_buffer(struct trace_seq *s, void *buf, size_t cnt)
3c56819b
EGM
955{
956 int len;
3c56819b 957
5ac48378 958 if (trace_seq_used(s) <= s->seq.readpos)
3c56819b
EGM
959 return -EBUSY;
960
5ac48378 961 len = trace_seq_used(s) - s->seq.readpos;
3c56819b
EGM
962 if (cnt > len)
963 cnt = len;
3a161d99 964 memcpy(buf, s->buffer + s->seq.readpos, cnt);
3c56819b 965
3a161d99 966 s->seq.readpos += cnt;
3c56819b
EGM
967 return cnt;
968}
969
0e950173
TB
970unsigned long __read_mostly tracing_thresh;
971
5d4a9dba 972#ifdef CONFIG_TRACER_MAX_TRACE
5d4a9dba
SR
973/*
974 * Copy the new maximum trace into the separate maximum-trace
975 * structure. (this way the maximum trace is permanently saved,
976 * for later retrieval via /sys/kernel/debug/tracing/latency_trace)
977 */
978static void
979__update_max_tr(struct trace_array *tr, struct task_struct *tsk, int cpu)
980{
12883efb
SRRH
981 struct trace_buffer *trace_buf = &tr->trace_buffer;
982 struct trace_buffer *max_buf = &tr->max_buffer;
983 struct trace_array_cpu *data = per_cpu_ptr(trace_buf->data, cpu);
984 struct trace_array_cpu *max_data = per_cpu_ptr(max_buf->data, cpu);
5d4a9dba 985
12883efb
SRRH
986 max_buf->cpu = cpu;
987 max_buf->time_start = data->preempt_timestamp;
5d4a9dba 988
6d9b3fa5 989 max_data->saved_latency = tr->max_latency;
8248ac05
SR
990 max_data->critical_start = data->critical_start;
991 max_data->critical_end = data->critical_end;
5d4a9dba 992
1acaa1b2 993 memcpy(max_data->comm, tsk->comm, TASK_COMM_LEN);
8248ac05 994 max_data->pid = tsk->pid;
f17a5194
SRRH
995 /*
996 * If tsk == current, then use current_uid(), as that does not use
997 * RCU. The irq tracer can be called out of RCU scope.
998 */
999 if (tsk == current)
1000 max_data->uid = current_uid();
1001 else
1002 max_data->uid = task_uid(tsk);
1003
8248ac05
SR
1004 max_data->nice = tsk->static_prio - 20 - MAX_RT_PRIO;
1005 max_data->policy = tsk->policy;
1006 max_data->rt_priority = tsk->rt_priority;
5d4a9dba
SR
1007
1008 /* record this tasks comm */
1009 tracing_record_cmdline(tsk);
1010}
1011
4fcdae83
SR
1012/**
1013 * update_max_tr - snapshot all trace buffers from global_trace to max_tr
1014 * @tr: tracer
1015 * @tsk: the task with the latency
1016 * @cpu: The cpu that initiated the trace.
1017 *
1018 * Flip the buffers between the @tr and the max_tr and record information
1019 * about which task was the cause of this latency.
1020 */
e309b41d 1021void
bc0c38d1
SR
1022update_max_tr(struct trace_array *tr, struct task_struct *tsk, int cpu)
1023{
2721e72d 1024 struct ring_buffer *buf;
bc0c38d1 1025
2b6080f2 1026 if (tr->stop_count)
b8de7bd1
SR
1027 return;
1028
4c11d7ae 1029 WARN_ON_ONCE(!irqs_disabled());
34600f0e 1030
45ad21ca 1031 if (!tr->allocated_snapshot) {
debdd57f 1032 /* Only the nop tracer should hit this when disabling */
2b6080f2 1033 WARN_ON_ONCE(tr->current_trace != &nop_trace);
34600f0e 1034 return;
debdd57f 1035 }
34600f0e 1036
0b9b12c1 1037 arch_spin_lock(&tr->max_lock);
3928a8a2 1038
12883efb
SRRH
1039 buf = tr->trace_buffer.buffer;
1040 tr->trace_buffer.buffer = tr->max_buffer.buffer;
1041 tr->max_buffer.buffer = buf;
3928a8a2 1042
bc0c38d1 1043 __update_max_tr(tr, tsk, cpu);
0b9b12c1 1044 arch_spin_unlock(&tr->max_lock);
bc0c38d1
SR
1045}
1046
1047/**
1048 * update_max_tr_single - only copy one trace over, and reset the rest
1049 * @tr - tracer
1050 * @tsk - task with the latency
1051 * @cpu - the cpu of the buffer to copy.
4fcdae83
SR
1052 *
1053 * Flip the trace of a single CPU buffer between the @tr and the max_tr.
bc0c38d1 1054 */
e309b41d 1055void
bc0c38d1
SR
1056update_max_tr_single(struct trace_array *tr, struct task_struct *tsk, int cpu)
1057{
3928a8a2 1058 int ret;
bc0c38d1 1059
2b6080f2 1060 if (tr->stop_count)
b8de7bd1
SR
1061 return;
1062
4c11d7ae 1063 WARN_ON_ONCE(!irqs_disabled());
6c24499f 1064 if (!tr->allocated_snapshot) {
2930e04d 1065 /* Only the nop tracer should hit this when disabling */
9e8529af 1066 WARN_ON_ONCE(tr->current_trace != &nop_trace);
ef710e10 1067 return;
2930e04d 1068 }
ef710e10 1069
0b9b12c1 1070 arch_spin_lock(&tr->max_lock);
bc0c38d1 1071
12883efb 1072 ret = ring_buffer_swap_cpu(tr->max_buffer.buffer, tr->trace_buffer.buffer, cpu);
3928a8a2 1073
e8165dbb
SR
1074 if (ret == -EBUSY) {
1075 /*
1076 * We failed to swap the buffer due to a commit taking
1077 * place on this CPU. We fail to record, but we reset
1078 * the max trace buffer (no one writes directly to it)
1079 * and flag that it failed.
1080 */
12883efb 1081 trace_array_printk_buf(tr->max_buffer.buffer, _THIS_IP_,
e8165dbb
SR
1082 "Failed to swap buffers due to commit in progress\n");
1083 }
1084
e8165dbb 1085 WARN_ON_ONCE(ret && ret != -EAGAIN && ret != -EBUSY);
bc0c38d1
SR
1086
1087 __update_max_tr(tr, tsk, cpu);
0b9b12c1 1088 arch_spin_unlock(&tr->max_lock);
bc0c38d1 1089}
5d4a9dba 1090#endif /* CONFIG_TRACER_MAX_TRACE */
bc0c38d1 1091
e30f53aa 1092static int wait_on_pipe(struct trace_iterator *iter, bool full)
0d5c6e1c 1093{
15693458
SRRH
1094 /* Iterators are static, they should be filled or empty */
1095 if (trace_buffer_iter(iter, iter->cpu_file))
8b8b3683 1096 return 0;
0d5c6e1c 1097
e30f53aa
RV
1098 return ring_buffer_wait(iter->trace_buffer->buffer, iter->cpu_file,
1099 full);
0d5c6e1c
SR
1100}
1101
f4e781c0
SRRH
#ifdef CONFIG_FTRACE_STARTUP_TEST
/*
 * Run the selftest of tracer @type against the global trace array.
 *
 * Returns 0 when the tracer has no selftest, when selftests are
 * disabled, or when the selftest passed; returns -1 when it failed.
 */
static int run_tracer_selftest(struct tracer *type)
{
	struct trace_array *tr = &global_trace;
	struct tracer *prev_tracer = tr->current_trace;
	int err;

	if (tracing_selftest_disabled || !type->selftest)
		return 0;

	/*
	 * Run a selftest on this tracer.
	 * The trace buffer is reset and this tracer is made the current
	 * one, so that it can run some internal tracing to verify that
	 * everything is in order. A tracer that fails is not registered
	 * by the caller.
	 */
	tracing_reset_online_cpus(&tr->trace_buffer);

	tr->current_trace = type;

#ifdef CONFIG_TRACER_MAX_TRACE
	if (type->use_max_tr) {
		/* If we expanded the buffers, make sure the max is expanded too */
		if (ring_buffer_expanded)
			ring_buffer_resize(tr->max_buffer.buffer, trace_buf_size,
					   RING_BUFFER_ALL_CPUS);
		tr->allocated_snapshot = true;
	}
#endif

	/* the test is responsible for initializing and enabling */
	pr_info("Testing tracer %s: ", type->name);
	err = type->selftest(type, tr);

	/* the test is responsible for resetting too */
	tr->current_trace = prev_tracer;

	if (err) {
		printk(KERN_CONT "FAILED!\n");
		/* Add the warning after printing 'FAILED' */
		WARN_ON(1);
		return -1;
	}

	/* Only reset on passing, to avoid touching corrupted buffers */
	tracing_reset_online_cpus(&tr->trace_buffer);

#ifdef CONFIG_TRACER_MAX_TRACE
	if (type->use_max_tr) {
		tr->allocated_snapshot = false;

		/* Shrink the max buffer again */
		if (ring_buffer_expanded)
			ring_buffer_resize(tr->max_buffer.buffer, 1,
					   RING_BUFFER_ALL_CPUS);
	}
#endif

	printk(KERN_CONT "PASSED\n");
	return 0;
}
#else
/* Without CONFIG_FTRACE_STARTUP_TEST there is nothing to run */
static inline int run_tracer_selftest(struct tracer *type)
{
	return 0;
}
#endif /* CONFIG_FTRACE_STARTUP_TEST */
0d5c6e1c 1167
4fcdae83
SR
1168/**
1169 * register_tracer - register a tracer with the ftrace system.
1170 * @type - the plugin for the tracer
1171 *
1172 * Register a new plugin tracer.
1173 */
bc0c38d1
SR
1174int register_tracer(struct tracer *type)
1175{
1176 struct tracer *t;
bc0c38d1
SR
1177 int ret = 0;
1178
1179 if (!type->name) {
1180 pr_info("Tracer must have a name\n");
1181 return -1;
1182 }
1183
24a461d5 1184 if (strlen(type->name) >= MAX_TRACER_SIZE) {
ee6c2c1b
LZ
1185 pr_info("Tracer has a name longer than %d\n", MAX_TRACER_SIZE);
1186 return -1;
1187 }
1188
bc0c38d1 1189 mutex_lock(&trace_types_lock);
86fa2f60 1190
8e1b82e0
FW
1191 tracing_selftest_running = true;
1192
bc0c38d1
SR
1193 for (t = trace_types; t; t = t->next) {
1194 if (strcmp(type->name, t->name) == 0) {
1195 /* already found */
ee6c2c1b 1196 pr_info("Tracer %s already registered\n",
bc0c38d1
SR
1197 type->name);
1198 ret = -1;
1199 goto out;
1200 }
1201 }
1202
adf9f195
FW
1203 if (!type->set_flag)
1204 type->set_flag = &dummy_set_flag;
1205 if (!type->flags)
1206 type->flags = &dummy_tracer_flags;
1207 else
1208 if (!type->flags->opts)
1209 type->flags->opts = dummy_tracer_opt;
6eaaa5d5 1210
f4e781c0
SRRH
1211 ret = run_tracer_selftest(type);
1212 if (ret < 0)
1213 goto out;
60a11774 1214
bc0c38d1
SR
1215 type->next = trace_types;
1216 trace_types = type;
60a11774 1217
bc0c38d1 1218 out:
8e1b82e0 1219 tracing_selftest_running = false;
bc0c38d1
SR
1220 mutex_unlock(&trace_types_lock);
1221
dac74940
SR
1222 if (ret || !default_bootup_tracer)
1223 goto out_unlock;
1224
ee6c2c1b 1225 if (strncmp(default_bootup_tracer, type->name, MAX_TRACER_SIZE))
dac74940
SR
1226 goto out_unlock;
1227
1228 printk(KERN_INFO "Starting tracer '%s'\n", type->name);
1229 /* Do we want this tracer to start on bootup? */
607e2ea1 1230 tracing_set_tracer(&global_trace, type->name);
dac74940
SR
1231 default_bootup_tracer = NULL;
1232 /* disable other selftests, since this will break it. */
55034cd6 1233 tracing_selftest_disabled = true;
b2821ae6 1234#ifdef CONFIG_FTRACE_STARTUP_TEST
dac74940
SR
1235 printk(KERN_INFO "Disabling FTRACE selftests due to running tracer '%s'\n",
1236 type->name);
b2821ae6 1237#endif
b2821ae6 1238
dac74940 1239 out_unlock:
bc0c38d1
SR
1240 return ret;
1241}
1242
12883efb 1243void tracing_reset(struct trace_buffer *buf, int cpu)
f633903a 1244{
12883efb 1245 struct ring_buffer *buffer = buf->buffer;
f633903a 1246
a5416411
HT
1247 if (!buffer)
1248 return;
1249
f633903a
SR
1250 ring_buffer_record_disable(buffer);
1251
1252 /* Make sure all commits have finished */
1253 synchronize_sched();
68179686 1254 ring_buffer_reset_cpu(buffer, cpu);
f633903a
SR
1255
1256 ring_buffer_record_enable(buffer);
1257}
1258
12883efb 1259void tracing_reset_online_cpus(struct trace_buffer *buf)
213cc060 1260{
12883efb 1261 struct ring_buffer *buffer = buf->buffer;
213cc060
PE
1262 int cpu;
1263
a5416411
HT
1264 if (!buffer)
1265 return;
1266
621968cd
SR
1267 ring_buffer_record_disable(buffer);
1268
1269 /* Make sure all commits have finished */
1270 synchronize_sched();
1271
9457158b 1272 buf->time_start = buffer_ftrace_now(buf, buf->cpu);
213cc060
PE
1273
1274 for_each_online_cpu(cpu)
68179686 1275 ring_buffer_reset_cpu(buffer, cpu);
621968cd
SR
1276
1277 ring_buffer_record_enable(buffer);
213cc060
PE
1278}
1279
09d8091c 1280/* Must have trace_types_lock held */
873c642f 1281void tracing_reset_all_online_cpus(void)
9456f0fa 1282{
873c642f
SRRH
1283 struct trace_array *tr;
1284
873c642f 1285 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
12883efb
SRRH
1286 tracing_reset_online_cpus(&tr->trace_buffer);
1287#ifdef CONFIG_TRACER_MAX_TRACE
1288 tracing_reset_online_cpus(&tr->max_buffer);
1289#endif
873c642f 1290 }
9456f0fa
SR
1291}
1292
939c7a4f 1293#define SAVED_CMDLINES_DEFAULT 128
2c7eea4c 1294#define NO_CMDLINE_MAP UINT_MAX
edc35bd7 1295static arch_spinlock_t trace_cmdline_lock = __ARCH_SPIN_LOCK_UNLOCKED;
939c7a4f
YY
1296struct saved_cmdlines_buffer {
1297 unsigned map_pid_to_cmdline[PID_MAX_DEFAULT+1];
1298 unsigned *map_cmdline_to_pid;
1299 unsigned cmdline_num;
1300 int cmdline_idx;
1301 char *saved_cmdlines;
1302};
1303static struct saved_cmdlines_buffer *savedcmd;
25b0b44a 1304
25b0b44a 1305/* temporary disable recording */
4fd27358 1306static atomic_t trace_record_cmdline_disabled __read_mostly;
bc0c38d1 1307
939c7a4f
YY
1308static inline char *get_saved_cmdlines(int idx)
1309{
1310 return &savedcmd->saved_cmdlines[idx * TASK_COMM_LEN];
1311}
1312
1313static inline void set_cmdline(int idx, const char *cmdline)
bc0c38d1 1314{
939c7a4f
YY
1315 memcpy(get_saved_cmdlines(idx), cmdline, TASK_COMM_LEN);
1316}
1317
1318static int allocate_cmdlines_buffer(unsigned int val,
1319 struct saved_cmdlines_buffer *s)
1320{
1321 s->map_cmdline_to_pid = kmalloc(val * sizeof(*s->map_cmdline_to_pid),
1322 GFP_KERNEL);
1323 if (!s->map_cmdline_to_pid)
1324 return -ENOMEM;
1325
1326 s->saved_cmdlines = kmalloc(val * TASK_COMM_LEN, GFP_KERNEL);
1327 if (!s->saved_cmdlines) {
1328 kfree(s->map_cmdline_to_pid);
1329 return -ENOMEM;
1330 }
1331
1332 s->cmdline_idx = 0;
1333 s->cmdline_num = val;
1334 memset(&s->map_pid_to_cmdline, NO_CMDLINE_MAP,
1335 sizeof(s->map_pid_to_cmdline));
1336 memset(s->map_cmdline_to_pid, NO_CMDLINE_MAP,
1337 val * sizeof(*s->map_cmdline_to_pid));
1338
1339 return 0;
1340}
1341
1342static int trace_create_savedcmd(void)
1343{
1344 int ret;
1345
a6af8fbf 1346 savedcmd = kmalloc(sizeof(*savedcmd), GFP_KERNEL);
939c7a4f
YY
1347 if (!savedcmd)
1348 return -ENOMEM;
1349
1350 ret = allocate_cmdlines_buffer(SAVED_CMDLINES_DEFAULT, savedcmd);
1351 if (ret < 0) {
1352 kfree(savedcmd);
1353 savedcmd = NULL;
1354 return -ENOMEM;
1355 }
1356
1357 return 0;
bc0c38d1
SR
1358}
1359
b5130b1e
CE
1360int is_tracing_stopped(void)
1361{
2b6080f2 1362 return global_trace.stop_count;
b5130b1e
CE
1363}
1364
0f048701
SR
1365/**
1366 * tracing_start - quick start of the tracer
1367 *
1368 * If tracing is enabled but was stopped by tracing_stop,
1369 * this will start the tracer back up.
1370 */
1371void tracing_start(void)
1372{
1373 struct ring_buffer *buffer;
1374 unsigned long flags;
1375
1376 if (tracing_disabled)
1377 return;
1378
2b6080f2
SR
1379 raw_spin_lock_irqsave(&global_trace.start_lock, flags);
1380 if (--global_trace.stop_count) {
1381 if (global_trace.stop_count < 0) {
b06a8301
SR
1382 /* Someone screwed up their debugging */
1383 WARN_ON_ONCE(1);
2b6080f2 1384 global_trace.stop_count = 0;
b06a8301 1385 }
0f048701
SR
1386 goto out;
1387 }
1388
a2f80714 1389 /* Prevent the buffers from switching */
0b9b12c1 1390 arch_spin_lock(&global_trace.max_lock);
0f048701 1391
12883efb 1392 buffer = global_trace.trace_buffer.buffer;
0f048701
SR
1393 if (buffer)
1394 ring_buffer_record_enable(buffer);
1395
12883efb
SRRH
1396#ifdef CONFIG_TRACER_MAX_TRACE
1397 buffer = global_trace.max_buffer.buffer;
0f048701
SR
1398 if (buffer)
1399 ring_buffer_record_enable(buffer);
12883efb 1400#endif
0f048701 1401
0b9b12c1 1402 arch_spin_unlock(&global_trace.max_lock);
a2f80714 1403
0f048701 1404 out:
2b6080f2
SR
1405 raw_spin_unlock_irqrestore(&global_trace.start_lock, flags);
1406}
1407
1408static void tracing_start_tr(struct trace_array *tr)
1409{
1410 struct ring_buffer *buffer;
1411 unsigned long flags;
1412
1413 if (tracing_disabled)
1414 return;
1415
1416 /* If global, we need to also start the max tracer */
1417 if (tr->flags & TRACE_ARRAY_FL_GLOBAL)
1418 return tracing_start();
1419
1420 raw_spin_lock_irqsave(&tr->start_lock, flags);
1421
1422 if (--tr->stop_count) {
1423 if (tr->stop_count < 0) {
1424 /* Someone screwed up their debugging */
1425 WARN_ON_ONCE(1);
1426 tr->stop_count = 0;
1427 }
1428 goto out;
1429 }
1430
12883efb 1431 buffer = tr->trace_buffer.buffer;
2b6080f2
SR
1432 if (buffer)
1433 ring_buffer_record_enable(buffer);
1434
1435 out:
1436 raw_spin_unlock_irqrestore(&tr->start_lock, flags);
0f048701
SR
1437}
1438
1439/**
1440 * tracing_stop - quick stop of the tracer
1441 *
1442 * Light weight way to stop tracing. Use in conjunction with
1443 * tracing_start.
1444 */
1445void tracing_stop(void)
1446{
1447 struct ring_buffer *buffer;
1448 unsigned long flags;
1449
2b6080f2
SR
1450 raw_spin_lock_irqsave(&global_trace.start_lock, flags);
1451 if (global_trace.stop_count++)
0f048701
SR
1452 goto out;
1453
a2f80714 1454 /* Prevent the buffers from switching */
0b9b12c1 1455 arch_spin_lock(&global_trace.max_lock);
a2f80714 1456
12883efb 1457 buffer = global_trace.trace_buffer.buffer;
0f048701
SR
1458 if (buffer)
1459 ring_buffer_record_disable(buffer);
1460
12883efb
SRRH
1461#ifdef CONFIG_TRACER_MAX_TRACE
1462 buffer = global_trace.max_buffer.buffer;
0f048701
SR
1463 if (buffer)
1464 ring_buffer_record_disable(buffer);
12883efb 1465#endif
0f048701 1466
0b9b12c1 1467 arch_spin_unlock(&global_trace.max_lock);
a2f80714 1468
0f048701 1469 out:
2b6080f2
SR
1470 raw_spin_unlock_irqrestore(&global_trace.start_lock, flags);
1471}
1472
1473static void tracing_stop_tr(struct trace_array *tr)
1474{
1475 struct ring_buffer *buffer;
1476 unsigned long flags;
1477
1478 /* If global, we need to also stop the max tracer */
1479 if (tr->flags & TRACE_ARRAY_FL_GLOBAL)
1480 return tracing_stop();
1481
1482 raw_spin_lock_irqsave(&tr->start_lock, flags);
1483 if (tr->stop_count++)
1484 goto out;
1485
12883efb 1486 buffer = tr->trace_buffer.buffer;
2b6080f2
SR
1487 if (buffer)
1488 ring_buffer_record_disable(buffer);
1489
1490 out:
1491 raw_spin_unlock_irqrestore(&tr->start_lock, flags);
0f048701
SR
1492}
1493
e309b41d 1494void trace_stop_cmdline_recording(void);
bc0c38d1 1495
379cfdac 1496static int trace_save_cmdline(struct task_struct *tsk)
bc0c38d1 1497{
a635cf04 1498 unsigned pid, idx;
bc0c38d1
SR
1499
1500 if (!tsk->pid || unlikely(tsk->pid > PID_MAX_DEFAULT))
379cfdac 1501 return 0;
bc0c38d1
SR
1502
1503 /*
1504 * It's not the end of the world if we don't get
1505 * the lock, but we also don't want to spin
1506 * nor do we want to disable interrupts,
1507 * so if we miss here, then better luck next time.
1508 */
0199c4e6 1509 if (!arch_spin_trylock(&trace_cmdline_lock))
379cfdac 1510 return 0;
bc0c38d1 1511
939c7a4f 1512 idx = savedcmd->map_pid_to_cmdline[tsk->pid];
2c7eea4c 1513 if (idx == NO_CMDLINE_MAP) {
939c7a4f 1514 idx = (savedcmd->cmdline_idx + 1) % savedcmd->cmdline_num;
bc0c38d1 1515
a635cf04
CE
1516 /*
1517 * Check whether the cmdline buffer at idx has a pid
1518 * mapped. We are going to overwrite that entry so we
1519 * need to clear the map_pid_to_cmdline. Otherwise we
1520 * would read the new comm for the old pid.
1521 */
939c7a4f 1522 pid = savedcmd->map_cmdline_to_pid[idx];
a635cf04 1523 if (pid != NO_CMDLINE_MAP)
939c7a4f 1524 savedcmd->map_pid_to_cmdline[pid] = NO_CMDLINE_MAP;
bc0c38d1 1525
939c7a4f
YY
1526 savedcmd->map_cmdline_to_pid[idx] = tsk->pid;
1527 savedcmd->map_pid_to_cmdline[tsk->pid] = idx;
bc0c38d1 1528
939c7a4f 1529 savedcmd->cmdline_idx = idx;
bc0c38d1
SR
1530 }
1531
939c7a4f 1532 set_cmdline(idx, tsk->comm);
bc0c38d1 1533
0199c4e6 1534 arch_spin_unlock(&trace_cmdline_lock);
379cfdac
SRRH
1535
1536 return 1;
bc0c38d1
SR
1537}
1538
4c27e756 1539static void __trace_find_cmdline(int pid, char comm[])
bc0c38d1 1540{
bc0c38d1
SR
1541 unsigned map;
1542
4ca53085
SR
1543 if (!pid) {
1544 strcpy(comm, "<idle>");
1545 return;
1546 }
bc0c38d1 1547
74bf4076
SR
1548 if (WARN_ON_ONCE(pid < 0)) {
1549 strcpy(comm, "<XXX>");
1550 return;
1551 }
1552
4ca53085
SR
1553 if (pid > PID_MAX_DEFAULT) {
1554 strcpy(comm, "<...>");
1555 return;
1556 }
bc0c38d1 1557
939c7a4f 1558 map = savedcmd->map_pid_to_cmdline[pid];
50d88758 1559 if (map != NO_CMDLINE_MAP)
939c7a4f 1560 strcpy(comm, get_saved_cmdlines(map));
50d88758
TG
1561 else
1562 strcpy(comm, "<...>");
4c27e756
SRRH
1563}
1564
1565void trace_find_cmdline(int pid, char comm[])
1566{
1567 preempt_disable();
1568 arch_spin_lock(&trace_cmdline_lock);
1569
1570 __trace_find_cmdline(pid, comm);
bc0c38d1 1571
0199c4e6 1572 arch_spin_unlock(&trace_cmdline_lock);
5b6045a9 1573 preempt_enable();
bc0c38d1
SR
1574}
1575
e309b41d 1576void tracing_record_cmdline(struct task_struct *tsk)
bc0c38d1 1577{
0fb9656d 1578 if (atomic_read(&trace_record_cmdline_disabled) || !tracing_is_on())
bc0c38d1
SR
1579 return;
1580
7ffbd48d
SR
1581 if (!__this_cpu_read(trace_cmdline_save))
1582 return;
1583
379cfdac
SRRH
1584 if (trace_save_cmdline(tsk))
1585 __this_cpu_write(trace_cmdline_save, false);
bc0c38d1
SR
1586}
1587
45dcd8b8 1588void
38697053
SR
1589tracing_generic_entry_update(struct trace_entry *entry, unsigned long flags,
1590 int pc)
bc0c38d1
SR
1591{
1592 struct task_struct *tsk = current;
bc0c38d1 1593
777e208d
SR
1594 entry->preempt_count = pc & 0xff;
1595 entry->pid = (tsk) ? tsk->pid : 0;
1596 entry->flags =
9244489a 1597#ifdef CONFIG_TRACE_IRQFLAGS_SUPPORT
2e2ca155 1598 (irqs_disabled_flags(flags) ? TRACE_FLAG_IRQS_OFF : 0) |
9244489a
SR
1599#else
1600 TRACE_FLAG_IRQS_NOSUPPORT |
1601#endif
bc0c38d1
SR
1602 ((pc & HARDIRQ_MASK) ? TRACE_FLAG_HARDIRQ : 0) |
1603 ((pc & SOFTIRQ_MASK) ? TRACE_FLAG_SOFTIRQ : 0) |
e5137b50
PZ
1604 (tif_need_resched() ? TRACE_FLAG_NEED_RESCHED : 0) |
1605 (test_preempt_need_resched() ? TRACE_FLAG_PREEMPT_RESCHED : 0);
bc0c38d1 1606}
f413cdb8 1607EXPORT_SYMBOL_GPL(tracing_generic_entry_update);
bc0c38d1 1608
e77405ad
SR
1609struct ring_buffer_event *
1610trace_buffer_lock_reserve(struct ring_buffer *buffer,
1611 int type,
1612 unsigned long len,
1613 unsigned long flags, int pc)
51a763dd
ACM
1614{
1615 struct ring_buffer_event *event;
1616
e77405ad 1617 event = ring_buffer_lock_reserve(buffer, len);
51a763dd
ACM
1618 if (event != NULL) {
1619 struct trace_entry *ent = ring_buffer_event_data(event);
1620
1621 tracing_generic_entry_update(ent, flags, pc);
1622 ent->type = type;
1623 }
1624
1625 return event;
1626}
51a763dd 1627
7ffbd48d
SR
1628void
1629__buffer_unlock_commit(struct ring_buffer *buffer, struct ring_buffer_event *event)
1630{
1631 __this_cpu_write(trace_cmdline_save, true);
1632 ring_buffer_unlock_commit(buffer, event);
1633}
1634
e77405ad
SR
/*
 * Commit @event to @buffer, then let the kernel and user stack tracers
 * add their entries. The kernel stack trace is asked to skip 6 frames.
 */
static inline void
__trace_buffer_unlock_commit(struct ring_buffer *buffer,
			     struct ring_buffer_event *event,
			     unsigned long flags, int pc)
{
	__buffer_unlock_commit(buffer, event);

	ftrace_trace_stack(buffer, flags, 6, pc);
	ftrace_trace_userstack(buffer, flags, pc);
}
1645
e77405ad
SR
/* Exported wrapper around __trace_buffer_unlock_commit() */
void trace_buffer_unlock_commit(struct ring_buffer *buffer,
				struct ring_buffer_event *event,
				unsigned long flags, int pc)
{
	__trace_buffer_unlock_commit(buffer, event, flags, pc);
}
EXPORT_SYMBOL_GPL(trace_buffer_unlock_commit);
51a763dd 1653
2c4a33ab
SRRH
1654static struct ring_buffer *temp_buffer;
1655
ccb469a1
SR
1656struct ring_buffer_event *
1657trace_event_buffer_lock_reserve(struct ring_buffer **current_rb,
1658 struct ftrace_event_file *ftrace_file,
1659 int type, unsigned long len,
1660 unsigned long flags, int pc)
1661{
2c4a33ab
SRRH
1662 struct ring_buffer_event *entry;
1663
12883efb 1664 *current_rb = ftrace_file->tr->trace_buffer.buffer;
2c4a33ab 1665 entry = trace_buffer_lock_reserve(*current_rb,
ccb469a1 1666 type, len, flags, pc);
2c4a33ab
SRRH
1667 /*
1668 * If tracing is off, but we have triggers enabled
1669 * we still need to look at the event data. Use the temp_buffer
1670 * to store the trace event for the tigger to use. It's recusive
1671 * safe and will not be recorded anywhere.
1672 */
1673 if (!entry && ftrace_file->flags & FTRACE_EVENT_FL_TRIGGER_COND) {
1674 *current_rb = temp_buffer;
1675 entry = trace_buffer_lock_reserve(*current_rb,
1676 type, len, flags, pc);
1677 }
1678 return entry;
ccb469a1
SR
1679}
1680EXPORT_SYMBOL_GPL(trace_event_buffer_lock_reserve);
1681
ef5580d0 1682struct ring_buffer_event *
e77405ad
SR
1683trace_current_buffer_lock_reserve(struct ring_buffer **current_rb,
1684 int type, unsigned long len,
ef5580d0
SR
1685 unsigned long flags, int pc)
1686{
12883efb 1687 *current_rb = global_trace.trace_buffer.buffer;
e77405ad 1688 return trace_buffer_lock_reserve(*current_rb,
ef5580d0
SR
1689 type, len, flags, pc);
1690}
94487d6d 1691EXPORT_SYMBOL_GPL(trace_current_buffer_lock_reserve);
ef5580d0 1692
e77405ad
SR
/* Exported wrapper around __trace_buffer_unlock_commit() */
void trace_current_buffer_unlock_commit(struct ring_buffer *buffer,
					struct ring_buffer_event *event,
					unsigned long flags, int pc)
{
	__trace_buffer_unlock_commit(buffer, event, flags, pc);
}
EXPORT_SYMBOL_GPL(trace_current_buffer_unlock_commit);
07edf712 1700
0d5c6e1c
SR
/*
 * Commit @event to @buffer, then add a kernel stack trace taken from
 * @regs (skipping no frames) and a user stack trace.
 */
void trace_buffer_unlock_commit_regs(struct ring_buffer *buffer,
				     struct ring_buffer_event *event,
				     unsigned long flags, int pc,
				     struct pt_regs *regs)
{
	__buffer_unlock_commit(buffer, event);

	ftrace_trace_stack_regs(buffer, flags, 0, pc, regs);
	ftrace_trace_userstack(buffer, flags, pc);
}
EXPORT_SYMBOL_GPL(trace_buffer_unlock_commit_regs);
1fd8df2c 1712
e77405ad
SR
/* Exported wrapper around ring_buffer_discard_commit() */
void trace_current_buffer_discard_commit(struct ring_buffer *buffer,
					 struct ring_buffer_event *event)
{
	ring_buffer_discard_commit(buffer, event);
}
EXPORT_SYMBOL_GPL(trace_current_buffer_discard_commit);
ef5580d0 1719
e309b41d 1720void
7be42151 1721trace_function(struct trace_array *tr,
38697053
SR
1722 unsigned long ip, unsigned long parent_ip, unsigned long flags,
1723 int pc)
bc0c38d1 1724{
e1112b4d 1725 struct ftrace_event_call *call = &event_function;
12883efb 1726 struct ring_buffer *buffer = tr->trace_buffer.buffer;
3928a8a2 1727 struct ring_buffer_event *event;
777e208d 1728 struct ftrace_entry *entry;
bc0c38d1 1729
d769041f 1730 /* If we are reading the ring buffer, don't trace */
dd17c8f7 1731 if (unlikely(__this_cpu_read(ftrace_cpu_disabled)))
d769041f
SR
1732 return;
1733
e77405ad 1734 event = trace_buffer_lock_reserve(buffer, TRACE_FN, sizeof(*entry),
51a763dd 1735 flags, pc);
3928a8a2
SR
1736 if (!event)
1737 return;
1738 entry = ring_buffer_event_data(event);
777e208d
SR
1739 entry->ip = ip;
1740 entry->parent_ip = parent_ip;
e1112b4d 1741
f306cc82 1742 if (!call_filter_check_discard(call, entry, buffer, event))
7ffbd48d 1743 __buffer_unlock_commit(buffer, event);
bc0c38d1
SR
1744}
1745
c0a0d0d3 1746#ifdef CONFIG_STACKTRACE
4a9bd3f1
SR
1747
1748#define FTRACE_STACK_MAX_ENTRIES (PAGE_SIZE / sizeof(unsigned long))
1749struct ftrace_stack {
1750 unsigned long calls[FTRACE_STACK_MAX_ENTRIES];
1751};
1752
1753static DEFINE_PER_CPU(struct ftrace_stack, ftrace_stack);
1754static DEFINE_PER_CPU(int, ftrace_stack_reserve);
1755
e77405ad 1756static void __ftrace_trace_stack(struct ring_buffer *buffer,
53614991 1757 unsigned long flags,
1fd8df2c 1758 int skip, int pc, struct pt_regs *regs)
86387f7e 1759{
e1112b4d 1760 struct ftrace_event_call *call = &event_kernel_stack;
3928a8a2 1761 struct ring_buffer_event *event;
777e208d 1762 struct stack_entry *entry;
86387f7e 1763 struct stack_trace trace;
4a9bd3f1
SR
1764 int use_stack;
1765 int size = FTRACE_STACK_ENTRIES;
1766
1767 trace.nr_entries = 0;
1768 trace.skip = skip;
1769
1770 /*
1771 * Since events can happen in NMIs there's no safe way to
1772 * use the per cpu ftrace_stacks. We reserve it and if an interrupt
1773 * or NMI comes in, it will just have to use the default
1774 * FTRACE_STACK_SIZE.
1775 */
1776 preempt_disable_notrace();
1777
82146529 1778 use_stack = __this_cpu_inc_return(ftrace_stack_reserve);
4a9bd3f1
SR
1779 /*
1780 * We don't need any atomic variables, just a barrier.
1781 * If an interrupt comes in, we don't care, because it would
1782 * have exited and put the counter back to what we want.
1783 * We just need a barrier to keep gcc from moving things
1784 * around.
1785 */
1786 barrier();
1787 if (use_stack == 1) {
bdffd893 1788 trace.entries = this_cpu_ptr(ftrace_stack.calls);
4a9bd3f1
SR
1789 trace.max_entries = FTRACE_STACK_MAX_ENTRIES;
1790
1791 if (regs)
1792 save_stack_trace_regs(regs, &trace);
1793 else
1794 save_stack_trace(&trace);
1795
1796 if (trace.nr_entries > size)
1797 size = trace.nr_entries;
1798 } else
1799 /* From now on, use_stack is a boolean */
1800 use_stack = 0;
1801
1802 size *= sizeof(unsigned long);
86387f7e 1803
e77405ad 1804 event = trace_buffer_lock_reserve(buffer, TRACE_STACK,
4a9bd3f1 1805 sizeof(*entry) + size, flags, pc);
3928a8a2 1806 if (!event)
4a9bd3f1
SR
1807 goto out;
1808 entry = ring_buffer_event_data(event);
86387f7e 1809
4a9bd3f1
SR
1810 memset(&entry->caller, 0, size);
1811
1812 if (use_stack)
1813 memcpy(&entry->caller, trace.entries,
1814 trace.nr_entries * sizeof(unsigned long));
1815 else {
1816 trace.max_entries = FTRACE_STACK_ENTRIES;
1817 trace.entries = entry->caller;
1818 if (regs)
1819 save_stack_trace_regs(regs, &trace);
1820 else
1821 save_stack_trace(&trace);
1822 }
1823
1824 entry->size = trace.nr_entries;
86387f7e 1825
f306cc82 1826 if (!call_filter_check_discard(call, entry, buffer, event))
7ffbd48d 1827 __buffer_unlock_commit(buffer, event);
4a9bd3f1
SR
1828
1829 out:
1830 /* Again, don't let gcc optimize things here */
1831 barrier();
82146529 1832 __this_cpu_dec(ftrace_stack_reserve);
4a9bd3f1
SR
1833 preempt_enable_notrace();
1834
f0a920d5
IM
1835}
1836
1fd8df2c
MH
1837void ftrace_trace_stack_regs(struct ring_buffer *buffer, unsigned long flags,
1838 int skip, int pc, struct pt_regs *regs)
1839{
1840 if (!(trace_flags & TRACE_ITER_STACKTRACE))
1841 return;
1842
1843 __ftrace_trace_stack(buffer, flags, skip, pc, regs);
1844}
1845
e77405ad
SR
1846void ftrace_trace_stack(struct ring_buffer *buffer, unsigned long flags,
1847 int skip, int pc)
53614991
SR
1848{
1849 if (!(trace_flags & TRACE_ITER_STACKTRACE))
1850 return;
1851
1fd8df2c 1852 __ftrace_trace_stack(buffer, flags, skip, pc, NULL);
53614991
SR
1853}
1854
c0a0d0d3
FW
1855void __trace_stack(struct trace_array *tr, unsigned long flags, int skip,
1856 int pc)
38697053 1857{
12883efb 1858 __ftrace_trace_stack(tr->trace_buffer.buffer, flags, skip, pc, NULL);
38697053
SR
1859}
1860
03889384
SR
1861/**
1862 * trace_dump_stack - record a stack back trace in the trace buffer
c142be8e 1863 * @skip: Number of functions to skip (helper handlers)
03889384 1864 */
c142be8e 1865void trace_dump_stack(int skip)
03889384
SR
1866{
1867 unsigned long flags;
1868
1869 if (tracing_disabled || tracing_selftest_running)
e36c5458 1870 return;
03889384
SR
1871
1872 local_save_flags(flags);
1873
c142be8e
SRRH
1874 /*
1875 * Skip 3 more, seems to get us at the caller of
1876 * this function.
1877 */
1878 skip += 3;
1879 __ftrace_trace_stack(global_trace.trace_buffer.buffer,
1880 flags, skip, preempt_count(), NULL);
03889384
SR
1881}
1882
91e86e56
SR
1883static DEFINE_PER_CPU(int, user_stack_count);
1884
e77405ad
SR
1885void
1886ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc)
02b67518 1887{
e1112b4d 1888 struct ftrace_event_call *call = &event_user_stack;
8d7c6a96 1889 struct ring_buffer_event *event;
02b67518
TE
1890 struct userstack_entry *entry;
1891 struct stack_trace trace;
02b67518
TE
1892
1893 if (!(trace_flags & TRACE_ITER_USERSTACKTRACE))
1894 return;
1895
b6345879
SR
1896 /*
1897 * NMIs can not handle page faults, even with fix ups.
1898 * The save user stack can (and often does) fault.
1899 */
1900 if (unlikely(in_nmi()))
1901 return;
02b67518 1902
91e86e56
SR
1903 /*
1904 * prevent recursion, since the user stack tracing may
1905 * trigger other kernel events.
1906 */
1907 preempt_disable();
1908 if (__this_cpu_read(user_stack_count))
1909 goto out;
1910
1911 __this_cpu_inc(user_stack_count);
1912
e77405ad 1913 event = trace_buffer_lock_reserve(buffer, TRACE_USER_STACK,
51a763dd 1914 sizeof(*entry), flags, pc);
02b67518 1915 if (!event)
1dbd1951 1916 goto out_drop_count;
02b67518 1917 entry = ring_buffer_event_data(event);
02b67518 1918
48659d31 1919 entry->tgid = current->tgid;
02b67518
TE
1920 memset(&entry->caller, 0, sizeof(entry->caller));
1921
1922 trace.nr_entries = 0;
1923 trace.max_entries = FTRACE_STACK_ENTRIES;
1924 trace.skip = 0;
1925 trace.entries = entry->caller;
1926
1927 save_stack_trace_user(&trace);
f306cc82 1928 if (!call_filter_check_discard(call, entry, buffer, event))
7ffbd48d 1929 __buffer_unlock_commit(buffer, event);
91e86e56 1930
1dbd1951 1931 out_drop_count:
91e86e56 1932 __this_cpu_dec(user_stack_count);
91e86e56
SR
1933 out:
1934 preempt_enable();
02b67518
TE
1935}
1936
4fd27358
HE
#ifdef UNUSED
/*
 * Record a user space stack trace on the trace buffer of @tr.
 *
 * ftrace_trace_userstack() takes the ring buffer to write to, not the
 * trace array, so the ring buffer of @tr is passed.
 */
static void __trace_userstack(struct trace_array *tr, unsigned long flags)
{
	ftrace_trace_userstack(tr->trace_buffer.buffer, flags, preempt_count());
}
#endif /* UNUSED */
02b67518 1943
c0a0d0d3
FW
1944#endif /* CONFIG_STACKTRACE */
1945
07d777fe
SR
1946/* created for use with alloc_percpu */
1947struct trace_buffer_struct {
1948 char buffer[TRACE_BUF_SIZE];
1949};
1950
1951static struct trace_buffer_struct *trace_percpu_buffer;
1952static struct trace_buffer_struct *trace_percpu_sirq_buffer;
1953static struct trace_buffer_struct *trace_percpu_irq_buffer;
1954static struct trace_buffer_struct *trace_percpu_nmi_buffer;
1955
1956/*
1957 * The buffer used is dependent on the context. There is a per cpu
1958 * buffer for normal context, softirq contex, hard irq context and
1959 * for NMI context. Thise allows for lockless recording.
1960 *
1961 * Note, if the buffers failed to be allocated, then this returns NULL
1962 */
1963static char *get_trace_buf(void)
1964{
1965 struct trace_buffer_struct *percpu_buffer;
07d777fe
SR
1966
1967 /*
1968 * If we have allocated per cpu buffers, then we do not
1969 * need to do any locking.
1970 */
1971 if (in_nmi())
1972 percpu_buffer = trace_percpu_nmi_buffer;
1973 else if (in_irq())
1974 percpu_buffer = trace_percpu_irq_buffer;
1975 else if (in_softirq())
1976 percpu_buffer = trace_percpu_sirq_buffer;
1977 else
1978 percpu_buffer = trace_percpu_buffer;
1979
1980 if (!percpu_buffer)
1981 return NULL;
1982
d8a0349c 1983 return this_cpu_ptr(&percpu_buffer->buffer[0]);
07d777fe
SR
1984}
1985
1986static int alloc_percpu_trace_buffer(void)
1987{
1988 struct trace_buffer_struct *buffers;
1989 struct trace_buffer_struct *sirq_buffers;
1990 struct trace_buffer_struct *irq_buffers;
1991 struct trace_buffer_struct *nmi_buffers;
1992
1993 buffers = alloc_percpu(struct trace_buffer_struct);
1994 if (!buffers)
1995 goto err_warn;
1996
1997 sirq_buffers = alloc_percpu(struct trace_buffer_struct);
1998 if (!sirq_buffers)
1999 goto err_sirq;
2000
2001 irq_buffers = alloc_percpu(struct trace_buffer_struct);
2002 if (!irq_buffers)
2003 goto err_irq;
2004
2005 nmi_buffers = alloc_percpu(struct trace_buffer_struct);
2006 if (!nmi_buffers)
2007 goto err_nmi;
2008
2009 trace_percpu_buffer = buffers;
2010 trace_percpu_sirq_buffer = sirq_buffers;
2011 trace_percpu_irq_buffer = irq_buffers;
2012 trace_percpu_nmi_buffer = nmi_buffers;
2013
2014 return 0;
2015
2016 err_nmi:
2017 free_percpu(irq_buffers);
2018 err_irq:
2019 free_percpu(sirq_buffers);
2020 err_sirq:
2021 free_percpu(buffers);
2022 err_warn:
2023 WARN(1, "Could not allocate percpu trace_printk buffer");
2024 return -ENOMEM;
2025}
2026
81698831
SR
2027static int buffers_allocated;
2028
07d777fe
SR
2029void trace_printk_init_buffers(void)
2030{
07d777fe
SR
2031 if (buffers_allocated)
2032 return;
2033
2034 if (alloc_percpu_trace_buffer())
2035 return;
2036
2184db46
SR
2037 /* trace_printk() is for debug use only. Don't use it in production. */
2038
69a1c994
BP
2039 pr_warning("\n");
2040 pr_warning("**********************************************************\n");
2184db46
SR
2041 pr_warning("** NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE **\n");
2042 pr_warning("** **\n");
2043 pr_warning("** trace_printk() being used. Allocating extra memory. **\n");
2044 pr_warning("** **\n");
2045 pr_warning("** This means that this is a DEBUG kernel and it is **\n");
eff264ef 2046 pr_warning("** unsafe for production use. **\n");
2184db46
SR
2047 pr_warning("** **\n");
2048 pr_warning("** If you see this message and you are not debugging **\n");
2049 pr_warning("** the kernel, report this immediately to your vendor! **\n");
2050 pr_warning("** **\n");
2051 pr_warning("** NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE NOTICE **\n");
2052 pr_warning("**********************************************************\n");
07d777fe 2053
b382ede6
SR
2054 /* Expand the buffers to set size */
2055 tracing_update_buffers();
2056
07d777fe 2057 buffers_allocated = 1;
81698831
SR
2058
2059 /*
2060 * trace_printk_init_buffers() can be called by modules.
2061 * If that happens, then we need to start cmdline recording
2062 * directly here. If the global_trace.buffer is already
2063 * allocated here, then this was called by module code.
2064 */
12883efb 2065 if (global_trace.trace_buffer.buffer)
81698831
SR
2066 tracing_start_cmdline_record();
2067}
2068
2069void trace_printk_start_comm(void)
2070{
2071 /* Start tracing comms if trace printk is set */
2072 if (!buffers_allocated)
2073 return;
2074 tracing_start_cmdline_record();
2075}
2076
2077static void trace_printk_start_stop_comm(int enabled)
2078{
2079 if (!buffers_allocated)
2080 return;
2081
2082 if (enabled)
2083 tracing_start_cmdline_record();
2084 else
2085 tracing_stop_cmdline_record();
07d777fe
SR
2086}
2087
769b0441 2088/**
48ead020 2089 * trace_vbprintk - write binary msg to tracing buffer
769b0441
FW
2090 *
2091 */
40ce74f1 2092int trace_vbprintk(unsigned long ip, const char *fmt, va_list args)
769b0441 2093{
e1112b4d 2094 struct ftrace_event_call *call = &event_bprint;
769b0441 2095 struct ring_buffer_event *event;
e77405ad 2096 struct ring_buffer *buffer;
769b0441 2097 struct trace_array *tr = &global_trace;
48ead020 2098 struct bprint_entry *entry;
769b0441 2099 unsigned long flags;
07d777fe
SR
2100 char *tbuffer;
2101 int len = 0, size, pc;
769b0441
FW
2102
2103 if (unlikely(tracing_selftest_running || tracing_disabled))
2104 return 0;
2105
2106 /* Don't pollute graph traces with trace_vprintk internals */
2107 pause_graph_tracing();
2108
2109 pc = preempt_count();
5168ae50 2110 preempt_disable_notrace();
769b0441 2111
07d777fe
SR
2112 tbuffer = get_trace_buf();
2113 if (!tbuffer) {
2114 len = 0;
769b0441 2115 goto out;
07d777fe 2116 }
769b0441 2117
07d777fe 2118 len = vbin_printf((u32 *)tbuffer, TRACE_BUF_SIZE/sizeof(int), fmt, args);
769b0441 2119
07d777fe
SR
2120 if (len > TRACE_BUF_SIZE/sizeof(int) || len < 0)
2121 goto out;
769b0441 2122
07d777fe 2123 local_save_flags(flags);
769b0441 2124 size = sizeof(*entry) + sizeof(u32) * len;
12883efb 2125 buffer = tr->trace_buffer.buffer;
e77405ad
SR
2126 event = trace_buffer_lock_reserve(buffer, TRACE_BPRINT, size,
2127 flags, pc);
769b0441 2128 if (!event)
07d777fe 2129 goto out;
769b0441
FW
2130 entry = ring_buffer_event_data(event);
2131 entry->ip = ip;
769b0441
FW
2132 entry->fmt = fmt;
2133
07d777fe 2134 memcpy(entry->buf, tbuffer, sizeof(u32) * len);
f306cc82 2135 if (!call_filter_check_discard(call, entry, buffer, event)) {
7ffbd48d 2136 __buffer_unlock_commit(buffer, event);
d931369b
SR
2137 ftrace_trace_stack(buffer, flags, 6, pc);
2138 }
769b0441 2139
769b0441 2140out:
5168ae50 2141 preempt_enable_notrace();
769b0441
FW
2142 unpause_graph_tracing();
2143
2144 return len;
2145}
48ead020
FW
2146EXPORT_SYMBOL_GPL(trace_vbprintk);
2147
12883efb
SRRH
2148static int
2149__trace_array_vprintk(struct ring_buffer *buffer,
2150 unsigned long ip, const char *fmt, va_list args)
48ead020 2151{
e1112b4d 2152 struct ftrace_event_call *call = &event_print;
48ead020 2153 struct ring_buffer_event *event;
07d777fe 2154 int len = 0, size, pc;
48ead020 2155 struct print_entry *entry;
07d777fe
SR
2156 unsigned long flags;
2157 char *tbuffer;
48ead020
FW
2158
2159 if (tracing_disabled || tracing_selftest_running)
2160 return 0;
2161
07d777fe
SR
2162 /* Don't pollute graph traces with trace_vprintk internals */
2163 pause_graph_tracing();
2164
48ead020
FW
2165 pc = preempt_count();
2166 preempt_disable_notrace();
48ead020 2167
07d777fe
SR
2168
2169 tbuffer = get_trace_buf();
2170 if (!tbuffer) {
2171 len = 0;
48ead020 2172 goto out;
07d777fe 2173 }
48ead020 2174
3558a5ac 2175 len = vscnprintf(tbuffer, TRACE_BUF_SIZE, fmt, args);
48ead020 2176
07d777fe 2177 local_save_flags(flags);
48ead020 2178 size = sizeof(*entry) + len + 1;
e77405ad 2179 event = trace_buffer_lock_reserve(buffer, TRACE_PRINT, size,
07d777fe 2180 flags, pc);
48ead020 2181 if (!event)
07d777fe 2182 goto out;
48ead020 2183 entry = ring_buffer_event_data(event);
c13d2f7c 2184 entry->ip = ip;
48ead020 2185
3558a5ac 2186 memcpy(&entry->buf, tbuffer, len + 1);
f306cc82 2187 if (!call_filter_check_discard(call, entry, buffer, event)) {
7ffbd48d 2188 __buffer_unlock_commit(buffer, event);
07d777fe 2189 ftrace_trace_stack(buffer, flags, 6, pc);
d931369b 2190 }
48ead020
FW
2191 out:
2192 preempt_enable_notrace();
07d777fe 2193 unpause_graph_tracing();
48ead020
FW
2194
2195 return len;
2196}
659372d3 2197
12883efb
SRRH
2198int trace_array_vprintk(struct trace_array *tr,
2199 unsigned long ip, const char *fmt, va_list args)
2200{
2201 return __trace_array_vprintk(tr->trace_buffer.buffer, ip, fmt, args);
2202}
2203
2204int trace_array_printk(struct trace_array *tr,
2205 unsigned long ip, const char *fmt, ...)
2206{
2207 int ret;
2208 va_list ap;
2209
2210 if (!(trace_flags & TRACE_ITER_PRINTK))
2211 return 0;
2212
2213 va_start(ap, fmt);
2214 ret = trace_array_vprintk(tr, ip, fmt, ap);
2215 va_end(ap);
2216 return ret;
2217}
2218
2219int trace_array_printk_buf(struct ring_buffer *buffer,
2220 unsigned long ip, const char *fmt, ...)
2221{
2222 int ret;
2223 va_list ap;
2224
2225 if (!(trace_flags & TRACE_ITER_PRINTK))
2226 return 0;
2227
2228 va_start(ap, fmt);
2229 ret = __trace_array_vprintk(buffer, ip, fmt, ap);
2230 va_end(ap);
2231 return ret;
2232}
2233
659372d3
SR
2234int trace_vprintk(unsigned long ip, const char *fmt, va_list args)
2235{
a813a159 2236 return trace_array_vprintk(&global_trace, ip, fmt, args);
659372d3 2237}
769b0441
FW
2238EXPORT_SYMBOL_GPL(trace_vprintk);
2239
e2ac8ef5 2240static void trace_iterator_increment(struct trace_iterator *iter)
5a90f577 2241{
6d158a81
SR
2242 struct ring_buffer_iter *buf_iter = trace_buffer_iter(iter, iter->cpu);
2243
5a90f577 2244 iter->idx++;
6d158a81
SR
2245 if (buf_iter)
2246 ring_buffer_read(buf_iter, NULL);
5a90f577
SR
2247}
2248
e309b41d 2249static struct trace_entry *
bc21b478
SR
2250peek_next_entry(struct trace_iterator *iter, int cpu, u64 *ts,
2251 unsigned long *lost_events)
dd0e545f 2252{
3928a8a2 2253 struct ring_buffer_event *event;
6d158a81 2254 struct ring_buffer_iter *buf_iter = trace_buffer_iter(iter, cpu);
dd0e545f 2255
d769041f
SR
2256 if (buf_iter)
2257 event = ring_buffer_iter_peek(buf_iter, ts);
2258 else
12883efb 2259 event = ring_buffer_peek(iter->trace_buffer->buffer, cpu, ts,
bc21b478 2260 lost_events);
d769041f 2261
4a9bd3f1
SR
2262 if (event) {
2263 iter->ent_size = ring_buffer_event_length(event);
2264 return ring_buffer_event_data(event);
2265 }
2266 iter->ent_size = 0;
2267 return NULL;
dd0e545f 2268}
d769041f 2269
dd0e545f 2270static struct trace_entry *
bc21b478
SR
2271__find_next_entry(struct trace_iterator *iter, int *ent_cpu,
2272 unsigned long *missing_events, u64 *ent_ts)
bc0c38d1 2273{
12883efb 2274 struct ring_buffer *buffer = iter->trace_buffer->buffer;
bc0c38d1 2275 struct trace_entry *ent, *next = NULL;
aa27497c 2276 unsigned long lost_events = 0, next_lost = 0;
b04cc6b1 2277 int cpu_file = iter->cpu_file;
3928a8a2 2278 u64 next_ts = 0, ts;
bc0c38d1 2279 int next_cpu = -1;
12b5da34 2280 int next_size = 0;
bc0c38d1
SR
2281 int cpu;
2282
b04cc6b1
FW
2283 /*
2284 * If we are in a per_cpu trace file, don't bother by iterating over
2285 * all cpu and peek directly.
2286 */
ae3b5093 2287 if (cpu_file > RING_BUFFER_ALL_CPUS) {
b04cc6b1
FW
2288 if (ring_buffer_empty_cpu(buffer, cpu_file))
2289 return NULL;
bc21b478 2290 ent = peek_next_entry(iter, cpu_file, ent_ts, missing_events);
b04cc6b1
FW
2291 if (ent_cpu)
2292 *ent_cpu = cpu_file;
2293
2294 return ent;
2295 }
2296
ab46428c 2297 for_each_tracing_cpu(cpu) {
dd0e545f 2298
3928a8a2
SR
2299 if (ring_buffer_empty_cpu(buffer, cpu))
2300 continue;
dd0e545f 2301
bc21b478 2302 ent = peek_next_entry(iter, cpu, &ts, &lost_events);
dd0e545f 2303
cdd31cd2
IM
2304 /*
2305 * Pick the entry with the smallest timestamp:
2306 */
3928a8a2 2307 if (ent && (!next || ts < next_ts)) {
bc0c38d1
SR
2308 next = ent;
2309 next_cpu = cpu;
3928a8a2 2310 next_ts = ts;
bc21b478 2311 next_lost = lost_events;
12b5da34 2312 next_size = iter->ent_size;
bc0c38d1
SR
2313 }
2314 }
2315
12b5da34
SR
2316 iter->ent_size = next_size;
2317
bc0c38d1
SR
2318 if (ent_cpu)
2319 *ent_cpu = next_cpu;
2320
3928a8a2
SR
2321 if (ent_ts)
2322 *ent_ts = next_ts;
2323
bc21b478
SR
2324 if (missing_events)
2325 *missing_events = next_lost;
2326
bc0c38d1
SR
2327 return next;
2328}
2329
dd0e545f 2330/* Find the next real entry, without updating the iterator itself */
c4a8e8be
FW
2331struct trace_entry *trace_find_next_entry(struct trace_iterator *iter,
2332 int *ent_cpu, u64 *ent_ts)
bc0c38d1 2333{
bc21b478 2334 return __find_next_entry(iter, ent_cpu, NULL, ent_ts);
dd0e545f
SR
2335}
2336
2337/* Find the next real entry, and increment the iterator to the next entry */
955b61e5 2338void *trace_find_next_entry_inc(struct trace_iterator *iter)
dd0e545f 2339{
bc21b478
SR
2340 iter->ent = __find_next_entry(iter, &iter->cpu,
2341 &iter->lost_events, &iter->ts);
dd0e545f 2342
3928a8a2 2343 if (iter->ent)
e2ac8ef5 2344 trace_iterator_increment(iter);
dd0e545f 2345
3928a8a2 2346 return iter->ent ? iter : NULL;
b3806b43 2347}
bc0c38d1 2348
e309b41d 2349static void trace_consume(struct trace_iterator *iter)
b3806b43 2350{
12883efb 2351 ring_buffer_consume(iter->trace_buffer->buffer, iter->cpu, &iter->ts,
bc21b478 2352 &iter->lost_events);
bc0c38d1
SR
2353}
2354
e309b41d 2355static void *s_next(struct seq_file *m, void *v, loff_t *pos)
bc0c38d1
SR
2356{
2357 struct trace_iterator *iter = m->private;
bc0c38d1 2358 int i = (int)*pos;
4e3c3333 2359 void *ent;
bc0c38d1 2360
a63ce5b3
SR
2361 WARN_ON_ONCE(iter->leftover);
2362
bc0c38d1
SR
2363 (*pos)++;
2364
2365 /* can't go backwards */
2366 if (iter->idx > i)
2367 return NULL;
2368
2369 if (iter->idx < 0)
955b61e5 2370 ent = trace_find_next_entry_inc(iter);
bc0c38d1
SR
2371 else
2372 ent = iter;
2373
2374 while (ent && iter->idx < i)
955b61e5 2375 ent = trace_find_next_entry_inc(iter);
bc0c38d1
SR
2376
2377 iter->pos = *pos;
2378
bc0c38d1
SR
2379 return ent;
2380}
2381
955b61e5 2382void tracing_iter_reset(struct trace_iterator *iter, int cpu)
2f26ebd5 2383{
2f26ebd5
SR
2384 struct ring_buffer_event *event;
2385 struct ring_buffer_iter *buf_iter;
2386 unsigned long entries = 0;
2387 u64 ts;
2388
12883efb 2389 per_cpu_ptr(iter->trace_buffer->data, cpu)->skipped_entries = 0;
2f26ebd5 2390
6d158a81
SR
2391 buf_iter = trace_buffer_iter(iter, cpu);
2392 if (!buf_iter)
2f26ebd5
SR
2393 return;
2394
2f26ebd5
SR
2395 ring_buffer_iter_reset(buf_iter);
2396
2397 /*
2398 * We could have the case with the max latency tracers
2399 * that a reset never took place on a cpu. This is evident
2400 * by the timestamp being before the start of the buffer.
2401 */
2402 while ((event = ring_buffer_iter_peek(buf_iter, &ts))) {
12883efb 2403 if (ts >= iter->trace_buffer->time_start)
2f26ebd5
SR
2404 break;
2405 entries++;
2406 ring_buffer_read(buf_iter, NULL);
2407 }
2408
12883efb 2409 per_cpu_ptr(iter->trace_buffer->data, cpu)->skipped_entries = entries;
2f26ebd5
SR
2410}
2411
d7350c3f 2412/*
d7350c3f
FW
2413 * The current tracer is copied to avoid a global locking
2414 * all around.
2415 */
bc0c38d1
SR
2416static void *s_start(struct seq_file *m, loff_t *pos)
2417{
2418 struct trace_iterator *iter = m->private;
2b6080f2 2419 struct trace_array *tr = iter->tr;
b04cc6b1 2420 int cpu_file = iter->cpu_file;
bc0c38d1
SR
2421 void *p = NULL;
2422 loff_t l = 0;
3928a8a2 2423 int cpu;
bc0c38d1 2424
2fd196ec
HT
2425 /*
2426 * copy the tracer to avoid using a global lock all around.
2427 * iter->trace is a copy of current_trace, the pointer to the
2428 * name may be used instead of a strcmp(), as iter->trace->name
2429 * will point to the same string as current_trace->name.
2430 */
bc0c38d1 2431 mutex_lock(&trace_types_lock);
2b6080f2
SR
2432 if (unlikely(tr->current_trace && iter->trace->name != tr->current_trace->name))
2433 *iter->trace = *tr->current_trace;
d7350c3f 2434 mutex_unlock(&trace_types_lock);
bc0c38d1 2435
12883efb 2436#ifdef CONFIG_TRACER_MAX_TRACE
debdd57f
HT
2437 if (iter->snapshot && iter->trace->use_max_tr)
2438 return ERR_PTR(-EBUSY);
12883efb 2439#endif
debdd57f
HT
2440
2441 if (!iter->snapshot)
2442 atomic_inc(&trace_record_cmdline_disabled);
bc0c38d1 2443
bc0c38d1
SR
2444 if (*pos != iter->pos) {
2445 iter->ent = NULL;
2446 iter->cpu = 0;
2447 iter->idx = -1;
2448
ae3b5093 2449 if (cpu_file == RING_BUFFER_ALL_CPUS) {
b04cc6b1 2450 for_each_tracing_cpu(cpu)
2f26ebd5 2451 tracing_iter_reset(iter, cpu);
b04cc6b1 2452 } else
2f26ebd5 2453 tracing_iter_reset(iter, cpu_file);
bc0c38d1 2454
ac91d854 2455 iter->leftover = 0;
bc0c38d1
SR
2456 for (p = iter; p && l < *pos; p = s_next(m, p, &l))
2457 ;
2458
2459 } else {
a63ce5b3
SR
2460 /*
2461 * If we overflowed the seq_file before, then we want
2462 * to just reuse the trace_seq buffer again.
2463 */
2464 if (iter->leftover)
2465 p = iter;
2466 else {
2467 l = *pos - 1;
2468 p = s_next(m, p, &l);
2469 }
bc0c38d1
SR
2470 }
2471
4f535968 2472 trace_event_read_lock();
7e53bd42 2473 trace_access_lock(cpu_file);
bc0c38d1
SR
2474 return p;
2475}
2476
2477static void s_stop(struct seq_file *m, void *p)
2478{
7e53bd42
LJ
2479 struct trace_iterator *iter = m->private;
2480
12883efb 2481#ifdef CONFIG_TRACER_MAX_TRACE
debdd57f
HT
2482 if (iter->snapshot && iter->trace->use_max_tr)
2483 return;
12883efb 2484#endif
debdd57f
HT
2485
2486 if (!iter->snapshot)
2487 atomic_dec(&trace_record_cmdline_disabled);
12883efb 2488
7e53bd42 2489 trace_access_unlock(iter->cpu_file);
4f535968 2490 trace_event_read_unlock();
bc0c38d1
SR
2491}
2492
39eaf7ef 2493static void
12883efb
SRRH
2494get_total_entries(struct trace_buffer *buf,
2495 unsigned long *total, unsigned long *entries)
39eaf7ef
SR
2496{
2497 unsigned long count;
2498 int cpu;
2499
2500 *total = 0;
2501 *entries = 0;
2502
2503 for_each_tracing_cpu(cpu) {
12883efb 2504 count = ring_buffer_entries_cpu(buf->buffer, cpu);
39eaf7ef
SR
2505 /*
2506 * If this buffer has skipped entries, then we hold all
2507 * entries for the trace and we need to ignore the
2508 * ones before the time stamp.
2509 */
12883efb
SRRH
2510 if (per_cpu_ptr(buf->data, cpu)->skipped_entries) {
2511 count -= per_cpu_ptr(buf->data, cpu)->skipped_entries;
39eaf7ef
SR
2512 /* total is the same as the entries */
2513 *total += count;
2514 } else
2515 *total += count +
12883efb 2516 ring_buffer_overrun_cpu(buf->buffer, cpu);
39eaf7ef
SR
2517 *entries += count;
2518 }
2519}
2520
/* Emit the column legend used by the latency output format. */
static void print_lat_help_header(struct seq_file *m)
{
	static const char legend[] =
		"# _------=> CPU# \n"
		"# / _-----=> irqs-off \n"
		"# | / _----=> need-resched \n"
		"# || / _---=> hardirq/softirq \n"
		"# ||| / _--=> preempt-depth \n"
		"# |||| / delay \n"
		"# cmd pid ||||| time | caller \n"
		"# \\ / ||||| \\ | / \n";

	seq_puts(m, legend);
}
2532
/*
 * Print the "entries-in-buffer/entries-written" summary line for @buf
 * along with the number of online cpus.
 */
static void print_event_info(struct trace_buffer *buf, struct seq_file *m)
{
	unsigned long written;
	unsigned long in_buffer;

	get_total_entries(buf, &written, &in_buffer);
	seq_printf(m, "# entries-in-buffer/entries-written: %lu/%lu #P:%d\n",
		   in_buffer, written, num_online_cpus());
	seq_puts(m, "#\n");
}
2543
/* Print the entry summary followed by the plain column header. */
static void print_func_help_header(struct trace_buffer *buf, struct seq_file *m)
{
	static const char columns[] =
		"# TASK-PID CPU# TIMESTAMP FUNCTION\n"
		"# | | | | |\n";

	print_event_info(buf, m);
	seq_puts(m, columns);
}
2550
/*
 * Print the entry summary followed by the column header that also
 * carries the irq/preempt state legend.
 */
static void print_func_help_header_irq(struct trace_buffer *buf, struct seq_file *m)
{
	static const char columns[] =
		"# _-----=> irqs-off\n"
		"# / _----=> need-resched\n"
		"# | / _---=> hardirq/softirq\n"
		"# || / _--=> preempt-depth\n"
		"# ||| / delay\n"
		"# TASK-PID CPU# |||| TIMESTAMP FUNCTION\n"
		"# | | | |||| | |\n";

	print_event_info(buf, m);
	seq_puts(m, columns);
}
bc0c38d1 2562
62b915f1 2563void
bc0c38d1
SR
2564print_trace_header(struct seq_file *m, struct trace_iterator *iter)
2565{
2566 unsigned long sym_flags = (trace_flags & TRACE_ITER_SYM_MASK);
12883efb
SRRH
2567 struct trace_buffer *buf = iter->trace_buffer;
2568 struct trace_array_cpu *data = per_cpu_ptr(buf->data, buf->cpu);
2b6080f2 2569 struct tracer *type = iter->trace;
39eaf7ef
SR
2570 unsigned long entries;
2571 unsigned long total;
bc0c38d1
SR
2572 const char *name = "preemption";
2573
d840f718 2574 name = type->name;
bc0c38d1 2575
12883efb 2576 get_total_entries(buf, &total, &entries);
bc0c38d1 2577
888b55dc 2578 seq_printf(m, "# %s latency trace v1.1.5 on %s\n",
bc0c38d1 2579 name, UTS_RELEASE);
888b55dc 2580 seq_puts(m, "# -----------------------------------"
bc0c38d1 2581 "---------------------------------\n");
888b55dc 2582 seq_printf(m, "# latency: %lu us, #%lu/%lu, CPU#%d |"
bc0c38d1 2583 " (M:%s VP:%d, KP:%d, SP:%d HP:%d",
57f50be1 2584 nsecs_to_usecs(data->saved_latency),
bc0c38d1 2585 entries,
4c11d7ae 2586 total,
12883efb 2587 buf->cpu,
bc0c38d1
SR
2588#if defined(CONFIG_PREEMPT_NONE)
2589 "server",
2590#elif defined(CONFIG_PREEMPT_VOLUNTARY)
2591 "desktop",
b5c21b45 2592#elif defined(CONFIG_PREEMPT)
bc0c38d1
SR
2593 "preempt",
2594#else
2595 "unknown",
2596#endif
2597 /* These are reserved for later use */
2598 0, 0, 0, 0);
2599#ifdef CONFIG_SMP
2600 seq_printf(m, " #P:%d)\n", num_online_cpus());
2601#else
2602 seq_puts(m, ")\n");
2603#endif
888b55dc
KM
2604 seq_puts(m, "# -----------------\n");
2605 seq_printf(m, "# | task: %.16s-%d "
bc0c38d1 2606 "(uid:%d nice:%ld policy:%ld rt_prio:%ld)\n",
d20b92ab
EB
2607 data->comm, data->pid,
2608 from_kuid_munged(seq_user_ns(m), data->uid), data->nice,
bc0c38d1 2609 data->policy, data->rt_priority);
888b55dc 2610 seq_puts(m, "# -----------------\n");
bc0c38d1
SR
2611
2612 if (data->critical_start) {
888b55dc 2613 seq_puts(m, "# => started at: ");
214023c3
SR
2614 seq_print_ip_sym(&iter->seq, data->critical_start, sym_flags);
2615 trace_print_seq(m, &iter->seq);
888b55dc 2616 seq_puts(m, "\n# => ended at: ");
214023c3
SR
2617 seq_print_ip_sym(&iter->seq, data->critical_end, sym_flags);
2618 trace_print_seq(m, &iter->seq);
8248ac05 2619 seq_puts(m, "\n#\n");
bc0c38d1
SR
2620 }
2621
888b55dc 2622 seq_puts(m, "#\n");
bc0c38d1
SR
2623}
2624
a309720c
SR
2625static void test_cpu_buff_start(struct trace_iterator *iter)
2626{
2627 struct trace_seq *s = &iter->seq;
2628
12ef7d44
SR
2629 if (!(trace_flags & TRACE_ITER_ANNOTATE))
2630 return;
2631
2632 if (!(iter->iter_flags & TRACE_FILE_ANNOTATE))
2633 return;
2634
4462344e 2635 if (cpumask_test_cpu(iter->cpu, iter->started))
a309720c
SR
2636 return;
2637
12883efb 2638 if (per_cpu_ptr(iter->trace_buffer->data, iter->cpu)->skipped_entries)
2f26ebd5
SR
2639 return;
2640
4462344e 2641 cpumask_set_cpu(iter->cpu, iter->started);
b0dfa978
FW
2642
2643 /* Don't print started cpu buffer for the first entry of the trace */
2644 if (iter->idx > 1)
2645 trace_seq_printf(s, "##### CPU %u buffer started ####\n",
2646 iter->cpu);
a309720c
SR
2647}
2648
2c4f035f 2649static enum print_line_t print_trace_fmt(struct trace_iterator *iter)
bc0c38d1 2650{
214023c3 2651 struct trace_seq *s = &iter->seq;
bc0c38d1 2652 unsigned long sym_flags = (trace_flags & TRACE_ITER_SYM_MASK);
4e3c3333 2653 struct trace_entry *entry;
f633cef0 2654 struct trace_event *event;
bc0c38d1 2655
4e3c3333 2656 entry = iter->ent;
dd0e545f 2657
a309720c
SR
2658 test_cpu_buff_start(iter);
2659
c4a8e8be 2660 event = ftrace_find_event(entry->type);
bc0c38d1 2661
c4a8e8be 2662 if (trace_flags & TRACE_ITER_CONTEXT_INFO) {
19a7fe20
SRRH
2663 if (iter->iter_flags & TRACE_FILE_LAT_FMT)
2664 trace_print_lat_context(iter);
2665 else
2666 trace_print_context(iter);
c4a8e8be 2667 }
bc0c38d1 2668
19a7fe20
SRRH
2669 if (trace_seq_has_overflowed(s))
2670 return TRACE_TYPE_PARTIAL_LINE;
2671
268ccda0 2672 if (event)
a9a57763 2673 return event->funcs->trace(iter, sym_flags, event);
d9793bd8 2674
19a7fe20 2675 trace_seq_printf(s, "Unknown type %d\n", entry->type);
02b67518 2676
19a7fe20 2677 return trace_handle_return(s);
bc0c38d1
SR
2678}
2679
2c4f035f 2680static enum print_line_t print_raw_fmt(struct trace_iterator *iter)
f9896bf3
IM
2681{
2682 struct trace_seq *s = &iter->seq;
2683 struct trace_entry *entry;
f633cef0 2684 struct trace_event *event;
f9896bf3
IM
2685
2686 entry = iter->ent;
dd0e545f 2687
19a7fe20
SRRH
2688 if (trace_flags & TRACE_ITER_CONTEXT_INFO)
2689 trace_seq_printf(s, "%d %d %llu ",
2690 entry->pid, iter->cpu, iter->ts);
2691
2692 if (trace_seq_has_overflowed(s))
2693 return TRACE_TYPE_PARTIAL_LINE;
f9896bf3 2694
f633cef0 2695 event = ftrace_find_event(entry->type);
268ccda0 2696 if (event)
a9a57763 2697 return event->funcs->raw(iter, 0, event);
d9793bd8 2698
19a7fe20 2699 trace_seq_printf(s, "%d ?\n", entry->type);
777e208d 2700
19a7fe20 2701 return trace_handle_return(s);
f9896bf3
IM
2702}
2703
2c4f035f 2704static enum print_line_t print_hex_fmt(struct trace_iterator *iter)
5e3ca0ec
IM
2705{
2706 struct trace_seq *s = &iter->seq;
2707 unsigned char newline = '\n';
2708 struct trace_entry *entry;
f633cef0 2709 struct trace_event *event;
5e3ca0ec
IM
2710
2711 entry = iter->ent;
dd0e545f 2712
c4a8e8be 2713 if (trace_flags & TRACE_ITER_CONTEXT_INFO) {
19a7fe20
SRRH
2714 SEQ_PUT_HEX_FIELD(s, entry->pid);
2715 SEQ_PUT_HEX_FIELD(s, iter->cpu);
2716 SEQ_PUT_HEX_FIELD(s, iter->ts);
2717 if (trace_seq_has_overflowed(s))
2718 return TRACE_TYPE_PARTIAL_LINE;
c4a8e8be 2719 }
5e3ca0ec 2720
f633cef0 2721 event = ftrace_find_event(entry->type);
268ccda0 2722 if (event) {
a9a57763 2723 enum print_line_t ret = event->funcs->hex(iter, 0, event);
d9793bd8
ACM
2724 if (ret != TRACE_TYPE_HANDLED)
2725 return ret;
2726 }
7104f300 2727
19a7fe20 2728 SEQ_PUT_FIELD(s, newline);
5e3ca0ec 2729
19a7fe20 2730 return trace_handle_return(s);
5e3ca0ec
IM
2731}
2732
2c4f035f 2733static enum print_line_t print_bin_fmt(struct trace_iterator *iter)
cb0f12aa
IM
2734{
2735 struct trace_seq *s = &iter->seq;
2736 struct trace_entry *entry;
f633cef0 2737 struct trace_event *event;
cb0f12aa
IM
2738
2739 entry = iter->ent;
dd0e545f 2740
c4a8e8be 2741 if (trace_flags & TRACE_ITER_CONTEXT_INFO) {
19a7fe20
SRRH
2742 SEQ_PUT_FIELD(s, entry->pid);
2743 SEQ_PUT_FIELD(s, iter->cpu);
2744 SEQ_PUT_FIELD(s, iter->ts);
2745 if (trace_seq_has_overflowed(s))
2746 return TRACE_TYPE_PARTIAL_LINE;
c4a8e8be 2747 }
cb0f12aa 2748
f633cef0 2749 event = ftrace_find_event(entry->type);
a9a57763
SR
2750 return event ? event->funcs->binary(iter, 0, event) :
2751 TRACE_TYPE_HANDLED;
cb0f12aa
IM
2752}
2753
62b915f1 2754int trace_empty(struct trace_iterator *iter)
bc0c38d1 2755{
6d158a81 2756 struct ring_buffer_iter *buf_iter;
bc0c38d1
SR
2757 int cpu;
2758
9aba60fe 2759 /* If we are looking at one CPU buffer, only check that one */
ae3b5093 2760 if (iter->cpu_file != RING_BUFFER_ALL_CPUS) {
9aba60fe 2761 cpu = iter->cpu_file;
6d158a81
SR
2762 buf_iter = trace_buffer_iter(iter, cpu);
2763 if (buf_iter) {
2764 if (!ring_buffer_iter_empty(buf_iter))
9aba60fe
SR
2765 return 0;
2766 } else {
12883efb 2767 if (!ring_buffer_empty_cpu(iter->trace_buffer->buffer, cpu))
9aba60fe
SR
2768 return 0;
2769 }
2770 return 1;
2771 }
2772
ab46428c 2773 for_each_tracing_cpu(cpu) {
6d158a81
SR
2774 buf_iter = trace_buffer_iter(iter, cpu);
2775 if (buf_iter) {
2776 if (!ring_buffer_iter_empty(buf_iter))
d769041f
SR
2777 return 0;
2778 } else {
12883efb 2779 if (!ring_buffer_empty_cpu(iter->trace_buffer->buffer, cpu))
d769041f
SR
2780 return 0;
2781 }
bc0c38d1 2782 }
d769041f 2783
797d3712 2784 return 1;
bc0c38d1
SR
2785}
2786
4f535968 2787/* Called with trace_event_read_lock() held. */
955b61e5 2788enum print_line_t print_trace_line(struct trace_iterator *iter)
f9896bf3 2789{
2c4f035f
FW
2790 enum print_line_t ret;
2791
19a7fe20
SRRH
2792 if (iter->lost_events) {
2793 trace_seq_printf(&iter->seq, "CPU:%d [LOST %lu EVENTS]\n",
2794 iter->cpu, iter->lost_events);
2795 if (trace_seq_has_overflowed(&iter->seq))
2796 return TRACE_TYPE_PARTIAL_LINE;
2797 }
bc21b478 2798
2c4f035f
FW
2799 if (iter->trace && iter->trace->print_line) {
2800 ret = iter->trace->print_line(iter);
2801 if (ret != TRACE_TYPE_UNHANDLED)
2802 return ret;
2803 }
72829bc3 2804
09ae7234
SRRH
2805 if (iter->ent->type == TRACE_BPUTS &&
2806 trace_flags & TRACE_ITER_PRINTK &&
2807 trace_flags & TRACE_ITER_PRINTK_MSGONLY)
2808 return trace_print_bputs_msg_only(iter);
2809
48ead020
FW
2810 if (iter->ent->type == TRACE_BPRINT &&
2811 trace_flags & TRACE_ITER_PRINTK &&
2812 trace_flags & TRACE_ITER_PRINTK_MSGONLY)
5ef841f6 2813 return trace_print_bprintk_msg_only(iter);
48ead020 2814
66896a85
FW
2815 if (iter->ent->type == TRACE_PRINT &&
2816 trace_flags & TRACE_ITER_PRINTK &&
2817 trace_flags & TRACE_ITER_PRINTK_MSGONLY)
5ef841f6 2818 return trace_print_printk_msg_only(iter);
66896a85 2819
cb0f12aa
IM
2820 if (trace_flags & TRACE_ITER_BIN)
2821 return print_bin_fmt(iter);
2822
5e3ca0ec
IM
2823 if (trace_flags & TRACE_ITER_HEX)
2824 return print_hex_fmt(iter);
2825
f9896bf3
IM
2826 if (trace_flags & TRACE_ITER_RAW)
2827 return print_raw_fmt(iter);
2828
f9896bf3
IM
2829 return print_trace_fmt(iter);
2830}
2831
7e9a49ef
JO
2832void trace_latency_header(struct seq_file *m)
2833{
2834 struct trace_iterator *iter = m->private;
2835
2836 /* print nothing if the buffers are empty */
2837 if (trace_empty(iter))
2838 return;
2839
2840 if (iter->iter_flags & TRACE_FILE_LAT_FMT)
2841 print_trace_header(m, iter);
2842
2843 if (!(trace_flags & TRACE_ITER_VERBOSE))
2844 print_lat_help_header(m);
2845}
2846
62b915f1
JO
2847void trace_default_header(struct seq_file *m)
2848{
2849 struct trace_iterator *iter = m->private;
2850
f56e7f8e
JO
2851 if (!(trace_flags & TRACE_ITER_CONTEXT_INFO))
2852 return;
2853
62b915f1
JO
2854 if (iter->iter_flags & TRACE_FILE_LAT_FMT) {
2855 /* print nothing if the buffers are empty */
2856 if (trace_empty(iter))
2857 return;
2858 print_trace_header(m, iter);
2859 if (!(trace_flags & TRACE_ITER_VERBOSE))
2860 print_lat_help_header(m);
2861 } else {
77271ce4
SR
2862 if (!(trace_flags & TRACE_ITER_VERBOSE)) {
2863 if (trace_flags & TRACE_ITER_IRQ_INFO)
12883efb 2864 print_func_help_header_irq(iter->trace_buffer, m);
77271ce4 2865 else
12883efb 2866 print_func_help_header(iter->trace_buffer, m);
77271ce4 2867 }
62b915f1
JO
2868 }
2869}
2870
e0a413f6
SR
/* Warn in the trace output when ftrace_is_dead() reports true. */
static void test_ftrace_alive(struct seq_file *m)
{
	if (ftrace_is_dead())
		seq_puts(m, "# WARNING: FUNCTION TRACING IS CORRUPTED\n"
			 "# MAY BE MISSING FUNCTION EVENTS\n");
}
2878
#ifdef CONFIG_TRACER_MAX_TRACE
/* Usage text for the top level snapshot file. */
static void show_snapshot_main_help(struct seq_file *m)
{
	static const char usage[] =
		"# echo 0 > snapshot : Clears and frees snapshot buffer\n"
		"# echo 1 > snapshot : Allocates snapshot buffer, if not already allocated.\n"
		"# Takes a snapshot of the main buffer.\n"
		"# echo 2 > snapshot : Clears snapshot buffer (but does not allocate or free)\n"
		"# (Doesn't have to be '2' works with any number that\n"
		"# is not a '0' or '1')\n";

	seq_puts(m, usage);
}

/*
 * Usage text for a per_cpu snapshot file. What "echo 1" does depends
 * on CONFIG_RING_BUFFER_ALLOW_SWAP.
 */
static void show_snapshot_percpu_help(struct seq_file *m)
{
	seq_puts(m, "# echo 0 > snapshot : Invalid for per_cpu snapshot file.\n");
#ifdef CONFIG_RING_BUFFER_ALLOW_SWAP
	seq_puts(m, "# echo 1 > snapshot : Allocates snapshot buffer, if not already allocated.\n"
		 "# Takes a snapshot of the main buffer for this cpu.\n");
#else
	seq_puts(m, "# echo 1 > snapshot : Not supported with this kernel.\n"
		 "# Must use main snapshot file to allocate.\n");
#endif
	seq_puts(m, "# echo 2 > snapshot : Clears this cpu's snapshot buffer (but does not allocate)\n"
		 "# (Doesn't have to be '2' works with any number that\n"
		 "# is not a '0' or '1')\n");
}

/*
 * Report whether the snapshot buffer is allocated, then list the
 * commands accepted by this (top level or per_cpu) snapshot file.
 */
static void print_snapshot_help(struct seq_file *m, struct trace_iterator *iter)
{
	const char *state;

	state = iter->tr->allocated_snapshot ?
		"#\n# * Snapshot is allocated *\n#\n" :
		"#\n# * Snapshot is freed *\n#\n";
	seq_puts(m, state);

	seq_puts(m, "# Snapshot commands:\n");
	if (iter->cpu_file != RING_BUFFER_ALL_CPUS)
		show_snapshot_percpu_help(m);
	else
		show_snapshot_main_help(m);
}
#else
/* Should never be called */
static inline void print_snapshot_help(struct seq_file *m, struct trace_iterator *iter) { }
#endif
2922
bc0c38d1
SR
2923static int s_show(struct seq_file *m, void *v)
2924{
2925 struct trace_iterator *iter = v;
a63ce5b3 2926 int ret;
bc0c38d1
SR
2927
2928 if (iter->ent == NULL) {
2929 if (iter->tr) {
2930 seq_printf(m, "# tracer: %s\n", iter->trace->name);
2931 seq_puts(m, "#\n");
e0a413f6 2932 test_ftrace_alive(m);
bc0c38d1 2933 }
d8741e2e
SRRH
2934 if (iter->snapshot && trace_empty(iter))
2935 print_snapshot_help(m, iter);
2936 else if (iter->trace && iter->trace->print_header)
8bba1bf5 2937 iter->trace->print_header(m);
62b915f1
JO
2938 else
2939 trace_default_header(m);
2940
a63ce5b3
SR
2941 } else if (iter->leftover) {
2942 /*
2943 * If we filled the seq_file buffer earlier, we
2944 * want to just show it now.
2945 */
2946 ret = trace_print_seq(m, &iter->seq);
2947
2948 /* ret should this time be zero, but you never know */
2949 iter->leftover = ret;
2950
bc0c38d1 2951 } else {
f9896bf3 2952 print_trace_line(iter);
a63ce5b3
SR
2953 ret = trace_print_seq(m, &iter->seq);
2954 /*
2955 * If we overflow the seq_file buffer, then it will
2956 * ask us for this data again at start up.
2957 * Use that instead.
2958 * ret is 0 if seq_file write succeeded.
2959 * -1 otherwise.
2960 */
2961 iter->leftover = ret;
bc0c38d1
SR
2962 }
2963
2964 return 0;
2965}
2966
649e9c70
ON
2967/*
2968 * Should be used after trace_array_get(), trace_types_lock
2969 * ensures that i_cdev was already initialized.
2970 */
2971static inline int tracing_get_cpu(struct inode *inode)
2972{
2973 if (inode->i_cdev) /* See trace_create_cpu_file() */
2974 return (long)inode->i_cdev - 1;
2975 return RING_BUFFER_ALL_CPUS;
2976}
2977
88e9d34c 2978static const struct seq_operations tracer_seq_ops = {
4bf39a94
IM
2979 .start = s_start,
2980 .next = s_next,
2981 .stop = s_stop,
2982 .show = s_show,
bc0c38d1
SR
2983};
2984
e309b41d 2985static struct trace_iterator *
6484c71c 2986__tracing_open(struct inode *inode, struct file *file, bool snapshot)
bc0c38d1 2987{
6484c71c 2988 struct trace_array *tr = inode->i_private;
bc0c38d1 2989 struct trace_iterator *iter;
50e18b94 2990 int cpu;
bc0c38d1 2991
85a2f9b4
SR
2992 if (tracing_disabled)
2993 return ERR_PTR(-ENODEV);
60a11774 2994
50e18b94 2995 iter = __seq_open_private(file, &tracer_seq_ops, sizeof(*iter));
85a2f9b4
SR
2996 if (!iter)
2997 return ERR_PTR(-ENOMEM);
bc0c38d1 2998
6d158a81
SR
2999 iter->buffer_iter = kzalloc(sizeof(*iter->buffer_iter) * num_possible_cpus(),
3000 GFP_KERNEL);
93574fcc
DC
3001 if (!iter->buffer_iter)
3002 goto release;
3003
d7350c3f
FW
3004 /*
3005 * We make a copy of the current tracer to avoid concurrent
3006 * changes on it while we are reading.
3007 */
bc0c38d1 3008 mutex_lock(&trace_types_lock);
d7350c3f 3009 iter->trace = kzalloc(sizeof(*iter->trace), GFP_KERNEL);
85a2f9b4 3010 if (!iter->trace)
d7350c3f 3011 goto fail;
85a2f9b4 3012
2b6080f2 3013 *iter->trace = *tr->current_trace;
d7350c3f 3014
79f55997 3015 if (!zalloc_cpumask_var(&iter->started, GFP_KERNEL))
b0dfa978
FW
3016 goto fail;
3017
12883efb
SRRH
3018 iter->tr = tr;
3019
3020#ifdef CONFIG_TRACER_MAX_TRACE
2b6080f2
SR
3021 /* Currently only the top directory has a snapshot */
3022 if (tr->current_trace->print_max || snapshot)
12883efb 3023 iter->trace_buffer = &tr->max_buffer;
bc0c38d1 3024 else
12883efb
SRRH
3025#endif
3026 iter->trace_buffer = &tr->trace_buffer;
debdd57f 3027 iter->snapshot = snapshot;
bc0c38d1 3028 iter->pos = -1;
6484c71c 3029 iter->cpu_file = tracing_get_cpu(inode);
d7350c3f 3030 mutex_init(&iter->mutex);
bc0c38d1 3031
8bba1bf5
MM
3032 /* Notify the tracer early; before we stop tracing. */
3033 if (iter->trace && iter->trace->open)
a93751ca 3034 iter->trace->open(iter);
8bba1bf5 3035
12ef7d44 3036 /* Annotate start of buffers if we had overruns */
12883efb 3037 if (ring_buffer_overruns(iter->trace_buffer->buffer))
12ef7d44
SR
3038 iter->iter_flags |= TRACE_FILE_ANNOTATE;
3039
8be0709f 3040 /* Output in nanoseconds only if we are using a clock in nanoseconds. */
58e8eedf 3041 if (trace_clocks[tr->clock_id].in_ns)
8be0709f
DS
3042 iter->iter_flags |= TRACE_FILE_TIME_IN_NS;
3043
debdd57f
HT
3044 /* stop the trace while dumping if we are not opening "snapshot" */
3045 if (!iter->snapshot)
2b6080f2 3046 tracing_stop_tr(tr);
2f26ebd5 3047
ae3b5093 3048 if (iter->cpu_file == RING_BUFFER_ALL_CPUS) {
b04cc6b1 3049 for_each_tracing_cpu(cpu) {
b04cc6b1 3050 iter->buffer_iter[cpu] =
12883efb 3051 ring_buffer_read_prepare(iter->trace_buffer->buffer, cpu);
72c9ddfd
DM
3052 }
3053 ring_buffer_read_prepare_sync();
3054 for_each_tracing_cpu(cpu) {
3055 ring_buffer_read_start(iter->buffer_iter[cpu]);
2f26ebd5 3056 tracing_iter_reset(iter, cpu);
b04cc6b1
FW
3057 }
3058 } else {
3059 cpu = iter->cpu_file;
3928a8a2 3060 iter->buffer_iter[cpu] =
12883efb 3061 ring_buffer_read_prepare(iter->trace_buffer->buffer, cpu);
72c9ddfd
DM
3062 ring_buffer_read_prepare_sync();
3063 ring_buffer_read_start(iter->buffer_iter[cpu]);
2f26ebd5 3064 tracing_iter_reset(iter, cpu);
3928a8a2
SR
3065 }
3066
bc0c38d1
SR
3067 mutex_unlock(&trace_types_lock);
3068
bc0c38d1 3069 return iter;
3928a8a2 3070
d7350c3f 3071 fail:
3928a8a2 3072 mutex_unlock(&trace_types_lock);
d7350c3f 3073 kfree(iter->trace);
6d158a81 3074 kfree(iter->buffer_iter);
93574fcc 3075release:
50e18b94
JO
3076 seq_release_private(inode, file);
3077 return ERR_PTR(-ENOMEM);
bc0c38d1
SR
3078}
3079
3080int tracing_open_generic(struct inode *inode, struct file *filp)
3081{
60a11774
SR
3082 if (tracing_disabled)
3083 return -ENODEV;
3084
bc0c38d1
SR
3085 filp->private_data = inode->i_private;
3086 return 0;
3087}
3088
2e86421d
GB
3089bool tracing_is_disabled(void)
3090{
3091 return (tracing_disabled) ? true: false;
3092}
3093
7b85af63
SRRH
3094/*
3095 * Open and update trace_array ref count.
3096 * Must have the current trace_array passed to it.
3097 */
dcc30223 3098static int tracing_open_generic_tr(struct inode *inode, struct file *filp)
7b85af63
SRRH
3099{
3100 struct trace_array *tr = inode->i_private;
3101
3102 if (tracing_disabled)
3103 return -ENODEV;
3104
3105 if (trace_array_get(tr) < 0)
3106 return -ENODEV;
3107
3108 filp->private_data = inode->i_private;
3109
3110 return 0;
7b85af63
SRRH
3111}
3112
4fd27358 3113static int tracing_release(struct inode *inode, struct file *file)
bc0c38d1 3114{
6484c71c 3115 struct trace_array *tr = inode->i_private;
907f2784 3116 struct seq_file *m = file->private_data;
4acd4d00 3117 struct trace_iterator *iter;
3928a8a2 3118 int cpu;
bc0c38d1 3119
ff451961 3120 if (!(file->f_mode & FMODE_READ)) {
6484c71c 3121 trace_array_put(tr);
4acd4d00 3122 return 0;
ff451961 3123 }
4acd4d00 3124
6484c71c 3125 /* Writes do not use seq_file */
4acd4d00 3126 iter = m->private;
bc0c38d1 3127 mutex_lock(&trace_types_lock);
a695cb58 3128
3928a8a2
SR
3129 for_each_tracing_cpu(cpu) {
3130 if (iter->buffer_iter[cpu])
3131 ring_buffer_read_finish(iter->buffer_iter[cpu]);
3132 }
3133
bc0c38d1
SR
3134 if (iter->trace && iter->trace->close)
3135 iter->trace->close(iter);
3136
debdd57f
HT
3137 if (!iter->snapshot)
3138 /* reenable tracing if it was previously enabled */
2b6080f2 3139 tracing_start_tr(tr);
f77d09a3
AL
3140
3141 __trace_array_put(tr);
3142
bc0c38d1
SR
3143 mutex_unlock(&trace_types_lock);
3144
d7350c3f 3145 mutex_destroy(&iter->mutex);
b0dfa978 3146 free_cpumask_var(iter->started);
d7350c3f 3147 kfree(iter->trace);
6d158a81 3148 kfree(iter->buffer_iter);
50e18b94 3149 seq_release_private(inode, file);
ff451961 3150
bc0c38d1
SR
3151 return 0;
3152}
3153
7b85af63
SRRH
3154static int tracing_release_generic_tr(struct inode *inode, struct file *file)
3155{
3156 struct trace_array *tr = inode->i_private;
3157
3158 trace_array_put(tr);
bc0c38d1
SR
3159 return 0;
3160}
3161
7b85af63
SRRH
3162static int tracing_single_release_tr(struct inode *inode, struct file *file)
3163{
3164 struct trace_array *tr = inode->i_private;
3165
3166 trace_array_put(tr);
3167
3168 return single_release(inode, file);
3169}
3170
bc0c38d1
SR
3171static int tracing_open(struct inode *inode, struct file *file)
3172{
6484c71c 3173 struct trace_array *tr = inode->i_private;
85a2f9b4
SR
3174 struct trace_iterator *iter;
3175 int ret = 0;
bc0c38d1 3176
ff451961
SRRH
3177 if (trace_array_get(tr) < 0)
3178 return -ENODEV;
3179
4acd4d00 3180 /* If this file was open for write, then erase contents */
6484c71c
ON
3181 if ((file->f_mode & FMODE_WRITE) && (file->f_flags & O_TRUNC)) {
3182 int cpu = tracing_get_cpu(inode);
3183
3184 if (cpu == RING_BUFFER_ALL_CPUS)
12883efb 3185 tracing_reset_online_cpus(&tr->trace_buffer);
4acd4d00 3186 else
6484c71c 3187 tracing_reset(&tr->trace_buffer, cpu);
4acd4d00 3188 }
bc0c38d1 3189
4acd4d00 3190 if (file->f_mode & FMODE_READ) {
6484c71c 3191 iter = __tracing_open(inode, file, false);
4acd4d00
SR
3192 if (IS_ERR(iter))
3193 ret = PTR_ERR(iter);
3194 else if (trace_flags & TRACE_ITER_LATENCY_FMT)
3195 iter->iter_flags |= TRACE_FILE_LAT_FMT;
3196 }
ff451961
SRRH
3197
3198 if (ret < 0)
3199 trace_array_put(tr);
3200
bc0c38d1
SR
3201 return ret;
3202}
3203
607e2ea1
SRRH
3204/*
3205 * Some tracers are not suitable for instance buffers.
3206 * A tracer is always available for the global array (toplevel)
3207 * or if it explicitly states that it is.
3208 */
3209static bool
3210trace_ok_for_array(struct tracer *t, struct trace_array *tr)
3211{
3212 return (tr->flags & TRACE_ARRAY_FL_GLOBAL) || t->allow_instances;
3213}
3214
3215/* Find the next tracer that this trace array may use */
3216static struct tracer *
3217get_tracer_for_array(struct trace_array *tr, struct tracer *t)
3218{
3219 while (t && !trace_ok_for_array(t, tr))
3220 t = t->next;
3221
3222 return t;
3223}
3224
e309b41d 3225static void *
bc0c38d1
SR
3226t_next(struct seq_file *m, void *v, loff_t *pos)
3227{
607e2ea1 3228 struct trace_array *tr = m->private;
f129e965 3229 struct tracer *t = v;
bc0c38d1
SR
3230
3231 (*pos)++;
3232
3233 if (t)
607e2ea1 3234 t = get_tracer_for_array(tr, t->next);
bc0c38d1 3235
bc0c38d1
SR
3236 return t;
3237}
3238
3239static void *t_start(struct seq_file *m, loff_t *pos)
3240{
607e2ea1 3241 struct trace_array *tr = m->private;
f129e965 3242 struct tracer *t;
bc0c38d1
SR
3243 loff_t l = 0;
3244
3245 mutex_lock(&trace_types_lock);
607e2ea1
SRRH
3246
3247 t = get_tracer_for_array(tr, trace_types);
3248 for (; t && l < *pos; t = t_next(m, t, &l))
3249 ;
bc0c38d1
SR
3250
3251 return t;
3252}
3253
3254static void t_stop(struct seq_file *m, void *p)
3255{
3256 mutex_unlock(&trace_types_lock);
3257}
3258
3259static int t_show(struct seq_file *m, void *v)
3260{
3261 struct tracer *t = v;
3262
3263 if (!t)
3264 return 0;
3265
fa6f0cc7 3266 seq_puts(m, t->name);
bc0c38d1
SR
3267 if (t->next)
3268 seq_putc(m, ' ');
3269 else
3270 seq_putc(m, '\n');
3271
3272 return 0;
3273}
3274
88e9d34c 3275static const struct seq_operations show_traces_seq_ops = {
4bf39a94
IM
3276 .start = t_start,
3277 .next = t_next,
3278 .stop = t_stop,
3279 .show = t_show,
bc0c38d1
SR
3280};
3281
3282static int show_traces_open(struct inode *inode, struct file *file)
3283{
607e2ea1
SRRH
3284 struct trace_array *tr = inode->i_private;
3285 struct seq_file *m;
3286 int ret;
3287
60a11774
SR
3288 if (tracing_disabled)
3289 return -ENODEV;
3290
607e2ea1
SRRH
3291 ret = seq_open(file, &show_traces_seq_ops);
3292 if (ret)
3293 return ret;
3294
3295 m = file->private_data;
3296 m->private = tr;
3297
3298 return 0;
bc0c38d1
SR
3299}
3300
4acd4d00
SR
3301static ssize_t
3302tracing_write_stub(struct file *filp, const char __user *ubuf,
3303 size_t count, loff_t *ppos)
3304{
3305 return count;
3306}
3307
098c879e 3308loff_t tracing_lseek(struct file *file, loff_t offset, int whence)
364829b1 3309{
098c879e
SRRH
3310 int ret;
3311
364829b1 3312 if (file->f_mode & FMODE_READ)
098c879e 3313 ret = seq_lseek(file, offset, whence);
364829b1 3314 else
098c879e
SRRH
3315 file->f_pos = ret = 0;
3316
3317 return ret;
364829b1
SP
3318}
3319
5e2336a0 3320static const struct file_operations tracing_fops = {
4bf39a94
IM
3321 .open = tracing_open,
3322 .read = seq_read,
4acd4d00 3323 .write = tracing_write_stub,
098c879e 3324 .llseek = tracing_lseek,
4bf39a94 3325 .release = tracing_release,
bc0c38d1
SR
3326};
3327
5e2336a0 3328static const struct file_operations show_traces_fops = {
c7078de1
IM
3329 .open = show_traces_open,
3330 .read = seq_read,
3331 .release = seq_release,
b444786f 3332 .llseek = seq_lseek,
c7078de1
IM
3333};
3334
36dfe925
IM
3335/*
3336 * The tracer itself will not take this lock, but still we want
3337 * to provide a consistent cpumask to user-space:
3338 */
3339static DEFINE_MUTEX(tracing_cpumask_update_lock);
3340
3341/*
3342 * Temporary storage for the character representation of the
3343 * CPU bitmask (and one more byte for the newline):
3344 */
3345static char mask_str[NR_CPUS + 1];
3346
c7078de1
IM
3347static ssize_t
3348tracing_cpumask_read(struct file *filp, char __user *ubuf,
3349 size_t count, loff_t *ppos)
3350{
ccfe9e42 3351 struct trace_array *tr = file_inode(filp)->i_private;
36dfe925 3352 int len;
c7078de1
IM
3353
3354 mutex_lock(&tracing_cpumask_update_lock);
36dfe925 3355
ccfe9e42 3356 len = cpumask_scnprintf(mask_str, count, tr->tracing_cpumask);
36dfe925
IM
3357 if (count - len < 2) {
3358 count = -EINVAL;
3359 goto out_err;
3360 }
3361 len += sprintf(mask_str + len, "\n");
3362 count = simple_read_from_buffer(ubuf, count, ppos, mask_str, NR_CPUS+1);
3363
3364out_err:
c7078de1
IM
3365 mutex_unlock(&tracing_cpumask_update_lock);
3366
3367 return count;
3368}
3369
3370static ssize_t
3371tracing_cpumask_write(struct file *filp, const char __user *ubuf,
3372 size_t count, loff_t *ppos)
3373{
ccfe9e42 3374 struct trace_array *tr = file_inode(filp)->i_private;
9e01c1b7 3375 cpumask_var_t tracing_cpumask_new;
2b6080f2 3376 int err, cpu;
9e01c1b7
RR
3377
3378 if (!alloc_cpumask_var(&tracing_cpumask_new, GFP_KERNEL))
3379 return -ENOMEM;
c7078de1 3380
9e01c1b7 3381 err = cpumask_parse_user(ubuf, count, tracing_cpumask_new);
c7078de1 3382 if (err)
36dfe925
IM
3383 goto err_unlock;
3384
215368e8
LZ
3385 mutex_lock(&tracing_cpumask_update_lock);
3386
a5e25883 3387 local_irq_disable();
0b9b12c1 3388 arch_spin_lock(&tr->max_lock);
ab46428c 3389 for_each_tracing_cpu(cpu) {
36dfe925
IM
3390 /*
3391 * Increase/decrease the disabled counter if we are
3392 * about to flip a bit in the cpumask:
3393 */
ccfe9e42 3394 if (cpumask_test_cpu(cpu, tr->tracing_cpumask) &&
9e01c1b7 3395 !cpumask_test_cpu(cpu, tracing_cpumask_new)) {
12883efb
SRRH
3396 atomic_inc(&per_cpu_ptr(tr->trace_buffer.data, cpu)->disabled);
3397 ring_buffer_record_disable_cpu(tr->trace_buffer.buffer, cpu);
36dfe925 3398 }
ccfe9e42 3399 if (!cpumask_test_cpu(cpu, tr->tracing_cpumask) &&
9e01c1b7 3400 cpumask_test_cpu(cpu, tracing_cpumask_new)) {
12883efb
SRRH
3401 atomic_dec(&per_cpu_ptr(tr->trace_buffer.data, cpu)->disabled);
3402 ring_buffer_record_enable_cpu(tr->trace_buffer.buffer, cpu);
36dfe925
IM
3403 }
3404 }
0b9b12c1 3405 arch_spin_unlock(&tr->max_lock);
a5e25883 3406 local_irq_enable();
36dfe925 3407
ccfe9e42 3408 cpumask_copy(tr->tracing_cpumask, tracing_cpumask_new);
36dfe925
IM
3409
3410 mutex_unlock(&tracing_cpumask_update_lock);
9e01c1b7 3411 free_cpumask_var(tracing_cpumask_new);
c7078de1
IM
3412
3413 return count;
36dfe925
IM
3414
3415err_unlock:
215368e8 3416 free_cpumask_var(tracing_cpumask_new);
36dfe925
IM
3417
3418 return err;
c7078de1
IM
3419}
3420
5e2336a0 3421static const struct file_operations tracing_cpumask_fops = {
ccfe9e42 3422 .open = tracing_open_generic_tr,
c7078de1
IM
3423 .read = tracing_cpumask_read,
3424 .write = tracing_cpumask_write,
ccfe9e42 3425 .release = tracing_release_generic_tr,
b444786f 3426 .llseek = generic_file_llseek,
bc0c38d1
SR
3427};
3428
fdb372ed 3429static int tracing_trace_options_show(struct seq_file *m, void *v)
bc0c38d1 3430{
d8e83d26 3431 struct tracer_opt *trace_opts;
2b6080f2 3432 struct trace_array *tr = m->private;
d8e83d26 3433 u32 tracer_flags;
d8e83d26 3434 int i;
adf9f195 3435
d8e83d26 3436 mutex_lock(&trace_types_lock);
2b6080f2
SR
3437 tracer_flags = tr->current_trace->flags->val;
3438 trace_opts = tr->current_trace->flags->opts;
d8e83d26 3439
bc0c38d1
SR
3440 for (i = 0; trace_options[i]; i++) {
3441 if (trace_flags & (1 << i))
fdb372ed 3442 seq_printf(m, "%s\n", trace_options[i]);
bc0c38d1 3443 else
fdb372ed 3444 seq_printf(m, "no%s\n", trace_options[i]);
bc0c38d1
SR
3445 }
3446
adf9f195
FW
3447 for (i = 0; trace_opts[i].name; i++) {
3448 if (tracer_flags & trace_opts[i].bit)
fdb372ed 3449 seq_printf(m, "%s\n", trace_opts[i].name);
adf9f195 3450 else
fdb372ed 3451 seq_printf(m, "no%s\n", trace_opts[i].name);
adf9f195 3452 }
d8e83d26 3453 mutex_unlock(&trace_types_lock);
adf9f195 3454
fdb372ed 3455 return 0;
bc0c38d1 3456}
bc0c38d1 3457
8c1a49ae 3458static int __set_tracer_option(struct trace_array *tr,
8d18eaaf
LZ
3459 struct tracer_flags *tracer_flags,
3460 struct tracer_opt *opts, int neg)
3461{
8c1a49ae 3462 struct tracer *trace = tr->current_trace;
8d18eaaf 3463 int ret;
bc0c38d1 3464
8c1a49ae 3465 ret = trace->set_flag(tr, tracer_flags->val, opts->bit, !neg);
8d18eaaf
LZ
3466 if (ret)
3467 return ret;
3468
3469 if (neg)
3470 tracer_flags->val &= ~opts->bit;
3471 else
3472 tracer_flags->val |= opts->bit;
3473 return 0;
bc0c38d1
SR
3474}
3475
adf9f195 3476/* Try to assign a tracer specific option */
8c1a49ae 3477static int set_tracer_option(struct trace_array *tr, char *cmp, int neg)
adf9f195 3478{
8c1a49ae 3479 struct tracer *trace = tr->current_trace;
7770841e 3480 struct tracer_flags *tracer_flags = trace->flags;
adf9f195 3481 struct tracer_opt *opts = NULL;
8d18eaaf 3482 int i;
adf9f195 3483
7770841e
Z
3484 for (i = 0; tracer_flags->opts[i].name; i++) {
3485 opts = &tracer_flags->opts[i];
adf9f195 3486
8d18eaaf 3487 if (strcmp(cmp, opts->name) == 0)
8c1a49ae 3488 return __set_tracer_option(tr, trace->flags, opts, neg);
adf9f195 3489 }
adf9f195 3490
8d18eaaf 3491 return -EINVAL;
adf9f195
FW
3492}
3493
613f04a0
SRRH
3494/* Some tracers require overwrite to stay enabled */
3495int trace_keep_overwrite(struct tracer *tracer, u32 mask, int set)
3496{
3497 if (tracer->enabled && (mask & TRACE_ITER_OVERWRITE) && !set)
3498 return -1;
3499
3500 return 0;
3501}
3502
2b6080f2 3503int set_tracer_flag(struct trace_array *tr, unsigned int mask, int enabled)
af4617bd
SR
3504{
3505 /* do nothing if flag is already set */
3506 if (!!(trace_flags & mask) == !!enabled)
613f04a0
SRRH
3507 return 0;
3508
3509 /* Give the tracer a chance to approve the change */
2b6080f2 3510 if (tr->current_trace->flag_changed)
bf6065b5 3511 if (tr->current_trace->flag_changed(tr, mask, !!enabled))
613f04a0 3512 return -EINVAL;
af4617bd
SR
3513
3514 if (enabled)
3515 trace_flags |= mask;
3516 else
3517 trace_flags &= ~mask;
e870e9a1
LZ
3518
3519 if (mask == TRACE_ITER_RECORD_CMD)
3520 trace_event_enable_cmd_record(enabled);
750912fa 3521
80902822 3522 if (mask == TRACE_ITER_OVERWRITE) {
12883efb 3523 ring_buffer_change_overwrite(tr->trace_buffer.buffer, enabled);
80902822 3524#ifdef CONFIG_TRACER_MAX_TRACE
12883efb 3525 ring_buffer_change_overwrite(tr->max_buffer.buffer, enabled);
80902822
SRRH
3526#endif
3527 }
81698831
SR
3528
3529 if (mask == TRACE_ITER_PRINTK)
3530 trace_printk_start_stop_comm(enabled);
613f04a0
SRRH
3531
3532 return 0;
af4617bd
SR
3533}
3534
2b6080f2 3535static int trace_set_options(struct trace_array *tr, char *option)
bc0c38d1 3536{
8d18eaaf 3537 char *cmp;
bc0c38d1 3538 int neg = 0;
613f04a0 3539 int ret = -ENODEV;
bc0c38d1
SR
3540 int i;
3541
7bcfaf54 3542 cmp = strstrip(option);
bc0c38d1 3543
8d18eaaf 3544 if (strncmp(cmp, "no", 2) == 0) {
bc0c38d1
SR
3545 neg = 1;
3546 cmp += 2;
3547 }
3548
69d34da2
SRRH
3549 mutex_lock(&trace_types_lock);
3550
bc0c38d1 3551 for (i = 0; trace_options[i]; i++) {
8d18eaaf 3552 if (strcmp(cmp, trace_options[i]) == 0) {
2b6080f2 3553 ret = set_tracer_flag(tr, 1 << i, !neg);
bc0c38d1
SR
3554 break;
3555 }
3556 }
adf9f195
FW
3557
3558 /* If no option could be set, test the specific tracer options */
69d34da2 3559 if (!trace_options[i])
8c1a49ae 3560 ret = set_tracer_option(tr, cmp, neg);
69d34da2
SRRH
3561
3562 mutex_unlock(&trace_types_lock);
bc0c38d1 3563
7bcfaf54
SR
3564 return ret;
3565}
3566
3567static ssize_t
3568tracing_trace_options_write(struct file *filp, const char __user *ubuf,
3569 size_t cnt, loff_t *ppos)
3570{
2b6080f2
SR
3571 struct seq_file *m = filp->private_data;
3572 struct trace_array *tr = m->private;
7bcfaf54 3573 char buf[64];
613f04a0 3574 int ret;
7bcfaf54
SR
3575
3576 if (cnt >= sizeof(buf))
3577 return -EINVAL;
3578
3579 if (copy_from_user(&buf, ubuf, cnt))
3580 return -EFAULT;
3581
a8dd2176
SR
3582 buf[cnt] = 0;
3583
2b6080f2 3584 ret = trace_set_options(tr, buf);
613f04a0
SRRH
3585 if (ret < 0)
3586 return ret;
7bcfaf54 3587
cf8517cf 3588 *ppos += cnt;
bc0c38d1
SR
3589
3590 return cnt;
3591}
3592
fdb372ed
LZ
3593static int tracing_trace_options_open(struct inode *inode, struct file *file)
3594{
7b85af63 3595 struct trace_array *tr = inode->i_private;
f77d09a3 3596 int ret;
7b85af63 3597
fdb372ed
LZ
3598 if (tracing_disabled)
3599 return -ENODEV;
2b6080f2 3600
7b85af63
SRRH
3601 if (trace_array_get(tr) < 0)
3602 return -ENODEV;
3603
f77d09a3
AL
3604 ret = single_open(file, tracing_trace_options_show, inode->i_private);
3605 if (ret < 0)
3606 trace_array_put(tr);
3607
3608 return ret;
fdb372ed
LZ
3609}
3610
5e2336a0 3611static const struct file_operations tracing_iter_fops = {
fdb372ed
LZ
3612 .open = tracing_trace_options_open,
3613 .read = seq_read,
3614 .llseek = seq_lseek,
7b85af63 3615 .release = tracing_single_release_tr,
ee6bce52 3616 .write = tracing_trace_options_write,
bc0c38d1
SR
3617};
3618
7bd2f24c
IM
/*
 * Help text returned by tracing_readme_read(). Sections are compiled in
 * or out according to the tracing features that are configured.
 */
static const char readme_msg[] =
	"tracing mini-HOWTO:\n\n"
	"# echo 0 > tracing_on : quick way to disable tracing\n"
	"# echo 1 > tracing_on : quick way to re-enable tracing\n\n"
	" Important files:\n"
	" trace\t\t\t- The static contents of the buffer\n"
	"\t\t\t To clear the buffer write into this file: echo > trace\n"
	" trace_pipe\t\t- A consuming read to see the contents of the buffer\n"
	" current_tracer\t- function and latency tracers\n"
	" available_tracers\t- list of configured tracers for current_tracer\n"
	" buffer_size_kb\t- view and modify size of per cpu buffer\n"
	" buffer_total_size_kb - view total size of all cpu buffers\n\n"
	" trace_clock\t\t-change the clock used to order events\n"
	" local: Per cpu clock but may not be synced across CPUs\n"
	" global: Synced across CPUs but slows tracing down.\n"
	" counter: Not a clock, but just an increment\n"
	" uptime: Jiffy counter from time of boot\n"
	" perf: Same clock that perf events use\n"
#ifdef CONFIG_X86_64
	" x86-tsc: TSC cycle counter\n"
#endif
	"\n trace_marker\t\t- Writes into this file writes into the kernel buffer\n"
	" tracing_cpumask\t- Limit which CPUs to trace\n"
	" instances\t\t- Make sub-buffers with: mkdir instances/foo\n"
	"\t\t\t Remove sub-buffer with rmdir\n"
	" trace_options\t\t- Set format or modify how tracing happens\n"
	/* "no" goes in front of the name: trace_set_options() strips it there */
	"\t\t\t Disable an option by adding a prefix 'no' to the\n"
	"\t\t\t option name\n"
	" saved_cmdlines_size\t- echo command number in here to store comm-pid list\n"
#ifdef CONFIG_DYNAMIC_FTRACE
	"\n available_filter_functions - list of functions that can be filtered on\n"
	" set_ftrace_filter\t- echo function name in here to only trace these\n"
	"\t\t\t functions\n"
	"\t accepts: func_full_name, *func_end, func_begin*, *func_middle*\n"
	"\t modules: Can select a group via module\n"
	"\t Format: :mod:<module-name>\n"
	"\t example: echo :mod:ext3 > set_ftrace_filter\n"
	"\t triggers: a command to perform when function is hit\n"
	"\t Format: <function>:<trigger>[:count]\n"
	"\t trigger: traceon, traceoff\n"
	"\t\t enable_event:<system>:<event>\n"
	"\t\t disable_event:<system>:<event>\n"
#ifdef CONFIG_STACKTRACE
	"\t\t stacktrace\n"
#endif
#ifdef CONFIG_TRACER_SNAPSHOT
	"\t\t snapshot\n"
#endif
	"\t\t dump\n"
	"\t\t cpudump\n"
	"\t example: echo do_fault:traceoff > set_ftrace_filter\n"
	"\t echo do_trap:traceoff:3 > set_ftrace_filter\n"
	"\t The first one will disable tracing every time do_fault is hit\n"
	"\t The second will disable tracing at most 3 times when do_trap is hit\n"
	"\t The first time do trap is hit and it disables tracing, the\n"
	"\t counter will decrement to 2. If tracing is already disabled,\n"
	"\t the counter will not decrement. It only decrements when the\n"
	"\t trigger did work\n"
	"\t To remove trigger without count:\n"
	"\t echo '!<function>:<trigger>' > set_ftrace_filter\n"
	"\t To remove trigger with a count:\n"
	"\t echo '!<function>:<trigger>:0' > set_ftrace_filter\n"
	" set_ftrace_notrace\t- echo function name in here to never trace.\n"
	"\t accepts: func_full_name, *func_end, func_begin*, *func_middle*\n"
	"\t modules: Can select a group via module command :mod:\n"
	"\t Does not accept triggers\n"
#endif /* CONFIG_DYNAMIC_FTRACE */
#ifdef CONFIG_FUNCTION_TRACER
	" set_ftrace_pid\t- Write pid(s) to only function trace those pids\n"
	"\t\t (function)\n"
#endif
#ifdef CONFIG_FUNCTION_GRAPH_TRACER
	" set_graph_function\t- Trace the nested calls of a function (function_graph)\n"
	" set_graph_notrace\t- Do not trace the nested calls of a function (function_graph)\n"
	" max_graph_depth\t- Trace a limited depth of nested calls (0 is unlimited)\n"
#endif
#ifdef CONFIG_TRACER_SNAPSHOT
	"\n snapshot\t\t- Like 'trace' but shows the content of the static\n"
	"\t\t\t snapshot buffer. Read the contents for more\n"
	"\t\t\t information\n"
#endif
#ifdef CONFIG_STACK_TRACER
	" stack_trace\t\t- Shows the max stack trace when active\n"
	" stack_max_size\t- Shows current max stack size that was traced\n"
	"\t\t\t Write into this file to reset the max size (trigger a\n"
	"\t\t\t new trace)\n"
#ifdef CONFIG_DYNAMIC_FTRACE
	" stack_trace_filter\t- Like set_ftrace_filter but limits what stack_trace\n"
	"\t\t\t traces\n"
#endif
#endif /* CONFIG_STACK_TRACER */
	" events/\t\t- Directory containing all trace event subsystems:\n"
	" enable\t\t- Write 0/1 to enable/disable tracing of all events\n"
	" events/<system>/\t- Directory containing all trace events for <system>:\n"
	" enable\t\t- Write 0/1 to enable/disable tracing of all <system>\n"
	"\t\t\t events\n"
	" filter\t\t- If set, only events passing filter are traced\n"
	" events/<system>/<event>/\t- Directory containing control files for\n"
	"\t\t\t <event>:\n"
	" enable\t\t- Write 0/1 to enable/disable tracing of <event>\n"
	" filter\t\t- If set, only events passing filter are traced\n"
	" trigger\t\t- If set, a command to perform when event is hit\n"
	"\t Format: <trigger>[:count][if <filter>]\n"
	"\t trigger: traceon, traceoff\n"
	"\t enable_event:<system>:<event>\n"
	"\t disable_event:<system>:<event>\n"
#ifdef CONFIG_STACKTRACE
	"\t\t stacktrace\n"
#endif
#ifdef CONFIG_TRACER_SNAPSHOT
	"\t\t snapshot\n"
#endif
	"\t example: echo traceoff > events/block/block_unplug/trigger\n"
	"\t echo traceoff:3 > events/block/block_unplug/trigger\n"
	"\t echo 'enable_event:kmem:kmalloc:3 if nr_rq > 1' > \\\n"
	"\t events/block/block_unplug/trigger\n"
	"\t The first disables tracing every time block_unplug is hit.\n"
	"\t The second disables tracing the first 3 times block_unplug is hit.\n"
	"\t The third enables the kmalloc event the first 3 times block_unplug\n"
	"\t is hit and has value of greater than 1 for the 'nr_rq' event field.\n"
	"\t Like function triggers, the counter is only decremented if it\n"
	"\t enabled or disabled tracing.\n"
	"\t To remove a trigger without a count:\n"
	"\t echo '!<trigger>' > <system>/<event>/trigger\n"
	"\t To remove a trigger with a count:\n"
	"\t echo '!<trigger>:0' > <system>/<event>/trigger\n"
	"\t Filters can be ignored when removing a trigger.\n"
;
3747
3748static ssize_t
3749tracing_readme_read(struct file *filp, char __user *ubuf,
3750 size_t cnt, loff_t *ppos)
3751{
3752 return simple_read_from_buffer(ubuf, cnt, ppos,
3753 readme_msg, strlen(readme_msg));
3754}
3755
5e2336a0 3756static const struct file_operations tracing_readme_fops = {
c7078de1
IM
3757 .open = tracing_open_generic,
3758 .read = tracing_readme_read,
b444786f 3759 .llseek = generic_file_llseek,
7bd2f24c
IM
3760};
3761
42584c81
YY
3762static void *saved_cmdlines_next(struct seq_file *m, void *v, loff_t *pos)
3763{
3764 unsigned int *ptr = v;
69abe6a5 3765
42584c81
YY
3766 if (*pos || m->count)
3767 ptr++;
69abe6a5 3768
42584c81 3769 (*pos)++;
69abe6a5 3770
939c7a4f
YY
3771 for (; ptr < &savedcmd->map_cmdline_to_pid[savedcmd->cmdline_num];
3772 ptr++) {
42584c81
YY
3773 if (*ptr == -1 || *ptr == NO_CMDLINE_MAP)
3774 continue;
69abe6a5 3775
42584c81
YY
3776 return ptr;
3777 }
69abe6a5 3778
42584c81
YY
3779 return NULL;
3780}
3781
3782static void *saved_cmdlines_start(struct seq_file *m, loff_t *pos)
3783{
3784 void *v;
3785 loff_t l = 0;
69abe6a5 3786
4c27e756
SRRH
3787 preempt_disable();
3788 arch_spin_lock(&trace_cmdline_lock);
3789
939c7a4f 3790 v = &savedcmd->map_cmdline_to_pid[0];
42584c81
YY
3791 while (l <= *pos) {
3792 v = saved_cmdlines_next(m, v, &l);
3793 if (!v)
3794 return NULL;
69abe6a5
AP
3795 }
3796
42584c81
YY
3797 return v;
3798}
3799
3800static void saved_cmdlines_stop(struct seq_file *m, void *v)
3801{
4c27e756
SRRH
3802 arch_spin_unlock(&trace_cmdline_lock);
3803 preempt_enable();
42584c81 3804}
69abe6a5 3805
42584c81
YY
3806static int saved_cmdlines_show(struct seq_file *m, void *v)
3807{
3808 char buf[TASK_COMM_LEN];
3809 unsigned int *pid = v;
69abe6a5 3810
4c27e756 3811 __trace_find_cmdline(*pid, buf);
42584c81
YY
3812 seq_printf(m, "%d %s\n", *pid, buf);
3813 return 0;
3814}
3815
3816static const struct seq_operations tracing_saved_cmdlines_seq_ops = {
3817 .start = saved_cmdlines_start,
3818 .next = saved_cmdlines_next,
3819 .stop = saved_cmdlines_stop,
3820 .show = saved_cmdlines_show,
3821};
3822
3823static int tracing_saved_cmdlines_open(struct inode *inode, struct file *filp)
3824{
3825 if (tracing_disabled)
3826 return -ENODEV;
3827
3828 return seq_open(filp, &tracing_saved_cmdlines_seq_ops);
69abe6a5
AP
3829}
3830
3831static const struct file_operations tracing_saved_cmdlines_fops = {
42584c81
YY
3832 .open = tracing_saved_cmdlines_open,
3833 .read = seq_read,
3834 .llseek = seq_lseek,
3835 .release = seq_release,
69abe6a5
AP
3836};
3837
939c7a4f
YY
3838static ssize_t
3839tracing_saved_cmdlines_size_read(struct file *filp, char __user *ubuf,
3840 size_t cnt, loff_t *ppos)
3841{
3842 char buf[64];
3843 int r;
3844
3845 arch_spin_lock(&trace_cmdline_lock);
a6af8fbf 3846 r = scnprintf(buf, sizeof(buf), "%u\n", savedcmd->cmdline_num);
939c7a4f
YY
3847 arch_spin_unlock(&trace_cmdline_lock);
3848
3849 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
3850}
3851
3852static void free_saved_cmdlines_buffer(struct saved_cmdlines_buffer *s)
3853{
3854 kfree(s->saved_cmdlines);
3855 kfree(s->map_cmdline_to_pid);
3856 kfree(s);
3857}
3858
3859static int tracing_resize_saved_cmdlines(unsigned int val)
3860{
3861 struct saved_cmdlines_buffer *s, *savedcmd_temp;
3862
a6af8fbf 3863 s = kmalloc(sizeof(*s), GFP_KERNEL);
939c7a4f
YY
3864 if (!s)
3865 return -ENOMEM;
3866
3867 if (allocate_cmdlines_buffer(val, s) < 0) {
3868 kfree(s);
3869 return -ENOMEM;
3870 }
3871
3872 arch_spin_lock(&trace_cmdline_lock);
3873 savedcmd_temp = savedcmd;
3874 savedcmd = s;
3875 arch_spin_unlock(&trace_cmdline_lock);
3876 free_saved_cmdlines_buffer(savedcmd_temp);
3877
3878 return 0;
3879}
3880
3881static ssize_t
3882tracing_saved_cmdlines_size_write(struct file *filp, const char __user *ubuf,
3883 size_t cnt, loff_t *ppos)
3884{
3885 unsigned long val;
3886 int ret;
3887
3888 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
3889 if (ret)
3890 return ret;
3891
3892 /* must have at least 1 entry or less than PID_MAX_DEFAULT */
3893 if (!val || val > PID_MAX_DEFAULT)
3894 return -EINVAL;
3895
3896 ret = tracing_resize_saved_cmdlines((unsigned int)val);
3897 if (ret < 0)
3898 return ret;
3899
3900 *ppos += cnt;
3901
3902 return cnt;
3903}
3904
3905static const struct file_operations tracing_saved_cmdlines_size_fops = {
3906 .open = tracing_open_generic,
3907 .read = tracing_saved_cmdlines_size_read,
3908 .write = tracing_saved_cmdlines_size_write,
3909};
3910
bc0c38d1
SR
3911static ssize_t
3912tracing_set_trace_read(struct file *filp, char __user *ubuf,
3913 size_t cnt, loff_t *ppos)
3914{
2b6080f2 3915 struct trace_array *tr = filp->private_data;
ee6c2c1b 3916 char buf[MAX_TRACER_SIZE+2];
bc0c38d1
SR
3917 int r;
3918
3919 mutex_lock(&trace_types_lock);
2b6080f2 3920 r = sprintf(buf, "%s\n", tr->current_trace->name);
bc0c38d1
SR
3921 mutex_unlock(&trace_types_lock);
3922
4bf39a94 3923 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
bc0c38d1
SR
3924}
3925
b6f11df2
ACM
3926int tracer_init(struct tracer *t, struct trace_array *tr)
3927{
12883efb 3928 tracing_reset_online_cpus(&tr->trace_buffer);
b6f11df2
ACM
3929 return t->init(tr);
3930}
3931
12883efb 3932static void set_buffer_entries(struct trace_buffer *buf, unsigned long val)
438ced17
VN
3933{
3934 int cpu;
737223fb 3935
438ced17 3936 for_each_tracing_cpu(cpu)
12883efb 3937 per_cpu_ptr(buf->data, cpu)->entries = val;
438ced17
VN
3938}
3939
#ifdef CONFIG_TRACER_MAX_TRACE
/*
 * Resize @trace_buf's ring buffer to the per-CPU entry counts recorded in
 * @size_buf, and copy those counts into @trace_buf's bookkeeping.
 *
 * @cpu_id selects a single CPU, or RING_BUFFER_ALL_CPUS to walk every
 * tracing CPU (stopping at the first failure).
 *
 * Returns 0 on success or the negative value from ring_buffer_resize().
 */
static int resize_buffer_duplicate_size(struct trace_buffer *trace_buf,
					struct trace_buffer *size_buf, int cpu_id)
{
	int cpu, ret = 0;

	/* Single CPU: resize it and record the new size only on success. */
	if (cpu_id != RING_BUFFER_ALL_CPUS) {
		ret = ring_buffer_resize(trace_buf->buffer,
			 per_cpu_ptr(size_buf->data, cpu_id)->entries, cpu_id);
		if (ret == 0) {
			per_cpu_ptr(trace_buf->data, cpu_id)->entries =
				per_cpu_ptr(size_buf->data, cpu_id)->entries;
		}
		return ret;
	}

	for_each_tracing_cpu(cpu) {
		ret = ring_buffer_resize(trace_buf->buffer,
			 per_cpu_ptr(size_buf->data, cpu)->entries, cpu);
		if (ret < 0)
			break;

		per_cpu_ptr(trace_buf->data, cpu)->entries =
			per_cpu_ptr(size_buf->data, cpu)->entries;
	}

	return ret;
}
#endif /* CONFIG_TRACER_MAX_TRACE */
d60da506 3967
2b6080f2
SR
3968static int __tracing_resize_ring_buffer(struct trace_array *tr,
3969 unsigned long size, int cpu)
73c5162a
SR
3970{
3971 int ret;
3972
3973 /*
3974 * If kernel or user changes the size of the ring buffer
a123c52b
SR
3975 * we use the size that was given, and we can forget about
3976 * expanding it later.
73c5162a 3977 */
55034cd6 3978 ring_buffer_expanded = true;
73c5162a 3979
b382ede6 3980 /* May be called before buffers are initialized */
12883efb 3981 if (!tr->trace_buffer.buffer)
b382ede6
SR
3982 return 0;
3983
12883efb 3984 ret = ring_buffer_resize(tr->trace_buffer.buffer, size, cpu);
73c5162a
SR
3985 if (ret < 0)
3986 return ret;
3987
12883efb 3988#ifdef CONFIG_TRACER_MAX_TRACE
2b6080f2
SR
3989 if (!(tr->flags & TRACE_ARRAY_FL_GLOBAL) ||
3990 !tr->current_trace->use_max_tr)
ef710e10
KM
3991 goto out;
3992
12883efb 3993 ret = ring_buffer_resize(tr->max_buffer.buffer, size, cpu);
73c5162a 3994 if (ret < 0) {
12883efb
SRRH
3995 int r = resize_buffer_duplicate_size(&tr->trace_buffer,
3996 &tr->trace_buffer, cpu);
73c5162a 3997 if (r < 0) {
a123c52b
SR
3998 /*
3999 * AARGH! We are left with different
4000 * size max buffer!!!!
4001 * The max buffer is our "snapshot" buffer.
4002 * When a tracer needs a snapshot (one of the
4003 * latency tracers), it swaps the max buffer
4004 * with the saved snap shot. We succeeded to
4005 * update the size of the main buffer, but failed to
4006 * update the size of the max buffer. But when we tried
4007 * to reset the main buffer to the original size, we
4008 * failed there too. This is very unlikely to
4009 * happen, but if it does, warn and kill all
4010 * tracing.
4011 */
73c5162a
SR
4012 WARN_ON(1);
4013 tracing_disabled = 1;
4014 }
4015 return ret;
4016 }
4017
438ced17 4018 if (cpu == RING_BUFFER_ALL_CPUS)
12883efb 4019 set_buffer_entries(&tr->max_buffer, size);
438ced17 4020 else
12883efb 4021 per_cpu_ptr(tr->max_buffer.data, cpu)->entries = size;
438ced17 4022
ef710e10 4023 out:
12883efb
SRRH
4024#endif /* CONFIG_TRACER_MAX_TRACE */
4025
438ced17 4026 if (cpu == RING_BUFFER_ALL_CPUS)
12883efb 4027 set_buffer_entries(&tr->trace_buffer, size);
438ced17 4028 else
12883efb 4029 per_cpu_ptr(tr->trace_buffer.data, cpu)->entries = size;
73c5162a
SR
4030
4031 return ret;
4032}
4033
2b6080f2
SR
4034static ssize_t tracing_resize_ring_buffer(struct trace_array *tr,
4035 unsigned long size, int cpu_id)
4f271a2a 4036{
83f40318 4037 int ret = size;
4f271a2a
VN
4038
4039 mutex_lock(&trace_types_lock);
4040
438ced17
VN
4041 if (cpu_id != RING_BUFFER_ALL_CPUS) {
4042 /* make sure, this cpu is enabled in the mask */
4043 if (!cpumask_test_cpu(cpu_id, tracing_buffer_mask)) {
4044 ret = -EINVAL;
4045 goto out;
4046 }
4047 }
4f271a2a 4048
2b6080f2 4049 ret = __tracing_resize_ring_buffer(tr, size, cpu_id);
4f271a2a
VN
4050 if (ret < 0)
4051 ret = -ENOMEM;
4052
438ced17 4053out:
4f271a2a
VN
4054 mutex_unlock(&trace_types_lock);
4055
4056 return ret;
4057}
4058
ef710e10 4059
1852fcce
SR
4060/**
4061 * tracing_update_buffers - used by tracing facility to expand ring buffers
4062 *
4063 * To save on memory when the tracing is never used on a system with it
4064 * configured in. The ring buffers are set to a minimum size. But once
4065 * a user starts to use the tracing facility, then they need to grow
4066 * to their default size.
4067 *
4068 * This function is to be called when a tracer is about to be used.
4069 */
4070int tracing_update_buffers(void)
4071{
4072 int ret = 0;
4073
1027fcb2 4074 mutex_lock(&trace_types_lock);
1852fcce 4075 if (!ring_buffer_expanded)
2b6080f2 4076 ret = __tracing_resize_ring_buffer(&global_trace, trace_buf_size,
438ced17 4077 RING_BUFFER_ALL_CPUS);
1027fcb2 4078 mutex_unlock(&trace_types_lock);
1852fcce
SR
4079
4080 return ret;
4081}
4082
577b785f
SR
/*
 * Forward declarations for the tracer option file helpers, which
 * tracing_set_tracer() calls before their definitions appear.
 */
struct trace_option_dentry;

static struct trace_option_dentry *
create_trace_option_files(struct trace_array *tr, struct tracer *tracer);

static void destroy_trace_option_files(struct trace_option_dentry *topts);
4090
6b450d25
SRRH
4091/*
4092 * Used to clear out the tracer before deletion of an instance.
4093 * Must have trace_types_lock held.
4094 */
4095static void tracing_set_nop(struct trace_array *tr)
4096{
4097 if (tr->current_trace == &nop_trace)
4098 return;
4099
50512ab5 4100 tr->current_trace->enabled--;
6b450d25
SRRH
4101
4102 if (tr->current_trace->reset)
4103 tr->current_trace->reset(tr);
4104
4105 tr->current_trace = &nop_trace;
4106}
4107
607e2ea1 4108static int tracing_set_tracer(struct trace_array *tr, const char *buf)
bc0c38d1 4109{
577b785f 4110 static struct trace_option_dentry *topts;
bc0c38d1 4111 struct tracer *t;
12883efb 4112#ifdef CONFIG_TRACER_MAX_TRACE
34600f0e 4113 bool had_max_tr;
12883efb 4114#endif
d9e54076 4115 int ret = 0;
bc0c38d1 4116
1027fcb2
SR
4117 mutex_lock(&trace_types_lock);
4118
73c5162a 4119 if (!ring_buffer_expanded) {
2b6080f2 4120 ret = __tracing_resize_ring_buffer(tr, trace_buf_size,
438ced17 4121 RING_BUFFER_ALL_CPUS);
73c5162a 4122 if (ret < 0)
59f586db 4123 goto out;
73c5162a
SR
4124 ret = 0;
4125 }
4126
bc0c38d1
SR
4127 for (t = trace_types; t; t = t->next) {
4128 if (strcmp(t->name, buf) == 0)
4129 break;
4130 }
c2931e05
FW
4131 if (!t) {
4132 ret = -EINVAL;
4133 goto out;
4134 }
2b6080f2 4135 if (t == tr->current_trace)
bc0c38d1
SR
4136 goto out;
4137
607e2ea1
SRRH
4138 /* Some tracers are only allowed for the top level buffer */
4139 if (!trace_ok_for_array(t, tr)) {
4140 ret = -EINVAL;
4141 goto out;
4142 }
4143
cf6ab6d9
SRRH
4144 /* If trace pipe files are being read, we can't change the tracer */
4145 if (tr->current_trace->ref) {
4146 ret = -EBUSY;
4147 goto out;
4148 }
4149
9f029e83 4150 trace_branch_disable();
613f04a0 4151
50512ab5 4152 tr->current_trace->enabled--;
613f04a0 4153
2b6080f2
SR
4154 if (tr->current_trace->reset)
4155 tr->current_trace->reset(tr);
34600f0e 4156
12883efb 4157 /* Current trace needs to be nop_trace before synchronize_sched */
2b6080f2 4158 tr->current_trace = &nop_trace;
34600f0e 4159
45ad21ca
SRRH
4160#ifdef CONFIG_TRACER_MAX_TRACE
4161 had_max_tr = tr->allocated_snapshot;
34600f0e
SR
4162
4163 if (had_max_tr && !t->use_max_tr) {
4164 /*
4165 * We need to make sure that the update_max_tr sees that
4166 * current_trace changed to nop_trace to keep it from
4167 * swapping the buffers after we resize it.
4168 * The update_max_tr is called from interrupts disabled
4169 * so a synchronized_sched() is sufficient.
4170 */
4171 synchronize_sched();
3209cff4 4172 free_snapshot(tr);
ef710e10 4173 }
12883efb 4174#endif
f1b21c9a
SRRH
4175 /* Currently, only the top instance has options */
4176 if (tr->flags & TRACE_ARRAY_FL_GLOBAL) {
4177 destroy_trace_option_files(topts);
4178 topts = create_trace_option_files(tr, t);
4179 }
12883efb
SRRH
4180
4181#ifdef CONFIG_TRACER_MAX_TRACE
34600f0e 4182 if (t->use_max_tr && !had_max_tr) {
3209cff4 4183 ret = alloc_snapshot(tr);
d60da506
HT
4184 if (ret < 0)
4185 goto out;
ef710e10 4186 }
12883efb 4187#endif
577b785f 4188
1c80025a 4189 if (t->init) {
b6f11df2 4190 ret = tracer_init(t, tr);
1c80025a
FW
4191 if (ret)
4192 goto out;
4193 }
bc0c38d1 4194
2b6080f2 4195 tr->current_trace = t;
50512ab5 4196 tr->current_trace->enabled++;
9f029e83 4197 trace_branch_enable(tr);
bc0c38d1
SR
4198 out:
4199 mutex_unlock(&trace_types_lock);
4200
d9e54076
PZ
4201 return ret;
4202}
4203
4204static ssize_t
4205tracing_set_trace_write(struct file *filp, const char __user *ubuf,
4206 size_t cnt, loff_t *ppos)
4207{
607e2ea1 4208 struct trace_array *tr = filp->private_data;
ee6c2c1b 4209 char buf[MAX_TRACER_SIZE+1];
d9e54076
PZ
4210 int i;
4211 size_t ret;
e6e7a65a
FW
4212 int err;
4213
4214 ret = cnt;
d9e54076 4215
ee6c2c1b
LZ
4216 if (cnt > MAX_TRACER_SIZE)
4217 cnt = MAX_TRACER_SIZE;
d9e54076
PZ
4218
4219 if (copy_from_user(&buf, ubuf, cnt))
4220 return -EFAULT;
4221
4222 buf[cnt] = 0;
4223
4224 /* strip ending whitespace. */
4225 for (i = cnt - 1; i > 0 && isspace(buf[i]); i--)
4226 buf[i] = 0;
4227
607e2ea1 4228 err = tracing_set_tracer(tr, buf);
e6e7a65a
FW
4229 if (err)
4230 return err;
d9e54076 4231
cf8517cf 4232 *ppos += ret;
bc0c38d1 4233
c2931e05 4234 return ret;
bc0c38d1
SR
4235}
4236
4237static ssize_t
6508fa76
SF
4238tracing_nsecs_read(unsigned long *ptr, char __user *ubuf,
4239 size_t cnt, loff_t *ppos)
bc0c38d1 4240{
bc0c38d1
SR
4241 char buf[64];
4242 int r;
4243
cffae437 4244 r = snprintf(buf, sizeof(buf), "%ld\n",
bc0c38d1 4245 *ptr == (unsigned long)-1 ? -1 : nsecs_to_usecs(*ptr));
cffae437
SR
4246 if (r > sizeof(buf))
4247 r = sizeof(buf);
4bf39a94 4248 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
bc0c38d1
SR
4249}
4250
4251static ssize_t
6508fa76
SF
4252tracing_nsecs_write(unsigned long *ptr, const char __user *ubuf,
4253 size_t cnt, loff_t *ppos)
bc0c38d1 4254{
5e39841c 4255 unsigned long val;
c6caeeb1 4256 int ret;
bc0c38d1 4257
22fe9b54
PH
4258 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
4259 if (ret)
c6caeeb1 4260 return ret;
bc0c38d1
SR
4261
4262 *ptr = val * 1000;
4263
4264 return cnt;
4265}
4266
6508fa76
SF
4267static ssize_t
4268tracing_thresh_read(struct file *filp, char __user *ubuf,
4269 size_t cnt, loff_t *ppos)
4270{
4271 return tracing_nsecs_read(&tracing_thresh, ubuf, cnt, ppos);
4272}
4273
4274static ssize_t
4275tracing_thresh_write(struct file *filp, const char __user *ubuf,
4276 size_t cnt, loff_t *ppos)
4277{
4278 struct trace_array *tr = filp->private_data;
4279 int ret;
4280
4281 mutex_lock(&trace_types_lock);
4282 ret = tracing_nsecs_write(&tracing_thresh, ubuf, cnt, ppos);
4283 if (ret < 0)
4284 goto out;
4285
4286 if (tr->current_trace->update_thresh) {
4287 ret = tr->current_trace->update_thresh(tr);
4288 if (ret < 0)
4289 goto out;
4290 }
4291
4292 ret = cnt;
4293out:
4294 mutex_unlock(&trace_types_lock);
4295
4296 return ret;
4297}
4298
4299static ssize_t
4300tracing_max_lat_read(struct file *filp, char __user *ubuf,
4301 size_t cnt, loff_t *ppos)
4302{
4303 return tracing_nsecs_read(filp->private_data, ubuf, cnt, ppos);
4304}
4305
4306static ssize_t
4307tracing_max_lat_write(struct file *filp, const char __user *ubuf,
4308 size_t cnt, loff_t *ppos)
4309{
4310 return tracing_nsecs_write(filp->private_data, ubuf, cnt, ppos);
4311}
4312
b3806b43
SR
4313static int tracing_open_pipe(struct inode *inode, struct file *filp)
4314{
15544209 4315 struct trace_array *tr = inode->i_private;
b3806b43 4316 struct trace_iterator *iter;
b04cc6b1 4317 int ret = 0;
b3806b43
SR
4318
4319 if (tracing_disabled)
4320 return -ENODEV;
4321
7b85af63
SRRH
4322 if (trace_array_get(tr) < 0)
4323 return -ENODEV;
4324
b04cc6b1
FW
4325 mutex_lock(&trace_types_lock);
4326
b3806b43
SR
4327 /* create a buffer to store the information to pass to userspace */
4328 iter = kzalloc(sizeof(*iter), GFP_KERNEL);
b04cc6b1
FW
4329 if (!iter) {
4330 ret = -ENOMEM;
f77d09a3 4331 __trace_array_put(tr);
b04cc6b1
FW
4332 goto out;
4333 }
b3806b43 4334
3a161d99 4335 trace_seq_init(&iter->seq);
d716ff71 4336 iter->trace = tr->current_trace;
d7350c3f 4337
4462344e 4338 if (!alloc_cpumask_var(&iter->started, GFP_KERNEL)) {
b04cc6b1 4339 ret = -ENOMEM;
d7350c3f 4340 goto fail;
4462344e
RR
4341 }
4342
a309720c 4343 /* trace pipe does not show start of buffer */
4462344e 4344 cpumask_setall(iter->started);
a309720c 4345
112f38a7
SR
4346 if (trace_flags & TRACE_ITER_LATENCY_FMT)
4347 iter->iter_flags |= TRACE_FILE_LAT_FMT;
4348
8be0709f 4349 /* Output in nanoseconds only if we are using a clock in nanoseconds. */
58e8eedf 4350 if (trace_clocks[tr->clock_id].in_ns)
8be0709f
DS
4351 iter->iter_flags |= TRACE_FILE_TIME_IN_NS;
4352
15544209
ON
4353 iter->tr = tr;
4354 iter->trace_buffer = &tr->trace_buffer;
4355 iter->cpu_file = tracing_get_cpu(inode);
d7350c3f 4356 mutex_init(&iter->mutex);
b3806b43
SR
4357 filp->private_data = iter;
4358
107bad8b
SR
4359 if (iter->trace->pipe_open)
4360 iter->trace->pipe_open(iter);
107bad8b 4361
b444786f 4362 nonseekable_open(inode, filp);
cf6ab6d9
SRRH
4363
4364 tr->current_trace->ref++;
b04cc6b1
FW
4365out:
4366 mutex_unlock(&trace_types_lock);
4367 return ret;
d7350c3f
FW
4368
4369fail:
4370 kfree(iter->trace);
4371 kfree(iter);
7b85af63 4372 __trace_array_put(tr);
d7350c3f
FW
4373 mutex_unlock(&trace_types_lock);
4374 return ret;
b3806b43
SR
4375}
4376
4377static int tracing_release_pipe(struct inode *inode, struct file *file)
4378{
4379 struct trace_iterator *iter = file->private_data;
15544209 4380 struct trace_array *tr = inode->i_private;
b3806b43 4381
b04cc6b1
FW
4382 mutex_lock(&trace_types_lock);
4383
cf6ab6d9
SRRH
4384 tr->current_trace->ref--;
4385
29bf4a5e 4386 if (iter->trace->pipe_close)
c521efd1
SR
4387 iter->trace->pipe_close(iter);
4388
b04cc6b1
FW
4389 mutex_unlock(&trace_types_lock);
4390
4462344e 4391 free_cpumask_var(iter->started);
d7350c3f 4392 mutex_destroy(&iter->mutex);
b3806b43 4393 kfree(iter);
b3806b43 4394
7b85af63
SRRH
4395 trace_array_put(tr);
4396
b3806b43
SR
4397 return 0;
4398}
4399
2a2cc8f7 4400static unsigned int
cc60cdc9 4401trace_poll(struct trace_iterator *iter, struct file *filp, poll_table *poll_table)
2a2cc8f7 4402{
15693458
SRRH
4403 /* Iterators are static, they should be filled or empty */
4404 if (trace_buffer_iter(iter, iter->cpu_file))
4405 return POLLIN | POLLRDNORM;
2a2cc8f7 4406
15693458 4407 if (trace_flags & TRACE_ITER_BLOCK)
2a2cc8f7
SSP
4408 /*
4409 * Always select as readable when in blocking mode
4410 */
4411 return POLLIN | POLLRDNORM;
15693458 4412 else
12883efb 4413 return ring_buffer_poll_wait(iter->trace_buffer->buffer, iter->cpu_file,
15693458 4414 filp, poll_table);
2a2cc8f7 4415}
2a2cc8f7 4416
cc60cdc9
SR
4417static unsigned int
4418tracing_poll_pipe(struct file *filp, poll_table *poll_table)
4419{
4420 struct trace_iterator *iter = filp->private_data;
4421
4422 return trace_poll(iter, filp, poll_table);
2a2cc8f7
SSP
4423}
4424
d716ff71 4425/* Must be called with iter->mutex held. */
ff98781b 4426static int tracing_wait_pipe(struct file *filp)
b3806b43
SR
4427{
4428 struct trace_iterator *iter = filp->private_data;
8b8b3683 4429 int ret;
b3806b43 4430
b3806b43 4431 while (trace_empty(iter)) {
2dc8f095 4432
107bad8b 4433 if ((filp->f_flags & O_NONBLOCK)) {
ff98781b 4434 return -EAGAIN;
107bad8b 4435 }
2dc8f095 4436
b3806b43 4437 /*
250bfd3d 4438 * We block until we read something and tracing is disabled.
b3806b43
SR
4439 * We still block if tracing is disabled, but we have never
4440 * read anything. This allows a user to cat this file, and
4441 * then enable tracing. But after we have read something,
4442 * we give an EOF when tracing is again disabled.
4443 *
4444 * iter->pos will be 0 if we haven't read anything.
4445 */
10246fa3 4446 if (!tracing_is_on() && iter->pos)
b3806b43 4447 break;
f4874261
SRRH
4448
4449 mutex_unlock(&iter->mutex);
4450
e30f53aa 4451 ret = wait_on_pipe(iter, false);
f4874261
SRRH
4452
4453 mutex_lock(&iter->mutex);
4454
8b8b3683
SRRH
4455 if (ret)
4456 return ret;
b3806b43
SR
4457 }
4458
ff98781b
EGM
4459 return 1;
4460}
4461
4462/*
4463 * Consumer reader.
4464 */
4465static ssize_t
4466tracing_read_pipe(struct file *filp, char __user *ubuf,
4467 size_t cnt, loff_t *ppos)
4468{
4469 struct trace_iterator *iter = filp->private_data;
4470 ssize_t sret;
4471
4472 /* return any leftover data */
4473 sret = trace_seq_to_user(&iter->seq, ubuf, cnt);
4474 if (sret != -EBUSY)
4475 return sret;
4476
f9520750 4477 trace_seq_init(&iter->seq);
ff98781b 4478
d7350c3f
FW
4479 /*
4480 * Avoid more than one consumer on a single file descriptor
4481 * This is just a matter of traces coherency, the ring buffer itself
4482 * is protected.
4483 */
4484 mutex_lock(&iter->mutex);
ff98781b
EGM
4485 if (iter->trace->read) {
4486 sret = iter->trace->read(iter, filp, ubuf, cnt, ppos);
4487 if (sret)
4488 goto out;
4489 }
4490
4491waitagain:
4492 sret = tracing_wait_pipe(filp);
4493 if (sret <= 0)
4494 goto out;
4495
b3806b43 4496 /* stop when tracing is finished */
ff98781b
EGM
4497 if (trace_empty(iter)) {
4498 sret = 0;
107bad8b 4499 goto out;
ff98781b 4500 }
b3806b43
SR
4501
4502 if (cnt >= PAGE_SIZE)
4503 cnt = PAGE_SIZE - 1;
4504
53d0aa77 4505 /* reset all but tr, trace, and overruns */
53d0aa77
SR
4506 memset(&iter->seq, 0,
4507 sizeof(struct trace_iterator) -
4508 offsetof(struct trace_iterator, seq));
ed5467da 4509 cpumask_clear(iter->started);
4823ed7e 4510 iter->pos = -1;
b3806b43 4511
4f535968 4512 trace_event_read_lock();
7e53bd42 4513 trace_access_lock(iter->cpu_file);
955b61e5 4514 while (trace_find_next_entry_inc(iter) != NULL) {
2c4f035f 4515 enum print_line_t ret;
5ac48378 4516 int save_len = iter->seq.seq.len;
088b1e42 4517
f9896bf3 4518 ret = print_trace_line(iter);
2c4f035f 4519 if (ret == TRACE_TYPE_PARTIAL_LINE) {
088b1e42 4520 /* don't print partial lines */
5ac48378 4521 iter->seq.seq.len = save_len;
b3806b43 4522 break;
088b1e42 4523 }
b91facc3
FW
4524 if (ret != TRACE_TYPE_NO_CONSUME)
4525 trace_consume(iter);
b3806b43 4526
5ac48378 4527 if (trace_seq_used(&iter->seq) >= cnt)
b3806b43 4528 break;
ee5e51f5
JO
4529
4530 /*
4531 * Setting the full flag means we reached the trace_seq buffer
4532 * size and we should leave by partial output condition above.
4533 * One of the trace_seq_* functions is not used properly.
4534 */
4535 WARN_ONCE(iter->seq.full, "full flag set for trace type %d",
4536 iter->ent->type);
b3806b43 4537 }
7e53bd42 4538 trace_access_unlock(iter->cpu_file);
4f535968 4539 trace_event_read_unlock();
b3806b43 4540
b3806b43 4541 /* Now copy what we have to the user */
6c6c2796 4542 sret = trace_seq_to_user(&iter->seq, ubuf, cnt);
5ac48378 4543 if (iter->seq.seq.readpos >= trace_seq_used(&iter->seq))
f9520750 4544 trace_seq_init(&iter->seq);
9ff4b974
PP
4545
4546 /*
25985edc 4547 * If there was nothing to send to user, in spite of consuming trace
9ff4b974
PP
4548 * entries, go back to wait for more entries.
4549 */
6c6c2796 4550 if (sret == -EBUSY)
9ff4b974 4551 goto waitagain;
b3806b43 4552
107bad8b 4553out:
d7350c3f 4554 mutex_unlock(&iter->mutex);
107bad8b 4555
6c6c2796 4556 return sret;
b3806b43
SR
4557}
4558
3c56819b
EGM
4559static void tracing_spd_release_pipe(struct splice_pipe_desc *spd,
4560 unsigned int idx)
4561{
4562 __free_page(spd->pages[idx]);
4563}
4564
28dfef8f 4565static const struct pipe_buf_operations tracing_pipe_buf_ops = {
34cd4998 4566 .can_merge = 0,
34cd4998 4567 .confirm = generic_pipe_buf_confirm,
92fdd98c 4568 .release = generic_pipe_buf_release,
34cd4998
SR
4569 .steal = generic_pipe_buf_steal,
4570 .get = generic_pipe_buf_get,
3c56819b
EGM
4571};
4572
34cd4998 4573static size_t
fa7c7f6e 4574tracing_fill_pipe_page(size_t rem, struct trace_iterator *iter)
34cd4998
SR
4575{
4576 size_t count;
74f06bb7 4577 int save_len;
34cd4998
SR
4578 int ret;
4579
4580 /* Seq buffer is page-sized, exactly what we need. */
4581 for (;;) {
74f06bb7 4582 save_len = iter->seq.seq.len;
34cd4998 4583 ret = print_trace_line(iter);
74f06bb7
SRRH
4584
4585 if (trace_seq_has_overflowed(&iter->seq)) {
4586 iter->seq.seq.len = save_len;
34cd4998
SR
4587 break;
4588 }
74f06bb7
SRRH
4589
4590 /*
4591 * This should not be hit, because it should only
4592 * be set if the iter->seq overflowed. But check it
4593 * anyway to be safe.
4594 */
34cd4998 4595 if (ret == TRACE_TYPE_PARTIAL_LINE) {
74f06bb7
SRRH
4596 iter->seq.seq.len = save_len;
4597 break;
4598 }
4599
5ac48378 4600 count = trace_seq_used(&iter->seq) - save_len;
74f06bb7
SRRH
4601 if (rem < count) {
4602 rem = 0;
4603 iter->seq.seq.len = save_len;
34cd4998
SR
4604 break;
4605 }
4606
74e7ff8c
LJ
4607 if (ret != TRACE_TYPE_NO_CONSUME)
4608 trace_consume(iter);
34cd4998 4609 rem -= count;
955b61e5 4610 if (!trace_find_next_entry_inc(iter)) {
34cd4998
SR
4611 rem = 0;
4612 iter->ent = NULL;
4613 break;
4614 }
4615 }
4616
4617 return rem;
4618}
4619
3c56819b
EGM
4620static ssize_t tracing_splice_read_pipe(struct file *filp,
4621 loff_t *ppos,
4622 struct pipe_inode_info *pipe,
4623 size_t len,
4624 unsigned int flags)
4625{
35f3d14d
JA
4626 struct page *pages_def[PIPE_DEF_BUFFERS];
4627 struct partial_page partial_def[PIPE_DEF_BUFFERS];
3c56819b
EGM
4628 struct trace_iterator *iter = filp->private_data;
4629 struct splice_pipe_desc spd = {
35f3d14d
JA
4630 .pages = pages_def,
4631 .partial = partial_def,
34cd4998 4632 .nr_pages = 0, /* This gets updated below. */
047fe360 4633 .nr_pages_max = PIPE_DEF_BUFFERS,
34cd4998
SR
4634 .flags = flags,
4635 .ops = &tracing_pipe_buf_ops,
4636 .spd_release = tracing_spd_release_pipe,
3c56819b
EGM
4637 };
4638 ssize_t ret;
34cd4998 4639 size_t rem;
3c56819b
EGM
4640 unsigned int i;
4641
35f3d14d
JA
4642 if (splice_grow_spd(pipe, &spd))
4643 return -ENOMEM;
4644
d7350c3f 4645 mutex_lock(&iter->mutex);
3c56819b
EGM
4646
4647 if (iter->trace->splice_read) {
4648 ret = iter->trace->splice_read(iter, filp,
4649 ppos, pipe, len, flags);
4650 if (ret)
34cd4998 4651 goto out_err;
3c56819b
EGM
4652 }
4653
4654 ret = tracing_wait_pipe(filp);
4655 if (ret <= 0)
34cd4998 4656 goto out_err;
3c56819b 4657
955b61e5 4658 if (!iter->ent && !trace_find_next_entry_inc(iter)) {
3c56819b 4659 ret = -EFAULT;
34cd4998 4660 goto out_err;
3c56819b
EGM
4661 }
4662
4f535968 4663 trace_event_read_lock();
7e53bd42 4664 trace_access_lock(iter->cpu_file);
4f535968 4665
3c56819b 4666 /* Fill as many pages as possible. */
a786c06d 4667 for (i = 0, rem = len; i < spd.nr_pages_max && rem; i++) {
35f3d14d
JA
4668 spd.pages[i] = alloc_page(GFP_KERNEL);
4669 if (!spd.pages[i])
34cd4998 4670 break;
3c56819b 4671
fa7c7f6e 4672 rem = tracing_fill_pipe_page(rem, iter);
3c56819b
EGM
4673
4674 /* Copy the data into the page, so we can start over. */
4675 ret = trace_seq_to_buffer(&iter->seq,
35f3d14d 4676 page_address(spd.pages[i]),
5ac48378 4677 trace_seq_used(&iter->seq));
3c56819b 4678 if (ret < 0) {
35f3d14d 4679 __free_page(spd.pages[i]);
3c56819b
EGM
4680 break;
4681 }
35f3d14d 4682 spd.partial[i].offset = 0;
5ac48378 4683 spd.partial[i].len = trace_seq_used(&iter->seq);
3c56819b 4684
f9520750 4685 trace_seq_init(&iter->seq);
3c56819b
EGM
4686 }
4687
7e53bd42 4688 trace_access_unlock(iter->cpu_file);
4f535968 4689 trace_event_read_unlock();
d7350c3f 4690 mutex_unlock(&iter->mutex);
3c56819b
EGM
4691
4692 spd.nr_pages = i;
4693
35f3d14d
JA
4694 ret = splice_to_pipe(pipe, &spd);
4695out:
047fe360 4696 splice_shrink_spd(&spd);
35f3d14d 4697 return ret;
3c56819b 4698
34cd4998 4699out_err:
d7350c3f 4700 mutex_unlock(&iter->mutex);
35f3d14d 4701 goto out;
3c56819b
EGM
4702}
4703
a98a3c3f
SR
4704static ssize_t
4705tracing_entries_read(struct file *filp, char __user *ubuf,
4706 size_t cnt, loff_t *ppos)
4707{
0bc392ee
ON
4708 struct inode *inode = file_inode(filp);
4709 struct trace_array *tr = inode->i_private;
4710 int cpu = tracing_get_cpu(inode);
438ced17
VN
4711 char buf[64];
4712 int r = 0;
4713 ssize_t ret;
a98a3c3f 4714
db526ca3 4715 mutex_lock(&trace_types_lock);
438ced17 4716
0bc392ee 4717 if (cpu == RING_BUFFER_ALL_CPUS) {
438ced17
VN
4718 int cpu, buf_size_same;
4719 unsigned long size;
4720
4721 size = 0;
4722 buf_size_same = 1;
4723 /* check if all cpu sizes are same */
4724 for_each_tracing_cpu(cpu) {
4725 /* fill in the size from first enabled cpu */
4726 if (size == 0)
12883efb
SRRH
4727 size = per_cpu_ptr(tr->trace_buffer.data, cpu)->entries;
4728 if (size != per_cpu_ptr(tr->trace_buffer.data, cpu)->entries) {
438ced17
VN
4729 buf_size_same = 0;
4730 break;
4731 }
4732 }
4733
4734 if (buf_size_same) {
4735 if (!ring_buffer_expanded)
4736 r = sprintf(buf, "%lu (expanded: %lu)\n",
4737 size >> 10,
4738 trace_buf_size >> 10);
4739 else
4740 r = sprintf(buf, "%lu\n", size >> 10);
4741 } else
4742 r = sprintf(buf, "X\n");
4743 } else
0bc392ee 4744 r = sprintf(buf, "%lu\n", per_cpu_ptr(tr->trace_buffer.data, cpu)->entries >> 10);
438ced17 4745
db526ca3
SR
4746 mutex_unlock(&trace_types_lock);
4747
438ced17
VN
4748 ret = simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
4749 return ret;
a98a3c3f
SR
4750}
4751
4752static ssize_t
4753tracing_entries_write(struct file *filp, const char __user *ubuf,
4754 size_t cnt, loff_t *ppos)
4755{
0bc392ee
ON
4756 struct inode *inode = file_inode(filp);
4757 struct trace_array *tr = inode->i_private;
a98a3c3f 4758 unsigned long val;
4f271a2a 4759 int ret;
a98a3c3f 4760
22fe9b54
PH
4761 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
4762 if (ret)
c6caeeb1 4763 return ret;
a98a3c3f
SR
4764
4765 /* must have at least 1 entry */
4766 if (!val)
4767 return -EINVAL;
4768
1696b2b0
SR
4769 /* value is in KB */
4770 val <<= 10;
0bc392ee 4771 ret = tracing_resize_ring_buffer(tr, val, tracing_get_cpu(inode));
4f271a2a
VN
4772 if (ret < 0)
4773 return ret;
a98a3c3f 4774
cf8517cf 4775 *ppos += cnt;
a98a3c3f 4776
4f271a2a
VN
4777 return cnt;
4778}
bf5e6519 4779
f81ab074
VN
4780static ssize_t
4781tracing_total_entries_read(struct file *filp, char __user *ubuf,
4782 size_t cnt, loff_t *ppos)
4783{
4784 struct trace_array *tr = filp->private_data;
4785 char buf[64];
4786 int r, cpu;
4787 unsigned long size = 0, expanded_size = 0;
4788
4789 mutex_lock(&trace_types_lock);
4790 for_each_tracing_cpu(cpu) {
12883efb 4791 size += per_cpu_ptr(tr->trace_buffer.data, cpu)->entries >> 10;
f81ab074
VN
4792 if (!ring_buffer_expanded)
4793 expanded_size += trace_buf_size >> 10;
4794 }
4795 if (ring_buffer_expanded)
4796 r = sprintf(buf, "%lu\n", size);
4797 else
4798 r = sprintf(buf, "%lu (expanded: %lu)\n", size, expanded_size);
4799 mutex_unlock(&trace_types_lock);
4800
4801 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
4802}
4803
4f271a2a
VN
4804static ssize_t
4805tracing_free_buffer_write(struct file *filp, const char __user *ubuf,
4806 size_t cnt, loff_t *ppos)
4807{
4808 /*
4809 * There is no need to read what the user has written, this function
4810 * is just to make sure that there is no error when "echo" is used
4811 */
4812
4813 *ppos += cnt;
a98a3c3f
SR
4814
4815 return cnt;
4816}
4817
4f271a2a
VN
4818static int
4819tracing_free_buffer_release(struct inode *inode, struct file *filp)
4820{
2b6080f2
SR
4821 struct trace_array *tr = inode->i_private;
4822
cf30cf67
SR
4823 /* disable tracing ? */
4824 if (trace_flags & TRACE_ITER_STOP_ON_FREE)
711e1243 4825 tracer_tracing_off(tr);
4f271a2a 4826 /* resize the ring buffer to 0 */
2b6080f2 4827 tracing_resize_ring_buffer(tr, 0, RING_BUFFER_ALL_CPUS);
4f271a2a 4828
7b85af63
SRRH
4829 trace_array_put(tr);
4830
4f271a2a
VN
4831 return 0;
4832}
4833
5bf9a1ee
PP
4834static ssize_t
4835tracing_mark_write(struct file *filp, const char __user *ubuf,
4836 size_t cnt, loff_t *fpos)
4837{
d696b58c 4838 unsigned long addr = (unsigned long)ubuf;
2d71619c 4839 struct trace_array *tr = filp->private_data;
d696b58c
SR
4840 struct ring_buffer_event *event;
4841 struct ring_buffer *buffer;
4842 struct print_entry *entry;
4843 unsigned long irq_flags;
4844 struct page *pages[2];
6edb2a8a 4845 void *map_page[2];
d696b58c
SR
4846 int nr_pages = 1;
4847 ssize_t written;
d696b58c
SR
4848 int offset;
4849 int size;
4850 int len;
4851 int ret;
6edb2a8a 4852 int i;
5bf9a1ee 4853
c76f0694 4854 if (tracing_disabled)
5bf9a1ee
PP
4855 return -EINVAL;
4856
5224c3a3
MSB
4857 if (!(trace_flags & TRACE_ITER_MARKERS))
4858 return -EINVAL;
4859
5bf9a1ee
PP
4860 if (cnt > TRACE_BUF_SIZE)
4861 cnt = TRACE_BUF_SIZE;
4862
d696b58c
SR
4863 /*
4864 * Userspace is injecting traces into the kernel trace buffer.
4865 * We want to be as non intrusive as possible.
4866 * To do so, we do not want to allocate any special buffers
4867 * or take any locks, but instead write the userspace data
4868 * straight into the ring buffer.
4869 *
4870 * First we need to pin the userspace buffer into memory,
4871 * which, most likely it is, because it just referenced it.
4872 * But there's no guarantee that it is. By using get_user_pages_fast()
4873 * and kmap_atomic/kunmap_atomic() we can get access to the
4874 * pages directly. We then write the data directly into the
4875 * ring buffer.
4876 */
4877 BUILD_BUG_ON(TRACE_BUF_SIZE >= PAGE_SIZE);
5bf9a1ee 4878
d696b58c
SR
4879 /* check if we cross pages */
4880 if ((addr & PAGE_MASK) != ((addr + cnt) & PAGE_MASK))
4881 nr_pages = 2;
4882
4883 offset = addr & (PAGE_SIZE - 1);
4884 addr &= PAGE_MASK;
4885
4886 ret = get_user_pages_fast(addr, nr_pages, 0, pages);
4887 if (ret < nr_pages) {
4888 while (--ret >= 0)
4889 put_page(pages[ret]);
4890 written = -EFAULT;
4891 goto out;
5bf9a1ee 4892 }
d696b58c 4893
6edb2a8a
SR
4894 for (i = 0; i < nr_pages; i++)
4895 map_page[i] = kmap_atomic(pages[i]);
d696b58c
SR
4896
4897 local_save_flags(irq_flags);
4898 size = sizeof(*entry) + cnt + 2; /* possible \n added */
2d71619c 4899 buffer = tr->trace_buffer.buffer;
d696b58c
SR
4900 event = trace_buffer_lock_reserve(buffer, TRACE_PRINT, size,
4901 irq_flags, preempt_count());
4902 if (!event) {
4903 /* Ring buffer disabled, return as if not open for write */
4904 written = -EBADF;
4905 goto out_unlock;
5bf9a1ee 4906 }
d696b58c
SR
4907
4908 entry = ring_buffer_event_data(event);
4909 entry->ip = _THIS_IP_;
4910
4911 if (nr_pages == 2) {
4912 len = PAGE_SIZE - offset;
6edb2a8a
SR
4913 memcpy(&entry->buf, map_page[0] + offset, len);
4914 memcpy(&entry->buf[len], map_page[1], cnt - len);
c13d2f7c 4915 } else
6edb2a8a 4916 memcpy(&entry->buf, map_page[0] + offset, cnt);
5bf9a1ee 4917
d696b58c
SR
4918 if (entry->buf[cnt - 1] != '\n') {
4919 entry->buf[cnt] = '\n';
4920 entry->buf[cnt + 1] = '\0';
4921 } else
4922 entry->buf[cnt] = '\0';
4923
7ffbd48d 4924 __buffer_unlock_commit(buffer, event);
5bf9a1ee 4925
d696b58c 4926 written = cnt;
5bf9a1ee 4927
d696b58c 4928 *fpos += written;
1aa54bca 4929
d696b58c 4930 out_unlock:
6edb2a8a
SR
4931 for (i = 0; i < nr_pages; i++){
4932 kunmap_atomic(map_page[i]);
4933 put_page(pages[i]);
4934 }
d696b58c 4935 out:
1aa54bca 4936 return written;
5bf9a1ee
PP
4937}
4938
13f16d20 4939static int tracing_clock_show(struct seq_file *m, void *v)
5079f326 4940{
2b6080f2 4941 struct trace_array *tr = m->private;
5079f326
Z
4942 int i;
4943
4944 for (i = 0; i < ARRAY_SIZE(trace_clocks); i++)
13f16d20 4945 seq_printf(m,
5079f326 4946 "%s%s%s%s", i ? " " : "",
2b6080f2
SR
4947 i == tr->clock_id ? "[" : "", trace_clocks[i].name,
4948 i == tr->clock_id ? "]" : "");
13f16d20 4949 seq_putc(m, '\n');
5079f326 4950
13f16d20 4951 return 0;
5079f326
Z
4952}
4953
e1e232ca 4954static int tracing_set_clock(struct trace_array *tr, const char *clockstr)
5079f326 4955{
5079f326
Z
4956 int i;
4957
5079f326
Z
4958 for (i = 0; i < ARRAY_SIZE(trace_clocks); i++) {
4959 if (strcmp(trace_clocks[i].name, clockstr) == 0)
4960 break;
4961 }
4962 if (i == ARRAY_SIZE(trace_clocks))
4963 return -EINVAL;
4964
5079f326
Z
4965 mutex_lock(&trace_types_lock);
4966
2b6080f2
SR
4967 tr->clock_id = i;
4968
12883efb 4969 ring_buffer_set_clock(tr->trace_buffer.buffer, trace_clocks[i].func);
5079f326 4970
60303ed3
DS
4971 /*
4972 * New clock may not be consistent with the previous clock.
4973 * Reset the buffer so that it doesn't have incomparable timestamps.
4974 */
9457158b 4975 tracing_reset_online_cpus(&tr->trace_buffer);
12883efb
SRRH
4976
4977#ifdef CONFIG_TRACER_MAX_TRACE
4978 if (tr->flags & TRACE_ARRAY_FL_GLOBAL && tr->max_buffer.buffer)
4979 ring_buffer_set_clock(tr->max_buffer.buffer, trace_clocks[i].func);
9457158b 4980 tracing_reset_online_cpus(&tr->max_buffer);
12883efb 4981#endif
60303ed3 4982
5079f326
Z
4983 mutex_unlock(&trace_types_lock);
4984
e1e232ca
SR
4985 return 0;
4986}
4987
4988static ssize_t tracing_clock_write(struct file *filp, const char __user *ubuf,
4989 size_t cnt, loff_t *fpos)
4990{
4991 struct seq_file *m = filp->private_data;
4992 struct trace_array *tr = m->private;
4993 char buf[64];
4994 const char *clockstr;
4995 int ret;
4996
4997 if (cnt >= sizeof(buf))
4998 return -EINVAL;
4999
5000 if (copy_from_user(&buf, ubuf, cnt))
5001 return -EFAULT;
5002
5003 buf[cnt] = 0;
5004
5005 clockstr = strstrip(buf);
5006
5007 ret = tracing_set_clock(tr, clockstr);
5008 if (ret)
5009 return ret;
5010
5079f326
Z
5011 *fpos += cnt;
5012
5013 return cnt;
5014}
5015
13f16d20
LZ
5016static int tracing_clock_open(struct inode *inode, struct file *file)
5017{
7b85af63
SRRH
5018 struct trace_array *tr = inode->i_private;
5019 int ret;
5020
13f16d20
LZ
5021 if (tracing_disabled)
5022 return -ENODEV;
2b6080f2 5023
7b85af63
SRRH
5024 if (trace_array_get(tr))
5025 return -ENODEV;
5026
5027 ret = single_open(file, tracing_clock_show, inode->i_private);
5028 if (ret < 0)
5029 trace_array_put(tr);
5030
5031 return ret;
13f16d20
LZ
5032}
5033
6de58e62
SRRH
5034struct ftrace_buffer_info {
5035 struct trace_iterator iter;
5036 void *spare;
5037 unsigned int read;
5038};
5039
debdd57f
HT
5040#ifdef CONFIG_TRACER_SNAPSHOT
5041static int tracing_snapshot_open(struct inode *inode, struct file *file)
5042{
6484c71c 5043 struct trace_array *tr = inode->i_private;
debdd57f 5044 struct trace_iterator *iter;
2b6080f2 5045 struct seq_file *m;
debdd57f
HT
5046 int ret = 0;
5047
ff451961
SRRH
5048 if (trace_array_get(tr) < 0)
5049 return -ENODEV;
5050
debdd57f 5051 if (file->f_mode & FMODE_READ) {
6484c71c 5052 iter = __tracing_open(inode, file, true);
debdd57f
HT
5053 if (IS_ERR(iter))
5054 ret = PTR_ERR(iter);
2b6080f2
SR
5055 } else {
5056 /* Writes still need the seq_file to hold the private data */
f77d09a3 5057 ret = -ENOMEM;
2b6080f2
SR
5058 m = kzalloc(sizeof(*m), GFP_KERNEL);
5059 if (!m)
f77d09a3 5060 goto out;
2b6080f2
SR
5061 iter = kzalloc(sizeof(*iter), GFP_KERNEL);
5062 if (!iter) {
5063 kfree(m);
f77d09a3 5064 goto out;
2b6080f2 5065 }
f77d09a3
AL
5066 ret = 0;
5067
ff451961 5068 iter->tr = tr;
6484c71c
ON
5069 iter->trace_buffer = &tr->max_buffer;
5070 iter->cpu_file = tracing_get_cpu(inode);
2b6080f2
SR
5071 m->private = iter;
5072 file->private_data = m;
debdd57f 5073 }
f77d09a3 5074out:
ff451961
SRRH
5075 if (ret < 0)
5076 trace_array_put(tr);
5077
debdd57f
HT
5078 return ret;
5079}
5080
5081static ssize_t
5082tracing_snapshot_write(struct file *filp, const char __user *ubuf, size_t cnt,
5083 loff_t *ppos)
5084{
2b6080f2
SR
5085 struct seq_file *m = filp->private_data;
5086 struct trace_iterator *iter = m->private;
5087 struct trace_array *tr = iter->tr;
debdd57f
HT
5088 unsigned long val;
5089 int ret;
5090
5091 ret = tracing_update_buffers();
5092 if (ret < 0)
5093 return ret;
5094
5095 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
5096 if (ret)
5097 return ret;
5098
5099 mutex_lock(&trace_types_lock);
5100
2b6080f2 5101 if (tr->current_trace->use_max_tr) {
debdd57f
HT
5102 ret = -EBUSY;
5103 goto out;
5104 }
5105
5106 switch (val) {
5107 case 0:
f1affcaa
SRRH
5108 if (iter->cpu_file != RING_BUFFER_ALL_CPUS) {
5109 ret = -EINVAL;
5110 break;
debdd57f 5111 }
3209cff4
SRRH
5112 if (tr->allocated_snapshot)
5113 free_snapshot(tr);
debdd57f
HT
5114 break;
5115 case 1:
f1affcaa
SRRH
5116/* Only allow per-cpu swap if the ring buffer supports it */
5117#ifndef CONFIG_RING_BUFFER_ALLOW_SWAP
5118 if (iter->cpu_file != RING_BUFFER_ALL_CPUS) {
5119 ret = -EINVAL;
5120 break;
5121 }
5122#endif
45ad21ca 5123 if (!tr->allocated_snapshot) {
3209cff4 5124 ret = alloc_snapshot(tr);
debdd57f
HT
5125 if (ret < 0)
5126 break;
debdd57f 5127 }
debdd57f
HT
5128 local_irq_disable();
5129 /* Now, we're going to swap */
f1affcaa 5130 if (iter->cpu_file == RING_BUFFER_ALL_CPUS)
ce9bae55 5131 update_max_tr(tr, current, smp_processor_id());
f1affcaa 5132 else
ce9bae55 5133 update_max_tr_single(tr, current, iter->cpu_file);
debdd57f
HT
5134 local_irq_enable();
5135 break;
5136 default:
45ad21ca 5137 if (tr->allocated_snapshot) {
f1affcaa
SRRH
5138 if (iter->cpu_file == RING_BUFFER_ALL_CPUS)
5139 tracing_reset_online_cpus(&tr->max_buffer);
5140 else
5141 tracing_reset(&tr->max_buffer, iter->cpu_file);
5142 }
debdd57f
HT
5143 break;
5144 }
5145
5146 if (ret >= 0) {
5147 *ppos += cnt;
5148 ret = cnt;
5149 }
5150out:
5151 mutex_unlock(&trace_types_lock);
5152 return ret;
5153}
2b6080f2
SR
5154
5155static int tracing_snapshot_release(struct inode *inode, struct file *file)
5156{
5157 struct seq_file *m = file->private_data;
ff451961
SRRH
5158 int ret;
5159
5160 ret = tracing_release(inode, file);
2b6080f2
SR
5161
5162 if (file->f_mode & FMODE_READ)
ff451961 5163 return ret;
2b6080f2
SR
5164
5165 /* If write only, the seq_file is just a stub */
5166 if (m)
5167 kfree(m->private);
5168 kfree(m);
5169
5170 return 0;
5171}
5172
6de58e62
SRRH
5173static int tracing_buffers_open(struct inode *inode, struct file *filp);
5174static ssize_t tracing_buffers_read(struct file *filp, char __user *ubuf,
5175 size_t count, loff_t *ppos);
5176static int tracing_buffers_release(struct inode *inode, struct file *file);
5177static ssize_t tracing_buffers_splice_read(struct file *file, loff_t *ppos,
5178 struct pipe_inode_info *pipe, size_t len, unsigned int flags);
5179
5180static int snapshot_raw_open(struct inode *inode, struct file *filp)
5181{
5182 struct ftrace_buffer_info *info;
5183 int ret;
5184
5185 ret = tracing_buffers_open(inode, filp);
5186 if (ret < 0)
5187 return ret;
5188
5189 info = filp->private_data;
5190
5191 if (info->iter.trace->use_max_tr) {
5192 tracing_buffers_release(inode, filp);
5193 return -EBUSY;
5194 }
5195
5196 info->iter.snapshot = true;
5197 info->iter.trace_buffer = &info->iter.tr->max_buffer;
5198
5199 return ret;
5200}
5201
debdd57f
HT
5202#endif /* CONFIG_TRACER_SNAPSHOT */
5203
5204
6508fa76
SF
5205static const struct file_operations tracing_thresh_fops = {
5206 .open = tracing_open_generic,
5207 .read = tracing_thresh_read,
5208 .write = tracing_thresh_write,
5209 .llseek = generic_file_llseek,
5210};
5211
5e2336a0 5212static const struct file_operations tracing_max_lat_fops = {
4bf39a94
IM
5213 .open = tracing_open_generic,
5214 .read = tracing_max_lat_read,
5215 .write = tracing_max_lat_write,
b444786f 5216 .llseek = generic_file_llseek,
bc0c38d1
SR
5217};
5218
5e2336a0 5219static const struct file_operations set_tracer_fops = {
4bf39a94
IM
5220 .open = tracing_open_generic,
5221 .read = tracing_set_trace_read,
5222 .write = tracing_set_trace_write,
b444786f 5223 .llseek = generic_file_llseek,
bc0c38d1
SR
5224};
5225
5e2336a0 5226static const struct file_operations tracing_pipe_fops = {
4bf39a94 5227 .open = tracing_open_pipe,
2a2cc8f7 5228 .poll = tracing_poll_pipe,
4bf39a94 5229 .read = tracing_read_pipe,
3c56819b 5230 .splice_read = tracing_splice_read_pipe,
4bf39a94 5231 .release = tracing_release_pipe,
b444786f 5232 .llseek = no_llseek,
b3806b43
SR
5233};
5234
5e2336a0 5235static const struct file_operations tracing_entries_fops = {
0bc392ee 5236 .open = tracing_open_generic_tr,
a98a3c3f
SR
5237 .read = tracing_entries_read,
5238 .write = tracing_entries_write,
b444786f 5239 .llseek = generic_file_llseek,
0bc392ee 5240 .release = tracing_release_generic_tr,
a98a3c3f
SR
5241};
5242
f81ab074 5243static const struct file_operations tracing_total_entries_fops = {
7b85af63 5244 .open = tracing_open_generic_tr,
f81ab074
VN
5245 .read = tracing_total_entries_read,
5246 .llseek = generic_file_llseek,
7b85af63 5247 .release = tracing_release_generic_tr,
f81ab074
VN
5248};
5249
4f271a2a 5250static const struct file_operations tracing_free_buffer_fops = {
7b85af63 5251 .open = tracing_open_generic_tr,
4f271a2a
VN
5252 .write = tracing_free_buffer_write,
5253 .release = tracing_free_buffer_release,
5254};
5255
5e2336a0 5256static const struct file_operations tracing_mark_fops = {
7b85af63 5257 .open = tracing_open_generic_tr,
5bf9a1ee 5258 .write = tracing_mark_write,
b444786f 5259 .llseek = generic_file_llseek,
7b85af63 5260 .release = tracing_release_generic_tr,
5bf9a1ee
PP
5261};
5262
5079f326 5263static const struct file_operations trace_clock_fops = {
13f16d20
LZ
5264 .open = tracing_clock_open,
5265 .read = seq_read,
5266 .llseek = seq_lseek,
7b85af63 5267 .release = tracing_single_release_tr,
5079f326
Z
5268 .write = tracing_clock_write,
5269};
5270
debdd57f
HT
5271#ifdef CONFIG_TRACER_SNAPSHOT
5272static const struct file_operations snapshot_fops = {
5273 .open = tracing_snapshot_open,
5274 .read = seq_read,
5275 .write = tracing_snapshot_write,
098c879e 5276 .llseek = tracing_lseek,
2b6080f2 5277 .release = tracing_snapshot_release,
debdd57f 5278};
debdd57f 5279
6de58e62
SRRH
5280static const struct file_operations snapshot_raw_fops = {
5281 .open = snapshot_raw_open,
5282 .read = tracing_buffers_read,
5283 .release = tracing_buffers_release,
5284 .splice_read = tracing_buffers_splice_read,
5285 .llseek = no_llseek,
2cadf913
SR
5286};
5287
6de58e62
SRRH
5288#endif /* CONFIG_TRACER_SNAPSHOT */
5289
2cadf913
SR
5290static int tracing_buffers_open(struct inode *inode, struct file *filp)
5291{
46ef2be0 5292 struct trace_array *tr = inode->i_private;
2cadf913 5293 struct ftrace_buffer_info *info;
7b85af63 5294 int ret;
2cadf913
SR
5295
5296 if (tracing_disabled)
5297 return -ENODEV;
5298
7b85af63
SRRH
5299 if (trace_array_get(tr) < 0)
5300 return -ENODEV;
5301
2cadf913 5302 info = kzalloc(sizeof(*info), GFP_KERNEL);
7b85af63
SRRH
5303 if (!info) {
5304 trace_array_put(tr);
2cadf913 5305 return -ENOMEM;
7b85af63 5306 }
2cadf913 5307
a695cb58
SRRH
5308 mutex_lock(&trace_types_lock);
5309
cc60cdc9 5310 info->iter.tr = tr;
46ef2be0 5311 info->iter.cpu_file = tracing_get_cpu(inode);
b627344f 5312 info->iter.trace = tr->current_trace;
12883efb 5313 info->iter.trace_buffer = &tr->trace_buffer;
cc60cdc9 5314 info->spare = NULL;
2cadf913 5315 /* Force reading ring buffer for first read */
cc60cdc9 5316 info->read = (unsigned int)-1;
2cadf913
SR
5317
5318 filp->private_data = info;
5319
cf6ab6d9
SRRH
5320 tr->current_trace->ref++;
5321
a695cb58
SRRH
5322 mutex_unlock(&trace_types_lock);
5323
7b85af63
SRRH
5324 ret = nonseekable_open(inode, filp);
5325 if (ret < 0)
5326 trace_array_put(tr);
5327
5328 return ret;
2cadf913
SR
5329}
5330
cc60cdc9
SR
5331static unsigned int
5332tracing_buffers_poll(struct file *filp, poll_table *poll_table)
5333{
5334 struct ftrace_buffer_info *info = filp->private_data;
5335 struct trace_iterator *iter = &info->iter;
5336
5337 return trace_poll(iter, filp, poll_table);
5338}
5339
2cadf913
SR
5340static ssize_t
5341tracing_buffers_read(struct file *filp, char __user *ubuf,
5342 size_t count, loff_t *ppos)
5343{
5344 struct ftrace_buffer_info *info = filp->private_data;
cc60cdc9 5345 struct trace_iterator *iter = &info->iter;
2cadf913 5346 ssize_t ret;
6de58e62 5347 ssize_t size;
2cadf913 5348
2dc5d12b
SR
5349 if (!count)
5350 return 0;
5351
6de58e62 5352#ifdef CONFIG_TRACER_MAX_TRACE
d716ff71
SRRH
5353 if (iter->snapshot && iter->tr->current_trace->use_max_tr)
5354 return -EBUSY;
6de58e62
SRRH
5355#endif
5356
ddd538f3 5357 if (!info->spare)
12883efb
SRRH
5358 info->spare = ring_buffer_alloc_read_page(iter->trace_buffer->buffer,
5359 iter->cpu_file);
ddd538f3 5360 if (!info->spare)
d716ff71 5361 return -ENOMEM;
ddd538f3 5362
2cadf913
SR
5363 /* Do we have previous read data to read? */
5364 if (info->read < PAGE_SIZE)
5365 goto read;
5366
b627344f 5367 again:
cc60cdc9 5368 trace_access_lock(iter->cpu_file);
12883efb 5369 ret = ring_buffer_read_page(iter->trace_buffer->buffer,
2cadf913
SR
5370 &info->spare,
5371 count,
cc60cdc9
SR
5372 iter->cpu_file, 0);
5373 trace_access_unlock(iter->cpu_file);
2cadf913 5374
b627344f
SR
5375 if (ret < 0) {
5376 if (trace_empty(iter)) {
d716ff71
SRRH
5377 if ((filp->f_flags & O_NONBLOCK))
5378 return -EAGAIN;
5379
e30f53aa 5380 ret = wait_on_pipe(iter, false);
d716ff71
SRRH
5381 if (ret)
5382 return ret;
5383
b627344f
SR
5384 goto again;
5385 }
d716ff71 5386 return 0;
b627344f 5387 }
436fc280 5388
436fc280 5389 info->read = 0;
b627344f 5390 read:
2cadf913
SR
5391 size = PAGE_SIZE - info->read;
5392 if (size > count)
5393 size = count;
5394
5395 ret = copy_to_user(ubuf, info->spare + info->read, size);
d716ff71
SRRH
5396 if (ret == size)
5397 return -EFAULT;
5398
2dc5d12b
SR
5399 size -= ret;
5400
2cadf913
SR
5401 *ppos += size;
5402 info->read += size;
5403
5404 return size;
5405}
5406
5407static int tracing_buffers_release(struct inode *inode, struct file *file)
5408{
5409 struct ftrace_buffer_info *info = file->private_data;
cc60cdc9 5410 struct trace_iterator *iter = &info->iter;
2cadf913 5411
a695cb58
SRRH
5412 mutex_lock(&trace_types_lock);
5413
cf6ab6d9
SRRH
5414 iter->tr->current_trace->ref--;
5415
ff451961 5416 __trace_array_put(iter->tr);
2cadf913 5417
ddd538f3 5418 if (info->spare)
12883efb 5419 ring_buffer_free_read_page(iter->trace_buffer->buffer, info->spare);
2cadf913
SR
5420 kfree(info);
5421
a695cb58
SRRH
5422 mutex_unlock(&trace_types_lock);
5423
2cadf913
SR
5424 return 0;
5425}
5426
/* Reference-counted handle on one ring buffer read page placed in a pipe. */
struct buffer_ref {
	struct ring_buffer	*buffer;	/* ring buffer @page was allocated from */
	void			*page;		/* page from ring_buffer_alloc_read_page() */
	int			ref;		/* users left; page is freed at zero */
};
5432
5433static void buffer_pipe_buf_release(struct pipe_inode_info *pipe,
5434 struct pipe_buffer *buf)
5435{
5436 struct buffer_ref *ref = (struct buffer_ref *)buf->private;
5437
5438 if (--ref->ref)
5439 return;
5440
5441 ring_buffer_free_read_page(ref->buffer, ref->page);
5442 kfree(ref);
5443 buf->private = 0;
5444}
5445
2cadf913
SR
5446static void buffer_pipe_buf_get(struct pipe_inode_info *pipe,
5447 struct pipe_buffer *buf)
5448{
5449 struct buffer_ref *ref = (struct buffer_ref *)buf->private;
5450
5451 ref->ref++;
5452}
5453
5454/* Pipe buffer operations for a buffer. */
28dfef8f 5455static const struct pipe_buf_operations buffer_pipe_buf_ops = {
2cadf913 5456 .can_merge = 0,
2cadf913
SR
5457 .confirm = generic_pipe_buf_confirm,
5458 .release = buffer_pipe_buf_release,
d55cb6cf 5459 .steal = generic_pipe_buf_steal,
2cadf913
SR
5460 .get = buffer_pipe_buf_get,
5461};
5462
5463/*
5464 * Callback from splice_to_pipe(), if we need to release some pages
5465 * at the end of the spd in case we error'ed out in filling the pipe.
5466 */
5467static void buffer_spd_release(struct splice_pipe_desc *spd, unsigned int i)
5468{
5469 struct buffer_ref *ref =
5470 (struct buffer_ref *)spd->partial[i].private;
5471
5472 if (--ref->ref)
5473 return;
5474
5475 ring_buffer_free_read_page(ref->buffer, ref->page);
5476 kfree(ref);
5477 spd->partial[i].private = 0;
5478}
5479
5480static ssize_t
5481tracing_buffers_splice_read(struct file *file, loff_t *ppos,
5482 struct pipe_inode_info *pipe, size_t len,
5483 unsigned int flags)
5484{
5485 struct ftrace_buffer_info *info = file->private_data;
cc60cdc9 5486 struct trace_iterator *iter = &info->iter;
35f3d14d
JA
5487 struct partial_page partial_def[PIPE_DEF_BUFFERS];
5488 struct page *pages_def[PIPE_DEF_BUFFERS];
2cadf913 5489 struct splice_pipe_desc spd = {
35f3d14d
JA
5490 .pages = pages_def,
5491 .partial = partial_def,
047fe360 5492 .nr_pages_max = PIPE_DEF_BUFFERS,
2cadf913
SR
5493 .flags = flags,
5494 .ops = &buffer_pipe_buf_ops,
5495 .spd_release = buffer_spd_release,
5496 };
5497 struct buffer_ref *ref;
93459c6c 5498 int entries, size, i;
07906da7 5499 ssize_t ret = 0;
2cadf913 5500
6de58e62 5501#ifdef CONFIG_TRACER_MAX_TRACE
d716ff71
SRRH
5502 if (iter->snapshot && iter->tr->current_trace->use_max_tr)
5503 return -EBUSY;
6de58e62
SRRH
5504#endif
5505
d716ff71
SRRH
5506 if (splice_grow_spd(pipe, &spd))
5507 return -ENOMEM;
35f3d14d 5508
d716ff71
SRRH
5509 if (*ppos & (PAGE_SIZE - 1))
5510 return -EINVAL;
93cfb3c9
LJ
5511
5512 if (len & (PAGE_SIZE - 1)) {
d716ff71
SRRH
5513 if (len < PAGE_SIZE)
5514 return -EINVAL;
93cfb3c9
LJ
5515 len &= PAGE_MASK;
5516 }
5517
cc60cdc9
SR
5518 again:
5519 trace_access_lock(iter->cpu_file);
12883efb 5520 entries = ring_buffer_entries_cpu(iter->trace_buffer->buffer, iter->cpu_file);
93459c6c 5521
a786c06d 5522 for (i = 0; i < spd.nr_pages_max && len && entries; i++, len -= PAGE_SIZE) {
2cadf913
SR
5523 struct page *page;
5524 int r;
5525
5526 ref = kzalloc(sizeof(*ref), GFP_KERNEL);
07906da7
RV
5527 if (!ref) {
5528 ret = -ENOMEM;
2cadf913 5529 break;
07906da7 5530 }
2cadf913 5531
7267fa68 5532 ref->ref = 1;
12883efb 5533 ref->buffer = iter->trace_buffer->buffer;
cc60cdc9 5534 ref->page = ring_buffer_alloc_read_page(ref->buffer, iter->cpu_file);
2cadf913 5535 if (!ref->page) {
07906da7 5536 ret = -ENOMEM;
2cadf913
SR
5537 kfree(ref);
5538 break;
5539 }
5540
5541 r = ring_buffer_read_page(ref->buffer, &ref->page,
cc60cdc9 5542 len, iter->cpu_file, 1);
2cadf913 5543 if (r < 0) {
7ea59064 5544 ring_buffer_free_read_page(ref->buffer, ref->page);
2cadf913
SR
5545 kfree(ref);
5546 break;
5547 }
5548
5549 /*
5550 * zero out any left over data, this is going to
5551 * user land.
5552 */
5553 size = ring_buffer_page_len(ref->page);
5554 if (size < PAGE_SIZE)
5555 memset(ref->page + size, 0, PAGE_SIZE - size);
5556
5557 page = virt_to_page(ref->page);
5558
5559 spd.pages[i] = page;
5560 spd.partial[i].len = PAGE_SIZE;
5561 spd.partial[i].offset = 0;
5562 spd.partial[i].private = (unsigned long)ref;
5563 spd.nr_pages++;
93cfb3c9 5564 *ppos += PAGE_SIZE;
93459c6c 5565
12883efb 5566 entries = ring_buffer_entries_cpu(iter->trace_buffer->buffer, iter->cpu_file);
2cadf913
SR
5567 }
5568
cc60cdc9 5569 trace_access_unlock(iter->cpu_file);
2cadf913
SR
5570 spd.nr_pages = i;
5571
5572 /* did we read anything? */
5573 if (!spd.nr_pages) {
07906da7 5574 if (ret)
d716ff71
SRRH
5575 return ret;
5576
5577 if ((file->f_flags & O_NONBLOCK) || (flags & SPLICE_F_NONBLOCK))
5578 return -EAGAIN;
07906da7 5579
e30f53aa 5580 ret = wait_on_pipe(iter, true);
8b8b3683 5581 if (ret)
d716ff71 5582 return ret;
e30f53aa 5583
cc60cdc9 5584 goto again;
2cadf913
SR
5585 }
5586
5587 ret = splice_to_pipe(pipe, &spd);
047fe360 5588 splice_shrink_spd(&spd);
6de58e62 5589
2cadf913
SR
5590 return ret;
5591}
5592
5593static const struct file_operations tracing_buffers_fops = {
5594 .open = tracing_buffers_open,
5595 .read = tracing_buffers_read,
cc60cdc9 5596 .poll = tracing_buffers_poll,
2cadf913
SR
5597 .release = tracing_buffers_release,
5598 .splice_read = tracing_buffers_splice_read,
5599 .llseek = no_llseek,
5600};
5601
c8d77183
SR
5602static ssize_t
5603tracing_stats_read(struct file *filp, char __user *ubuf,
5604 size_t count, loff_t *ppos)
5605{
4d3435b8
ON
5606 struct inode *inode = file_inode(filp);
5607 struct trace_array *tr = inode->i_private;
12883efb 5608 struct trace_buffer *trace_buf = &tr->trace_buffer;
4d3435b8 5609 int cpu = tracing_get_cpu(inode);
c8d77183
SR
5610 struct trace_seq *s;
5611 unsigned long cnt;
c64e148a
VN
5612 unsigned long long t;
5613 unsigned long usec_rem;
c8d77183 5614
e4f2d10f 5615 s = kmalloc(sizeof(*s), GFP_KERNEL);
c8d77183 5616 if (!s)
a646365c 5617 return -ENOMEM;
c8d77183
SR
5618
5619 trace_seq_init(s);
5620
12883efb 5621 cnt = ring_buffer_entries_cpu(trace_buf->buffer, cpu);
c8d77183
SR
5622 trace_seq_printf(s, "entries: %ld\n", cnt);
5623
12883efb 5624 cnt = ring_buffer_overrun_cpu(trace_buf->buffer, cpu);
c8d77183
SR
5625 trace_seq_printf(s, "overrun: %ld\n", cnt);
5626
12883efb 5627 cnt = ring_buffer_commit_overrun_cpu(trace_buf->buffer, cpu);
c8d77183
SR
5628 trace_seq_printf(s, "commit overrun: %ld\n", cnt);
5629
12883efb 5630 cnt = ring_buffer_bytes_cpu(trace_buf->buffer, cpu);
c64e148a
VN
5631 trace_seq_printf(s, "bytes: %ld\n", cnt);
5632
58e8eedf 5633 if (trace_clocks[tr->clock_id].in_ns) {
11043d8b 5634 /* local or global for trace_clock */
12883efb 5635 t = ns2usecs(ring_buffer_oldest_event_ts(trace_buf->buffer, cpu));
11043d8b
YY
5636 usec_rem = do_div(t, USEC_PER_SEC);
5637 trace_seq_printf(s, "oldest event ts: %5llu.%06lu\n",
5638 t, usec_rem);
5639
12883efb 5640 t = ns2usecs(ring_buffer_time_stamp(trace_buf->buffer, cpu));
11043d8b
YY
5641 usec_rem = do_div(t, USEC_PER_SEC);
5642 trace_seq_printf(s, "now ts: %5llu.%06lu\n", t, usec_rem);
5643 } else {
5644 /* counter or tsc mode for trace_clock */
5645 trace_seq_printf(s, "oldest event ts: %llu\n",
12883efb 5646 ring_buffer_oldest_event_ts(trace_buf->buffer, cpu));
c64e148a 5647
11043d8b 5648 trace_seq_printf(s, "now ts: %llu\n",
12883efb 5649 ring_buffer_time_stamp(trace_buf->buffer, cpu));
11043d8b 5650 }
c64e148a 5651
12883efb 5652 cnt = ring_buffer_dropped_events_cpu(trace_buf->buffer, cpu);
884bfe89
SP
5653 trace_seq_printf(s, "dropped events: %ld\n", cnt);
5654
12883efb 5655 cnt = ring_buffer_read_events_cpu(trace_buf->buffer, cpu);
ad964704
SRRH
5656 trace_seq_printf(s, "read events: %ld\n", cnt);
5657
5ac48378
SRRH
5658 count = simple_read_from_buffer(ubuf, count, ppos,
5659 s->buffer, trace_seq_used(s));
c8d77183
SR
5660
5661 kfree(s);
5662
5663 return count;
5664}
5665
5666static const struct file_operations tracing_stats_fops = {
4d3435b8 5667 .open = tracing_open_generic_tr,
c8d77183 5668 .read = tracing_stats_read,
b444786f 5669 .llseek = generic_file_llseek,
4d3435b8 5670 .release = tracing_release_generic_tr,
c8d77183
SR
5671};
5672
bc0c38d1
SR
5673#ifdef CONFIG_DYNAMIC_FTRACE
5674
b807c3d0
SR
5675int __weak ftrace_arch_read_dyn_info(char *buf, int size)
5676{
5677 return 0;
5678}
5679
bc0c38d1 5680static ssize_t
b807c3d0 5681tracing_read_dyn_info(struct file *filp, char __user *ubuf,
bc0c38d1
SR
5682 size_t cnt, loff_t *ppos)
5683{
a26a2a27
SR
5684 static char ftrace_dyn_info_buffer[1024];
5685 static DEFINE_MUTEX(dyn_info_mutex);
bc0c38d1 5686 unsigned long *p = filp->private_data;
b807c3d0 5687 char *buf = ftrace_dyn_info_buffer;
a26a2a27 5688 int size = ARRAY_SIZE(ftrace_dyn_info_buffer);
bc0c38d1
SR
5689 int r;
5690
b807c3d0
SR
5691 mutex_lock(&dyn_info_mutex);
5692 r = sprintf(buf, "%ld ", *p);
4bf39a94 5693
a26a2a27 5694 r += ftrace_arch_read_dyn_info(buf+r, (size-1)-r);
b807c3d0
SR
5695 buf[r++] = '\n';
5696
5697 r = simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
5698
5699 mutex_unlock(&dyn_info_mutex);
5700
5701 return r;
bc0c38d1
SR
5702}
5703
5e2336a0 5704static const struct file_operations tracing_dyn_info_fops = {
4bf39a94 5705 .open = tracing_open_generic,
b807c3d0 5706 .read = tracing_read_dyn_info,
b444786f 5707 .llseek = generic_file_llseek,
bc0c38d1 5708};
77fd5c15 5709#endif /* CONFIG_DYNAMIC_FTRACE */
bc0c38d1 5710
77fd5c15
SRRH
5711#if defined(CONFIG_TRACER_SNAPSHOT) && defined(CONFIG_DYNAMIC_FTRACE)
/* Function probe callback without a counter: snapshot on every hit. */
static void
ftrace_snapshot(unsigned long ip, unsigned long parent_ip, void **data)
{
	tracing_snapshot();
}
bc0c38d1 5717
77fd5c15
SRRH
/*
 * Function probe callback with a counter. The probe's data slot itself is
 * used as the counter: nothing happens once it has reached 0, a value of
 * -1 means "unlimited" and is never decremented, any other value is
 * decremented before the snapshot is taken.
 */
static void
ftrace_count_snapshot(unsigned long ip, unsigned long parent_ip, void **data)
{
	unsigned long *remaining = (unsigned long *)data;

	if (*remaining == 0)
		return;

	if (*remaining != -1)
		*remaining -= 1;

	tracing_snapshot();
}
5731
/*
 * Print callback shared by both snapshot probe ops: emits
 * "<function>:snapshot:unlimited" when @data is -1 and
 * "<function>:snapshot:count=<n>" otherwise.
 */
static int
ftrace_snapshot_print(struct seq_file *m, unsigned long ip,
		      struct ftrace_probe_ops *ops, void *data)
{
	long remaining = (long)data;

	seq_printf(m, "%ps:", (void *)ip);
	seq_puts(m, "snapshot");

	if (remaining != -1)
		seq_printf(m, ":count=%ld\n", remaining);
	else
		seq_puts(m, ":unlimited\n");

	return 0;
}
5749
5750static struct ftrace_probe_ops snapshot_probe_ops = {
5751 .func = ftrace_snapshot,
5752 .print = ftrace_snapshot_print,
5753};
5754
5755static struct ftrace_probe_ops snapshot_count_probe_ops = {
5756 .func = ftrace_count_snapshot,
5757 .print = ftrace_snapshot_print,
5758};
5759
5760static int
5761ftrace_trace_snapshot_callback(struct ftrace_hash *hash,
5762 char *glob, char *cmd, char *param, int enable)
5763{
5764 struct ftrace_probe_ops *ops;
5765 void *count = (void *)-1;
5766 char *number;
5767 int ret;
5768
5769 /* hash funcs only work with set_ftrace_filter */
5770 if (!enable)
5771 return -EINVAL;
5772
5773 ops = param ? &snapshot_count_probe_ops : &snapshot_probe_ops;
5774
5775 if (glob[0] == '!') {
5776 unregister_ftrace_function_probe_func(glob+1, ops);
5777 return 0;
5778 }
5779
5780 if (!param)
5781 goto out_reg;
5782
5783 number = strsep(&param, ":");
5784
5785 if (!strlen(number))
5786 goto out_reg;
5787
5788 /*
5789 * We use the callback data field (which is a pointer)
5790 * as our counter.
5791 */
5792 ret = kstrtoul(number, 0, (unsigned long *)&count);
5793 if (ret)
5794 return ret;
5795
5796 out_reg:
5797 ret = register_ftrace_function_probe(glob, ops, count);
5798
5799 if (ret >= 0)
5800 alloc_snapshot(&global_trace);
5801
5802 return ret < 0 ? ret : 0;
5803}
5804
5805static struct ftrace_func_command ftrace_snapshot_cmd = {
5806 .name = "snapshot",
5807 .func = ftrace_trace_snapshot_callback,
5808};
5809
38de93ab 5810static __init int register_snapshot_cmd(void)
77fd5c15
SRRH
5811{
5812 return register_ftrace_command(&ftrace_snapshot_cmd);
5813}
5814#else
38de93ab 5815static inline __init int register_snapshot_cmd(void) { return 0; }
77fd5c15 5816#endif /* defined(CONFIG_TRACER_SNAPSHOT) && defined(CONFIG_DYNAMIC_FTRACE) */
bc0c38d1 5817
c6028948 5818static struct dentry *tracing_init_dentry_tr(struct trace_array *tr)
bc0c38d1 5819{
2b6080f2
SR
5820 if (tr->dir)
5821 return tr->dir;
bc0c38d1 5822
3e1f60b8 5823 if (!debugfs_initialized())
14a5ae40 5824 return ERR_PTR(-ENODEV);
3e1f60b8 5825
2b6080f2
SR
5826 if (tr->flags & TRACE_ARRAY_FL_GLOBAL)
5827 tr->dir = debugfs_create_dir("tracing", NULL);
bc0c38d1 5828
687c878a
J
5829 if (!tr->dir)
5830 pr_warn_once("Could not create debugfs directory 'tracing'\n");
bc0c38d1 5831
2b6080f2 5832 return tr->dir;
bc0c38d1
SR
5833}
5834
2b6080f2
SR
5835struct dentry *tracing_init_dentry(void)
5836{
5837 return tracing_init_dentry_tr(&global_trace);
5838}
b04cc6b1 5839
2b6080f2 5840static struct dentry *tracing_dentry_percpu(struct trace_array *tr, int cpu)
b04cc6b1 5841{
b04cc6b1
FW
5842 struct dentry *d_tracer;
5843
2b6080f2
SR
5844 if (tr->percpu_dir)
5845 return tr->percpu_dir;
b04cc6b1 5846
2b6080f2 5847 d_tracer = tracing_init_dentry_tr(tr);
14a5ae40 5848 if (IS_ERR(d_tracer))
b04cc6b1
FW
5849 return NULL;
5850
2b6080f2 5851 tr->percpu_dir = debugfs_create_dir("per_cpu", d_tracer);
b04cc6b1 5852
2b6080f2
SR
5853 WARN_ONCE(!tr->percpu_dir,
5854 "Could not create debugfs directory 'per_cpu/%d'\n", cpu);
b04cc6b1 5855
2b6080f2 5856 return tr->percpu_dir;
b04cc6b1
FW
5857}
5858
649e9c70
ON
5859static struct dentry *
5860trace_create_cpu_file(const char *name, umode_t mode, struct dentry *parent,
5861 void *data, long cpu, const struct file_operations *fops)
5862{
5863 struct dentry *ret = trace_create_file(name, mode, parent, data, fops);
5864
5865 if (ret) /* See tracing_get_cpu() */
5866 ret->d_inode->i_cdev = (void *)(cpu + 1);
5867 return ret;
5868}
5869
2b6080f2
SR
5870static void
5871tracing_init_debugfs_percpu(struct trace_array *tr, long cpu)
b04cc6b1 5872{
2b6080f2 5873 struct dentry *d_percpu = tracing_dentry_percpu(tr, cpu);
5452af66 5874 struct dentry *d_cpu;
dd49a38c 5875 char cpu_dir[30]; /* 30 characters should be more than enough */
b04cc6b1 5876
0a3d7ce7
NK
5877 if (!d_percpu)
5878 return;
5879
dd49a38c 5880 snprintf(cpu_dir, 30, "cpu%ld", cpu);
8656e7a2
FW
5881 d_cpu = debugfs_create_dir(cpu_dir, d_percpu);
5882 if (!d_cpu) {
5883 pr_warning("Could not create debugfs '%s' entry\n", cpu_dir);
5884 return;
5885 }
b04cc6b1 5886
8656e7a2 5887 /* per cpu trace_pipe */
649e9c70 5888 trace_create_cpu_file("trace_pipe", 0444, d_cpu,
15544209 5889 tr, cpu, &tracing_pipe_fops);
b04cc6b1
FW
5890
5891 /* per cpu trace */
649e9c70 5892 trace_create_cpu_file("trace", 0644, d_cpu,
6484c71c 5893 tr, cpu, &tracing_fops);
7f96f93f 5894
649e9c70 5895 trace_create_cpu_file("trace_pipe_raw", 0444, d_cpu,
46ef2be0 5896 tr, cpu, &tracing_buffers_fops);
7f96f93f 5897
649e9c70 5898 trace_create_cpu_file("stats", 0444, d_cpu,
4d3435b8 5899 tr, cpu, &tracing_stats_fops);
438ced17 5900
649e9c70 5901 trace_create_cpu_file("buffer_size_kb", 0444, d_cpu,
0bc392ee 5902 tr, cpu, &tracing_entries_fops);
f1affcaa
SRRH
5903
5904#ifdef CONFIG_TRACER_SNAPSHOT
649e9c70 5905 trace_create_cpu_file("snapshot", 0644, d_cpu,
6484c71c 5906 tr, cpu, &snapshot_fops);
6de58e62 5907
649e9c70 5908 trace_create_cpu_file("snapshot_raw", 0444, d_cpu,
46ef2be0 5909 tr, cpu, &snapshot_raw_fops);
f1affcaa 5910#endif
b04cc6b1
FW
5911}
5912
60a11774
SR
5913#ifdef CONFIG_FTRACE_SELFTEST
5914/* Let selftest have access to static functions in this file */
5915#include "trace_selftest.c"
5916#endif
5917
577b785f
SR
/* Ties one tracer option to the debugfs file that exposes it. */
struct trace_option_dentry {
	struct tracer_opt	*opt;	/* the option; its ->bit is tested in flags->val */
	struct tracer_flags	*flags;	/* flag word the option bit lives in */
	struct trace_array	*tr;	/* trace array passed to __set_tracer_option() */
	struct dentry		*entry;	/* file created for this option */
};
5924
5925static ssize_t
5926trace_options_read(struct file *filp, char __user *ubuf, size_t cnt,
5927 loff_t *ppos)
5928{
5929 struct trace_option_dentry *topt = filp->private_data;
5930 char *buf;
5931
5932 if (topt->flags->val & topt->opt->bit)
5933 buf = "1\n";
5934 else
5935 buf = "0\n";
5936
5937 return simple_read_from_buffer(ubuf, cnt, ppos, buf, 2);
5938}
5939
5940static ssize_t
5941trace_options_write(struct file *filp, const char __user *ubuf, size_t cnt,
5942 loff_t *ppos)
5943{
5944 struct trace_option_dentry *topt = filp->private_data;
5945 unsigned long val;
577b785f
SR
5946 int ret;
5947
22fe9b54
PH
5948 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
5949 if (ret)
577b785f
SR
5950 return ret;
5951
8d18eaaf
LZ
5952 if (val != 0 && val != 1)
5953 return -EINVAL;
577b785f 5954
8d18eaaf 5955 if (!!(topt->flags->val & topt->opt->bit) != val) {
577b785f 5956 mutex_lock(&trace_types_lock);
8c1a49ae 5957 ret = __set_tracer_option(topt->tr, topt->flags,
c757bea9 5958 topt->opt, !val);
577b785f
SR
5959 mutex_unlock(&trace_types_lock);
5960 if (ret)
5961 return ret;
577b785f
SR
5962 }
5963
5964 *ppos += cnt;
5965
5966 return cnt;
5967}
5968
5969
5970static const struct file_operations trace_options_fops = {
5971 .open = tracing_open_generic,
5972 .read = trace_options_read,
5973 .write = trace_options_write,
b444786f 5974 .llseek = generic_file_llseek,
577b785f
SR
5975};
5976
a8259075
SR
5977static ssize_t
5978trace_options_core_read(struct file *filp, char __user *ubuf, size_t cnt,
5979 loff_t *ppos)
5980{
5981 long index = (long)filp->private_data;
5982 char *buf;
5983
5984 if (trace_flags & (1 << index))
5985 buf = "1\n";
5986 else
5987 buf = "0\n";
5988
5989 return simple_read_from_buffer(ubuf, cnt, ppos, buf, 2);
5990}
5991
5992static ssize_t
5993trace_options_core_write(struct file *filp, const char __user *ubuf, size_t cnt,
5994 loff_t *ppos)
5995{
2b6080f2 5996 struct trace_array *tr = &global_trace;
a8259075 5997 long index = (long)filp->private_data;
a8259075
SR
5998 unsigned long val;
5999 int ret;
6000
22fe9b54
PH
6001 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
6002 if (ret)
a8259075
SR
6003 return ret;
6004
f2d84b65 6005 if (val != 0 && val != 1)
a8259075 6006 return -EINVAL;
69d34da2
SRRH
6007
6008 mutex_lock(&trace_types_lock);
2b6080f2 6009 ret = set_tracer_flag(tr, 1 << index, val);
69d34da2 6010 mutex_unlock(&trace_types_lock);
a8259075 6011
613f04a0
SRRH
6012 if (ret < 0)
6013 return ret;
6014
a8259075
SR
6015 *ppos += cnt;
6016
6017 return cnt;
6018}
6019
a8259075
SR
6020static const struct file_operations trace_options_core_fops = {
6021 .open = tracing_open_generic,
6022 .read = trace_options_core_read,
6023 .write = trace_options_core_write,
b444786f 6024 .llseek = generic_file_llseek,
a8259075
SR
6025};
6026
5452af66 6027struct dentry *trace_create_file(const char *name,
f4ae40a6 6028 umode_t mode,
5452af66
FW
6029 struct dentry *parent,
6030 void *data,
6031 const struct file_operations *fops)
6032{
6033 struct dentry *ret;
6034
6035 ret = debugfs_create_file(name, mode, parent, data, fops);
6036 if (!ret)
6037 pr_warning("Could not create debugfs '%s' entry\n", name);
6038
6039 return ret;
6040}
6041
6042
2b6080f2 6043static struct dentry *trace_options_init_dentry(struct trace_array *tr)
a8259075
SR
6044{
6045 struct dentry *d_tracer;
a8259075 6046
2b6080f2
SR
6047 if (tr->options)
6048 return tr->options;
a8259075 6049
2b6080f2 6050 d_tracer = tracing_init_dentry_tr(tr);
14a5ae40 6051 if (IS_ERR(d_tracer))
a8259075
SR
6052 return NULL;
6053
2b6080f2
SR
6054 tr->options = debugfs_create_dir("options", d_tracer);
6055 if (!tr->options) {
a8259075
SR
6056 pr_warning("Could not create debugfs directory 'options'\n");
6057 return NULL;
6058 }
6059
2b6080f2 6060 return tr->options;
a8259075
SR
6061}
6062
577b785f 6063static void
2b6080f2
SR
6064create_trace_option_file(struct trace_array *tr,
6065 struct trace_option_dentry *topt,
577b785f
SR
6066 struct tracer_flags *flags,
6067 struct tracer_opt *opt)
6068{
6069 struct dentry *t_options;
577b785f 6070
2b6080f2 6071 t_options = trace_options_init_dentry(tr);
577b785f
SR
6072 if (!t_options)
6073 return;
6074
6075 topt->flags = flags;
6076 topt->opt = opt;
2b6080f2 6077 topt->tr = tr;
577b785f 6078
5452af66 6079 topt->entry = trace_create_file(opt->name, 0644, t_options, topt,
577b785f
SR
6080 &trace_options_fops);
6081
577b785f
SR
6082}
6083
6084static struct trace_option_dentry *
2b6080f2 6085create_trace_option_files(struct trace_array *tr, struct tracer *tracer)
577b785f
SR
6086{
6087 struct trace_option_dentry *topts;
6088 struct tracer_flags *flags;
6089 struct tracer_opt *opts;
6090 int cnt;
6091
6092 if (!tracer)
6093 return NULL;
6094
6095 flags = tracer->flags;
6096
6097 if (!flags || !flags->opts)
6098 return NULL;
6099
6100 opts = flags->opts;
6101
6102 for (cnt = 0; opts[cnt].name; cnt++)
6103 ;
6104
0cfe8245 6105 topts = kcalloc(cnt + 1, sizeof(*topts), GFP_KERNEL);
577b785f
SR
6106 if (!topts)
6107 return NULL;
6108
6109 for (cnt = 0; opts[cnt].name; cnt++)
2b6080f2 6110 create_trace_option_file(tr, &topts[cnt], flags,
577b785f
SR
6111 &opts[cnt]);
6112
6113 return topts;
6114}
6115
6116static void
6117destroy_trace_option_files(struct trace_option_dentry *topts)
6118{
6119 int cnt;
6120
6121 if (!topts)
6122 return;
6123
3f4d8f78
FF
6124 for (cnt = 0; topts[cnt].opt; cnt++)
6125 debugfs_remove(topts[cnt].entry);
577b785f
SR
6126
6127 kfree(topts);
6128}
6129
a8259075 6130static struct dentry *
2b6080f2
SR
6131create_trace_option_core_file(struct trace_array *tr,
6132 const char *option, long index)
a8259075
SR
6133{
6134 struct dentry *t_options;
a8259075 6135
2b6080f2 6136 t_options = trace_options_init_dentry(tr);
a8259075
SR
6137 if (!t_options)
6138 return NULL;
6139
5452af66 6140 return trace_create_file(option, 0644, t_options, (void *)index,
a8259075 6141 &trace_options_core_fops);
a8259075
SR
6142}
6143
2b6080f2 6144static __init void create_trace_options_dir(struct trace_array *tr)
a8259075
SR
6145{
6146 struct dentry *t_options;
a8259075
SR
6147 int i;
6148
2b6080f2 6149 t_options = trace_options_init_dentry(tr);
a8259075
SR
6150 if (!t_options)
6151 return;
6152
5452af66 6153 for (i = 0; trace_options[i]; i++)
2b6080f2 6154 create_trace_option_core_file(tr, trace_options[i], i);
a8259075
SR
6155}
6156
499e5470
SR
6157static ssize_t
6158rb_simple_read(struct file *filp, char __user *ubuf,
6159 size_t cnt, loff_t *ppos)
6160{
348f0fc2 6161 struct trace_array *tr = filp->private_data;
499e5470
SR
6162 char buf[64];
6163 int r;
6164
10246fa3 6165 r = tracer_tracing_is_on(tr);
499e5470
SR
6166 r = sprintf(buf, "%d\n", r);
6167
6168 return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
6169}
6170
6171static ssize_t
6172rb_simple_write(struct file *filp, const char __user *ubuf,
6173 size_t cnt, loff_t *ppos)
6174{
348f0fc2 6175 struct trace_array *tr = filp->private_data;
12883efb 6176 struct ring_buffer *buffer = tr->trace_buffer.buffer;
499e5470
SR
6177 unsigned long val;
6178 int ret;
6179
6180 ret = kstrtoul_from_user(ubuf, cnt, 10, &val);
6181 if (ret)
6182 return ret;
6183
6184 if (buffer) {
2df8f8a6
SR
6185 mutex_lock(&trace_types_lock);
6186 if (val) {
10246fa3 6187 tracer_tracing_on(tr);
2b6080f2
SR
6188 if (tr->current_trace->start)
6189 tr->current_trace->start(tr);
2df8f8a6 6190 } else {
10246fa3 6191 tracer_tracing_off(tr);
2b6080f2
SR
6192 if (tr->current_trace->stop)
6193 tr->current_trace->stop(tr);
2df8f8a6
SR
6194 }
6195 mutex_unlock(&trace_types_lock);
499e5470
SR
6196 }
6197
6198 (*ppos)++;
6199
6200 return cnt;
6201}
6202
6203static const struct file_operations rb_simple_fops = {
7b85af63 6204 .open = tracing_open_generic_tr,
499e5470
SR
6205 .read = rb_simple_read,
6206 .write = rb_simple_write,
7b85af63 6207 .release = tracing_release_generic_tr,
499e5470
SR
6208 .llseek = default_llseek,
6209};
6210
277ba044
SR
/* Dentry of the "instances" directory; set by create_trace_instances() */
struct dentry *trace_instance_dir;

/* Defined further down; needed earlier by new_instance_create() */
static void init_tracer_debugfs(struct trace_array *tr, struct dentry *d_tracer);
6215
55034cd6
SRRH
6216static int
6217allocate_trace_buffer(struct trace_array *tr, struct trace_buffer *buf, int size)
277ba044
SR
6218{
6219 enum ring_buffer_flags rb_flags;
737223fb
SRRH
6220
6221 rb_flags = trace_flags & TRACE_ITER_OVERWRITE ? RB_FL_OVERWRITE : 0;
6222
dced341b
SRRH
6223 buf->tr = tr;
6224
55034cd6
SRRH
6225 buf->buffer = ring_buffer_alloc(size, rb_flags);
6226 if (!buf->buffer)
6227 return -ENOMEM;
737223fb 6228
55034cd6
SRRH
6229 buf->data = alloc_percpu(struct trace_array_cpu);
6230 if (!buf->data) {
6231 ring_buffer_free(buf->buffer);
6232 return -ENOMEM;
6233 }
737223fb 6234
737223fb
SRRH
6235 /* Allocate the first page for all buffers */
6236 set_buffer_entries(&tr->trace_buffer,
6237 ring_buffer_size(tr->trace_buffer.buffer, 0));
6238
55034cd6
SRRH
6239 return 0;
6240}
737223fb 6241
55034cd6
SRRH
6242static int allocate_trace_buffers(struct trace_array *tr, int size)
6243{
6244 int ret;
737223fb 6245
55034cd6
SRRH
6246 ret = allocate_trace_buffer(tr, &tr->trace_buffer, size);
6247 if (ret)
6248 return ret;
737223fb 6249
55034cd6
SRRH
6250#ifdef CONFIG_TRACER_MAX_TRACE
6251 ret = allocate_trace_buffer(tr, &tr->max_buffer,
6252 allocate_snapshot ? size : 1);
6253 if (WARN_ON(ret)) {
737223fb 6254 ring_buffer_free(tr->trace_buffer.buffer);
55034cd6
SRRH
6255 free_percpu(tr->trace_buffer.data);
6256 return -ENOMEM;
6257 }
6258 tr->allocated_snapshot = allocate_snapshot;
737223fb 6259
55034cd6
SRRH
6260 /*
6261 * Only the top level trace array gets its snapshot allocated
6262 * from the kernel command line.
6263 */
6264 allocate_snapshot = false;
737223fb 6265#endif
55034cd6 6266 return 0;
737223fb
SRRH
6267}
6268
f0b70cc4
SRRH
6269static void free_trace_buffer(struct trace_buffer *buf)
6270{
6271 if (buf->buffer) {
6272 ring_buffer_free(buf->buffer);
6273 buf->buffer = NULL;
6274 free_percpu(buf->data);
6275 buf->data = NULL;
6276 }
6277}
6278
23aaa3c1
SRRH
6279static void free_trace_buffers(struct trace_array *tr)
6280{
6281 if (!tr)
6282 return;
6283
f0b70cc4 6284 free_trace_buffer(&tr->trace_buffer);
23aaa3c1
SRRH
6285
6286#ifdef CONFIG_TRACER_MAX_TRACE
f0b70cc4 6287 free_trace_buffer(&tr->max_buffer);
23aaa3c1
SRRH
6288#endif
6289}
6290
737223fb
SRRH
6291static int new_instance_create(const char *name)
6292{
277ba044
SR
6293 struct trace_array *tr;
6294 int ret;
277ba044
SR
6295
6296 mutex_lock(&trace_types_lock);
6297
6298 ret = -EEXIST;
6299 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
6300 if (tr->name && strcmp(tr->name, name) == 0)
6301 goto out_unlock;
6302 }
6303
6304 ret = -ENOMEM;
6305 tr = kzalloc(sizeof(*tr), GFP_KERNEL);
6306 if (!tr)
6307 goto out_unlock;
6308
6309 tr->name = kstrdup(name, GFP_KERNEL);
6310 if (!tr->name)
6311 goto out_free_tr;
6312
ccfe9e42
AL
6313 if (!alloc_cpumask_var(&tr->tracing_cpumask, GFP_KERNEL))
6314 goto out_free_tr;
6315
6316 cpumask_copy(tr->tracing_cpumask, cpu_all_mask);
6317
277ba044
SR
6318 raw_spin_lock_init(&tr->start_lock);
6319
0b9b12c1
SRRH
6320 tr->max_lock = (arch_spinlock_t)__ARCH_SPIN_LOCK_UNLOCKED;
6321
277ba044
SR
6322 tr->current_trace = &nop_trace;
6323
6324 INIT_LIST_HEAD(&tr->systems);
6325 INIT_LIST_HEAD(&tr->events);
6326
737223fb 6327 if (allocate_trace_buffers(tr, trace_buf_size) < 0)
277ba044
SR
6328 goto out_free_tr;
6329
277ba044
SR
6330 tr->dir = debugfs_create_dir(name, trace_instance_dir);
6331 if (!tr->dir)
6332 goto out_free_tr;
6333
6334 ret = event_trace_add_tracer(tr->dir, tr);
609e85a7
AL
6335 if (ret) {
6336 debugfs_remove_recursive(tr->dir);
277ba044 6337 goto out_free_tr;
609e85a7 6338 }
277ba044
SR
6339
6340 init_tracer_debugfs(tr, tr->dir);
6341
6342 list_add(&tr->list, &ftrace_trace_arrays);
6343
6344 mutex_unlock(&trace_types_lock);
6345
6346 return 0;
6347
6348 out_free_tr:
23aaa3c1 6349 free_trace_buffers(tr);
ccfe9e42 6350 free_cpumask_var(tr->tracing_cpumask);
277ba044
SR
6351 kfree(tr->name);
6352 kfree(tr);
6353
6354 out_unlock:
6355 mutex_unlock(&trace_types_lock);
6356
6357 return ret;
6358
6359}
6360
0c8916c3
SR
6361static int instance_delete(const char *name)
6362{
6363 struct trace_array *tr;
6364 int found = 0;
6365 int ret;
6366
6367 mutex_lock(&trace_types_lock);
6368
6369 ret = -ENODEV;
6370 list_for_each_entry(tr, &ftrace_trace_arrays, list) {
6371 if (tr->name && strcmp(tr->name, name) == 0) {
6372 found = 1;
6373 break;
6374 }
6375 }
6376 if (!found)
6377 goto out_unlock;
6378
a695cb58 6379 ret = -EBUSY;
cf6ab6d9 6380 if (tr->ref || (tr->current_trace && tr->current_trace->ref))
a695cb58
SRRH
6381 goto out_unlock;
6382
0c8916c3
SR
6383 list_del(&tr->list);
6384
6b450d25 6385 tracing_set_nop(tr);
0c8916c3 6386 event_trace_del_tracer(tr);
591dffda 6387 ftrace_destroy_function_files(tr);
0c8916c3 6388 debugfs_remove_recursive(tr->dir);
a9fcaaac 6389 free_trace_buffers(tr);
0c8916c3
SR
6390
6391 kfree(tr->name);
6392 kfree(tr);
6393
6394 ret = 0;
6395
6396 out_unlock:
6397 mutex_unlock(&trace_types_lock);
6398
6399 return ret;
6400}
6401
277ba044
SR
6402static int instance_mkdir (struct inode *inode, struct dentry *dentry, umode_t mode)
6403{
6404 struct dentry *parent;
6405 int ret;
6406
6407 /* Paranoid: Make sure the parent is the "instances" directory */
946e51f2 6408 parent = hlist_entry(inode->i_dentry.first, struct dentry, d_u.d_alias);
277ba044
SR
6409 if (WARN_ON_ONCE(parent != trace_instance_dir))
6410 return -ENOENT;
6411
6412 /*
6413 * The inode mutex is locked, but debugfs_create_dir() will also
6414 * take the mutex. As the instances directory can not be destroyed
6415 * or changed in any other way, it is safe to unlock it, and
6416 * let the dentry try. If two users try to make the same dir at
6417 * the same time, then the new_instance_create() will determine the
6418 * winner.
6419 */
6420 mutex_unlock(&inode->i_mutex);
6421
6422 ret = new_instance_create(dentry->d_iname);
6423
6424 mutex_lock(&inode->i_mutex);
6425
6426 return ret;
6427}
6428
0c8916c3
SR
6429static int instance_rmdir(struct inode *inode, struct dentry *dentry)
6430{
6431 struct dentry *parent;
6432 int ret;
6433
6434 /* Paranoid: Make sure the parent is the "instances" directory */
946e51f2 6435 parent = hlist_entry(inode->i_dentry.first, struct dentry, d_u.d_alias);
0c8916c3
SR
6436 if (WARN_ON_ONCE(parent != trace_instance_dir))
6437 return -ENOENT;
6438
6439 /* The caller did a dget() on dentry */
6440 mutex_unlock(&dentry->d_inode->i_mutex);
6441
6442 /*
6443 * The inode mutex is locked, but debugfs_create_dir() will also
6444 * take the mutex. As the instances directory can not be destroyed
6445 * or changed in any other way, it is safe to unlock it, and
6446 * let the dentry try. If two users try to make the same dir at
6447 * the same time, then the instance_delete() will determine the
6448 * winner.
6449 */
6450 mutex_unlock(&inode->i_mutex);
6451
6452 ret = instance_delete(dentry->d_iname);
6453
6454 mutex_lock_nested(&inode->i_mutex, I_MUTEX_PARENT);
6455 mutex_lock(&dentry->d_inode->i_mutex);
6456
6457 return ret;
6458}
6459
277ba044
SR
6460static const struct inode_operations instance_dir_inode_operations = {
6461 .lookup = simple_lookup,
6462 .mkdir = instance_mkdir,
0c8916c3 6463 .rmdir = instance_rmdir,
277ba044
SR
6464};
6465
6466static __init void create_trace_instances(struct dentry *d_tracer)
6467{
6468 trace_instance_dir = debugfs_create_dir("instances", d_tracer);
6469 if (WARN_ON(!trace_instance_dir))
6470 return;
6471
6472 /* Hijack the dir inode operations, to allow mkdir */
6473 trace_instance_dir->d_inode->i_op = &instance_dir_inode_operations;
6474}
6475
2b6080f2
SR
6476static void
6477init_tracer_debugfs(struct trace_array *tr, struct dentry *d_tracer)
6478{
121aaee7 6479 int cpu;
2b6080f2 6480
607e2ea1
SRRH
6481 trace_create_file("available_tracers", 0444, d_tracer,
6482 tr, &show_traces_fops);
6483
6484 trace_create_file("current_tracer", 0644, d_tracer,
6485 tr, &set_tracer_fops);
6486
ccfe9e42
AL
6487 trace_create_file("tracing_cpumask", 0644, d_tracer,
6488 tr, &tracing_cpumask_fops);
6489
2b6080f2
SR
6490 trace_create_file("trace_options", 0644, d_tracer,
6491 tr, &tracing_iter_fops);
6492
6493 trace_create_file("trace", 0644, d_tracer,
6484c71c 6494 tr, &tracing_fops);
2b6080f2
SR
6495
6496 trace_create_file("trace_pipe", 0444, d_tracer,
15544209 6497 tr, &tracing_pipe_fops);
2b6080f2
SR
6498
6499 trace_create_file("buffer_size_kb", 0644, d_tracer,
0bc392ee 6500 tr, &tracing_entries_fops);
2b6080f2
SR
6501
6502 trace_create_file("buffer_total_size_kb", 0444, d_tracer,
6503 tr, &tracing_total_entries_fops);
6504
238ae93d 6505 trace_create_file("free_buffer", 0200, d_tracer,
2b6080f2
SR
6506 tr, &tracing_free_buffer_fops);
6507
6508 trace_create_file("trace_marker", 0220, d_tracer,
6509 tr, &tracing_mark_fops);
6510
6511 trace_create_file("trace_clock", 0644, d_tracer, tr,
6512 &trace_clock_fops);
6513
6514 trace_create_file("tracing_on", 0644, d_tracer,
6484c71c 6515 tr, &rb_simple_fops);
ce9bae55 6516
6d9b3fa5
SRRH
6517#ifdef CONFIG_TRACER_MAX_TRACE
6518 trace_create_file("tracing_max_latency", 0644, d_tracer,
6519 &tr->max_latency, &tracing_max_lat_fops);
6520#endif
6521
591dffda
SRRH
6522 if (ftrace_create_function_files(tr, d_tracer))
6523 WARN(1, "Could not allocate function filter files");
6524
ce9bae55
SRRH
6525#ifdef CONFIG_TRACER_SNAPSHOT
6526 trace_create_file("snapshot", 0644, d_tracer,
6484c71c 6527 tr, &snapshot_fops);
ce9bae55 6528#endif
121aaee7
SRRH
6529
6530 for_each_tracing_cpu(cpu)
6531 tracing_init_debugfs_percpu(tr, cpu);
6532
2b6080f2
SR
6533}
6534
b5ad384e 6535static __init int tracer_init_debugfs(void)
bc0c38d1
SR
6536{
6537 struct dentry *d_tracer;
bc0c38d1 6538
7e53bd42
LJ
6539 trace_access_lock_init();
6540
bc0c38d1 6541 d_tracer = tracing_init_dentry();
14a5ae40 6542 if (IS_ERR(d_tracer))
ed6f1c99 6543 return 0;
bc0c38d1 6544
2b6080f2 6545 init_tracer_debugfs(&global_trace, d_tracer);
bc0c38d1 6546
5452af66 6547 trace_create_file("tracing_thresh", 0644, d_tracer,
6508fa76 6548 &global_trace, &tracing_thresh_fops);
a8259075 6549
339ae5d3 6550 trace_create_file("README", 0444, d_tracer,
5452af66
FW
6551 NULL, &tracing_readme_fops);
6552
69abe6a5
AP
6553 trace_create_file("saved_cmdlines", 0444, d_tracer,
6554 NULL, &tracing_saved_cmdlines_fops);
5bf9a1ee 6555
939c7a4f
YY
6556 trace_create_file("saved_cmdlines_size", 0644, d_tracer,
6557 NULL, &tracing_saved_cmdlines_size_fops);
6558
bc0c38d1 6559#ifdef CONFIG_DYNAMIC_FTRACE
5452af66
FW
6560 trace_create_file("dyn_ftrace_total_info", 0444, d_tracer,
6561 &ftrace_update_tot_cnt, &tracing_dyn_info_fops);
bc0c38d1 6562#endif
b04cc6b1 6563
277ba044 6564 create_trace_instances(d_tracer);
5452af66 6565
2b6080f2 6566 create_trace_options_dir(&global_trace);
b04cc6b1 6567
b5ad384e 6568 return 0;
bc0c38d1
SR
6569}
6570
3f5a54e3
SR
6571static int trace_panic_handler(struct notifier_block *this,
6572 unsigned long event, void *unused)
6573{
944ac425 6574 if (ftrace_dump_on_oops)
cecbca96 6575 ftrace_dump(ftrace_dump_on_oops);
3f5a54e3
SR
6576 return NOTIFY_OK;
6577}
6578
6579static struct notifier_block trace_panic_notifier = {
6580 .notifier_call = trace_panic_handler,
6581 .next = NULL,
6582 .priority = 150 /* priority: INT_MAX >= x >= 0 */
6583};
6584
6585static int trace_die_handler(struct notifier_block *self,
6586 unsigned long val,
6587 void *data)
6588{
6589 switch (val) {
6590 case DIE_OOPS:
944ac425 6591 if (ftrace_dump_on_oops)
cecbca96 6592 ftrace_dump(ftrace_dump_on_oops);
3f5a54e3
SR
6593 break;
6594 default:
6595 break;
6596 }
6597 return NOTIFY_OK;
6598}
6599
6600static struct notifier_block trace_die_notifier = {
6601 .notifier_call = trace_die_handler,
6602 .priority = 200
6603};
6604
6605/*
6606 * printk is set to max of 1024, we really don't need it that big.
6607 * Nothing should be printing 1000 characters anyway.
6608 */
6609#define TRACE_MAX_PRINT 1000
6610
6611/*
6612 * Define here KERN_TRACE so that we have one place to modify
6613 * it if we decide to change what log level the ftrace dump
6614 * should be at.
6615 */
428aee14 6616#define KERN_TRACE KERN_EMERG
3f5a54e3 6617
955b61e5 6618void
3f5a54e3
SR
6619trace_printk_seq(struct trace_seq *s)
6620{
6621 /* Probably should print a warning here. */
3a161d99
SRRH
6622 if (s->seq.len >= TRACE_MAX_PRINT)
6623 s->seq.len = TRACE_MAX_PRINT;
3f5a54e3 6624
820b75f6
SRRH
6625 /*
6626 * More paranoid code. Although the buffer size is set to
6627 * PAGE_SIZE, and TRACE_MAX_PRINT is 1000, this is just
6628 * an extra layer of protection.
6629 */
6630 if (WARN_ON_ONCE(s->seq.len >= s->seq.size))
6631 s->seq.len = s->seq.size - 1;
3f5a54e3
SR
6632
6633 /* should be zero ended, but we are paranoid. */
3a161d99 6634 s->buffer[s->seq.len] = 0;
3f5a54e3
SR
6635
6636 printk(KERN_TRACE "%s", s->buffer);
6637
f9520750 6638 trace_seq_init(s);
3f5a54e3
SR
6639}
6640
955b61e5
JW
6641void trace_init_global_iter(struct trace_iterator *iter)
6642{
6643 iter->tr = &global_trace;
2b6080f2 6644 iter->trace = iter->tr->current_trace;
ae3b5093 6645 iter->cpu_file = RING_BUFFER_ALL_CPUS;
12883efb 6646 iter->trace_buffer = &global_trace.trace_buffer;
b2f974d6
CS
6647
6648 if (iter->trace && iter->trace->open)
6649 iter->trace->open(iter);
6650
6651 /* Annotate start of buffers if we had overruns */
6652 if (ring_buffer_overruns(iter->trace_buffer->buffer))
6653 iter->iter_flags |= TRACE_FILE_ANNOTATE;
6654
6655 /* Output in nanoseconds only if we are using a clock in nanoseconds. */
6656 if (trace_clocks[iter->tr->clock_id].in_ns)
6657 iter->iter_flags |= TRACE_FILE_TIME_IN_NS;
955b61e5
JW
6658}
6659
7fe70b57 6660void ftrace_dump(enum ftrace_dump_mode oops_dump_mode)
3f5a54e3 6661{
3f5a54e3
SR
6662 /* use static because iter can be a bit big for the stack */
6663 static struct trace_iterator iter;
7fe70b57 6664 static atomic_t dump_running;
cf586b61 6665 unsigned int old_userobj;
d769041f
SR
6666 unsigned long flags;
6667 int cnt = 0, cpu;
3f5a54e3 6668
7fe70b57
SRRH
6669 /* Only allow one dump user at a time. */
6670 if (atomic_inc_return(&dump_running) != 1) {
6671 atomic_dec(&dump_running);
6672 return;
6673 }
3f5a54e3 6674
7fe70b57
SRRH
6675 /*
6676 * Always turn off tracing when we dump.
6677 * We don't need to show trace output of what happens
6678 * between multiple crashes.
6679 *
6680 * If the user does a sysrq-z, then they can re-enable
6681 * tracing with echo 1 > tracing_on.
6682 */
0ee6b6cf 6683 tracing_off();
cf586b61 6684
7fe70b57 6685 local_irq_save(flags);
3f5a54e3 6686
38dbe0b1 6687 /* Simulate the iterator */
955b61e5
JW
6688 trace_init_global_iter(&iter);
6689
d769041f 6690 for_each_tracing_cpu(cpu) {
12883efb 6691 atomic_inc(&per_cpu_ptr(iter.tr->trace_buffer.data, cpu)->disabled);
d769041f
SR
6692 }
6693
cf586b61
FW
6694 old_userobj = trace_flags & TRACE_ITER_SYM_USEROBJ;
6695
b54d3de9
TE
6696 /* don't look at user memory in panic mode */
6697 trace_flags &= ~TRACE_ITER_SYM_USEROBJ;
6698
cecbca96
FW
6699 switch (oops_dump_mode) {
6700 case DUMP_ALL:
ae3b5093 6701 iter.cpu_file = RING_BUFFER_ALL_CPUS;
cecbca96
FW
6702 break;
6703 case DUMP_ORIG:
6704 iter.cpu_file = raw_smp_processor_id();
6705 break;
6706 case DUMP_NONE:
6707 goto out_enable;
6708 default:
6709 printk(KERN_TRACE "Bad dumping mode, switching to all CPUs dump\n");
ae3b5093 6710 iter.cpu_file = RING_BUFFER_ALL_CPUS;
cecbca96
FW
6711 }
6712
6713 printk(KERN_TRACE "Dumping ftrace buffer:\n");
3f5a54e3 6714
7fe70b57
SRRH
6715 /* Did function tracer already get disabled? */
6716 if (ftrace_is_dead()) {
6717 printk("# WARNING: FUNCTION TRACING IS CORRUPTED\n");
6718 printk("# MAY BE MISSING FUNCTION EVENTS\n");
6719 }
6720
3f5a54e3
SR
6721 /*
6722 * We need to stop all tracing on all CPUS to read the
6723 * the next buffer. This is a bit expensive, but is
6724 * not done often. We fill all what we can read,
6725 * and then release the locks again.
6726 */
6727
3f5a54e3
SR
6728 while (!trace_empty(&iter)) {
6729
6730 if (!cnt)
6731 printk(KERN_TRACE "---------------------------------\n");
6732
6733 cnt++;
6734
6735 /* reset all but tr, trace, and overruns */
6736 memset(&iter.seq, 0,
6737 sizeof(struct trace_iterator) -
6738 offsetof(struct trace_iterator, seq));
6739 iter.iter_flags |= TRACE_FILE_LAT_FMT;
6740 iter.pos = -1;
6741
955b61e5 6742 if (trace_find_next_entry_inc(&iter) != NULL) {
74e7ff8c
LJ
6743 int ret;
6744
6745 ret = print_trace_line(&iter);
6746 if (ret != TRACE_TYPE_NO_CONSUME)
6747 trace_consume(&iter);
3f5a54e3 6748 }
b892e5c8 6749 touch_nmi_watchdog();
3f5a54e3
SR
6750
6751 trace_printk_seq(&iter.seq);
6752 }
6753
6754 if (!cnt)
6755 printk(KERN_TRACE " (ftrace buffer empty)\n");
6756 else
6757 printk(KERN_TRACE "---------------------------------\n");
6758
cecbca96 6759 out_enable:
7fe70b57 6760 trace_flags |= old_userobj;
cf586b61 6761
7fe70b57
SRRH
6762 for_each_tracing_cpu(cpu) {
6763 atomic_dec(&per_cpu_ptr(iter.trace_buffer->data, cpu)->disabled);
cf586b61 6764 }
7fe70b57 6765 atomic_dec(&dump_running);
cd891ae0 6766 local_irq_restore(flags);
3f5a54e3 6767}
a8eecf22 6768EXPORT_SYMBOL_GPL(ftrace_dump);
cf586b61 6769
3928a8a2 6770__init static int tracer_alloc_buffers(void)
bc0c38d1 6771{
73c5162a 6772 int ring_buf_size;
9e01c1b7 6773 int ret = -ENOMEM;
4c11d7ae 6774
750912fa 6775
9e01c1b7
RR
6776 if (!alloc_cpumask_var(&tracing_buffer_mask, GFP_KERNEL))
6777 goto out;
6778
ccfe9e42 6779 if (!alloc_cpumask_var(&global_trace.tracing_cpumask, GFP_KERNEL))
9e01c1b7 6780 goto out_free_buffer_mask;
4c11d7ae 6781
07d777fe
SR
6782 /* Only allocate trace_printk buffers if a trace_printk exists */
6783 if (__stop___trace_bprintk_fmt != __start___trace_bprintk_fmt)
81698831 6784 /* Must be called before global_trace.buffer is allocated */
07d777fe
SR
6785 trace_printk_init_buffers();
6786
73c5162a
SR
6787 /* To save memory, keep the ring buffer size to its minimum */
6788 if (ring_buffer_expanded)
6789 ring_buf_size = trace_buf_size;
6790 else
6791 ring_buf_size = 1;
6792
9e01c1b7 6793 cpumask_copy(tracing_buffer_mask, cpu_possible_mask);
ccfe9e42 6794 cpumask_copy(global_trace.tracing_cpumask, cpu_all_mask);
9e01c1b7 6795
2b6080f2
SR
6796 raw_spin_lock_init(&global_trace.start_lock);
6797
2c4a33ab
SRRH
6798 /* Used for event triggers */
6799 temp_buffer = ring_buffer_alloc(PAGE_SIZE, RB_FL_OVERWRITE);
6800 if (!temp_buffer)
6801 goto out_free_cpumask;
6802
939c7a4f
YY
6803 if (trace_create_savedcmd() < 0)
6804 goto out_free_temp_buffer;
6805
9e01c1b7 6806 /* TODO: make the number of buffers hot pluggable with CPUS */
737223fb 6807 if (allocate_trace_buffers(&global_trace, ring_buf_size) < 0) {
3928a8a2
SR
6808 printk(KERN_ERR "tracer: failed to allocate ring buffer!\n");
6809 WARN_ON(1);
939c7a4f 6810 goto out_free_savedcmd;
4c11d7ae 6811 }
a7603ff4 6812
499e5470
SR
6813 if (global_trace.buffer_disabled)
6814 tracing_off();
4c11d7ae 6815
e1e232ca
SR
6816 if (trace_boot_clock) {
6817 ret = tracing_set_clock(&global_trace, trace_boot_clock);
6818 if (ret < 0)
6819 pr_warning("Trace clock %s not defined, going back to default\n",
6820 trace_boot_clock);
6821 }
6822
ca164318
SRRH
6823 /*
6824 * register_tracer() might reference current_trace, so it
6825 * needs to be set before we register anything. This is
6826 * just a bootstrap of current_trace anyway.
6827 */
2b6080f2
SR
6828 global_trace.current_trace = &nop_trace;
6829
0b9b12c1
SRRH
6830 global_trace.max_lock = (arch_spinlock_t)__ARCH_SPIN_LOCK_UNLOCKED;
6831
4104d326
SRRH
6832 ftrace_init_global_array_ops(&global_trace);
6833
ca164318
SRRH
6834 register_tracer(&nop_trace);
6835
60a11774
SR
6836 /* All seems OK, enable tracing */
6837 tracing_disabled = 0;
3928a8a2 6838
3f5a54e3
SR
6839 atomic_notifier_chain_register(&panic_notifier_list,
6840 &trace_panic_notifier);
6841
6842 register_die_notifier(&trace_die_notifier);
2fc1dfbe 6843
ae63b31e
SR
6844 global_trace.flags = TRACE_ARRAY_FL_GLOBAL;
6845
6846 INIT_LIST_HEAD(&global_trace.systems);
6847 INIT_LIST_HEAD(&global_trace.events);
6848 list_add(&global_trace.list, &ftrace_trace_arrays);
6849
7bcfaf54
SR
6850 while (trace_boot_options) {
6851 char *option;
6852
6853 option = strsep(&trace_boot_options, ",");
2b6080f2 6854 trace_set_options(&global_trace, option);
7bcfaf54
SR
6855 }
6856
77fd5c15
SRRH
6857 register_snapshot_cmd();
6858
2fc1dfbe 6859 return 0;
3f5a54e3 6860
939c7a4f
YY
6861out_free_savedcmd:
6862 free_saved_cmdlines_buffer(savedcmd);
2c4a33ab
SRRH
6863out_free_temp_buffer:
6864 ring_buffer_free(temp_buffer);
9e01c1b7 6865out_free_cpumask:
ccfe9e42 6866 free_cpumask_var(global_trace.tracing_cpumask);
9e01c1b7
RR
6867out_free_buffer_mask:
6868 free_cpumask_var(tracing_buffer_mask);
6869out:
6870 return ret;
bc0c38d1 6871}
b2821ae6 6872
5f893b26
SRRH
6873void __init trace_init(void)
6874{
0daa2302
SRRH
6875 if (tracepoint_printk) {
6876 tracepoint_print_iter =
6877 kmalloc(sizeof(*tracepoint_print_iter), GFP_KERNEL);
6878 if (WARN_ON(!tracepoint_print_iter))
6879 tracepoint_printk = 0;
6880 }
5f893b26
SRRH
6881 tracer_alloc_buffers();
6882 init_ftrace_syscalls();
6883 trace_event_init();
6884}
6885
b2821ae6
SR
6886__init static int clear_boot_tracer(void)
6887{
6888 /*
6889 * The default tracer at boot buffer is an init section.
6890 * This function is called in lateinit. If we did not
6891 * find the boot tracer, then clear it out, to prevent
6892 * later registration from accessing the buffer that is
6893 * about to be freed.
6894 */
6895 if (!default_bootup_tracer)
6896 return 0;
6897
6898 printk(KERN_INFO "ftrace bootup tracer '%s' not registered.\n",
6899 default_bootup_tracer);
6900 default_bootup_tracer = NULL;
6901
6902 return 0;
6903}
6904
b5ad384e 6905fs_initcall(tracer_init_debugfs);
b2821ae6 6906late_initcall(clear_boot_tracer);