2008-05-13 03:20:42 +08:00
|
|
|
/*
|
|
|
|
* ring buffer based function tracer
|
|
|
|
*
|
|
|
|
* Copyright (C) 2007-2008 Steven Rostedt <srostedt@redhat.com>
|
|
|
|
* Copyright (C) 2008 Ingo Molnar <mingo@redhat.com>
|
|
|
|
*
|
|
|
|
* Originally taken from the RT patch by:
|
|
|
|
* Arnaldo Carvalho de Melo <acme@redhat.com>
|
|
|
|
*
|
|
|
|
* Based on code from the latency_tracer, that is:
|
|
|
|
* Copyright (C) 2004-2006 Ingo Molnar
|
|
|
|
* Copyright (C) 2004 William Lee Irwin III
|
|
|
|
*/
|
2008-12-02 11:20:19 +08:00
|
|
|
#include <linux/ring_buffer.h>
|
2008-05-13 03:20:42 +08:00
|
|
|
#include <linux/utsrelease.h>
|
2008-12-02 11:20:19 +08:00
|
|
|
#include <linux/stacktrace.h>
|
|
|
|
#include <linux/writeback.h>
|
2008-05-13 03:20:42 +08:00
|
|
|
#include <linux/kallsyms.h>
|
|
|
|
#include <linux/seq_file.h>
|
2008-07-31 10:36:46 +08:00
|
|
|
#include <linux/notifier.h>
|
2008-12-02 11:20:19 +08:00
|
|
|
#include <linux/irqflags.h>
|
2008-05-13 03:20:42 +08:00
|
|
|
#include <linux/debugfs.h>
|
2008-05-13 03:20:43 +08:00
|
|
|
#include <linux/pagemap.h>
|
2008-05-13 03:20:42 +08:00
|
|
|
#include <linux/hardirq.h>
|
|
|
|
#include <linux/linkage.h>
|
|
|
|
#include <linux/uaccess.h>
|
2008-12-02 11:20:19 +08:00
|
|
|
#include <linux/kprobes.h>
|
2008-05-13 03:20:42 +08:00
|
|
|
#include <linux/ftrace.h>
|
|
|
|
#include <linux/module.h>
|
|
|
|
#include <linux/percpu.h>
|
2008-12-02 11:20:19 +08:00
|
|
|
#include <linux/splice.h>
|
2008-07-31 10:36:46 +08:00
|
|
|
#include <linux/kdebug.h>
|
2008-05-13 03:20:42 +08:00
|
|
|
#include <linux/ctype.h>
|
|
|
|
#include <linux/init.h>
|
2008-05-13 03:20:49 +08:00
|
|
|
#include <linux/poll.h>
|
2008-05-13 03:20:42 +08:00
|
|
|
#include <linux/gfp.h>
|
|
|
|
#include <linux/fs.h>
|
2008-05-13 03:20:51 +08:00
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
#include "trace.h"
|
2008-12-24 12:24:12 +08:00
|
|
|
#include "trace_output.h"
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
#define TRACE_BUFFER_FLAGS (RB_FL_OVERWRITE)
|
|
|
|
|
2009-01-16 12:40:11 +08:00
|
|
|
unsigned long __read_mostly tracing_max_latency;
|
2008-05-13 03:20:42 +08:00
|
|
|
unsigned long __read_mostly tracing_thresh;
|
|
|
|
|
2008-12-06 10:41:33 +08:00
|
|
|
/*
|
|
|
|
* We need to change this state when a selftest is running.
|
2008-12-05 06:47:35 +08:00
|
|
|
* A selftest will look into the ring-buffer to count the
|
|
|
|
* entries inserted during the selftest although some concurrent
|
|
|
|
* insertions into the ring-buffer such as ftrace_printk could occur
|
|
|
|
* at the same time, giving false positive or negative results.
|
|
|
|
*/
|
2008-12-06 10:41:33 +08:00
|
|
|
static bool __read_mostly tracing_selftest_running;
|
2008-12-05 06:47:35 +08:00
|
|
|
|
2009-02-03 10:38:32 +08:00
|
|
|
/*
|
|
|
|
* If a tracer is running, we do not want to run SELFTEST.
|
|
|
|
*/
|
|
|
|
static bool __read_mostly tracing_selftest_disabled;
|
|
|
|
|
2008-11-18 02:23:42 +08:00
|
|
|
/* For tracers that don't implement custom flags */
|
|
|
|
static struct tracer_opt dummy_tracer_opt[] = {
|
|
|
|
{ }
|
|
|
|
};
|
|
|
|
|
|
|
|
static struct tracer_flags dummy_tracer_flags = {
|
|
|
|
.val = 0,
|
|
|
|
.opts = dummy_tracer_opt
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * Fallback set_flag callback for tracers that do not provide their own:
 * it ignores all of its arguments and always reports success (0).
 */
static int dummy_set_flag(u32 old_flags, u32 bit, int set)
{
	const int success = 0;

	return success;
}
|
2008-11-06 05:05:44 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Kill all tracing for good (never come back).
|
|
|
|
* It is initialized to 1 but will turn to zero if the initialization
|
|
|
|
* of the tracer is successful. But that is the only place that sets
|
|
|
|
* this back to zero.
|
|
|
|
*/
|
2009-02-11 02:44:12 +08:00
|
|
|
static int tracing_disabled = 1;
|
2008-11-06 05:05:44 +08:00
|
|
|
|
2008-10-01 12:29:53 +08:00
|
|
|
static DEFINE_PER_CPU(local_t, ftrace_cpu_disabled);
|
|
|
|
|
|
|
|
static inline void ftrace_disable_cpu(void)
|
|
|
|
{
|
|
|
|
preempt_disable();
|
|
|
|
local_inc(&__get_cpu_var(ftrace_cpu_disabled));
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void ftrace_enable_cpu(void)
|
|
|
|
{
|
|
|
|
local_dec(&__get_cpu_var(ftrace_cpu_disabled));
|
|
|
|
preempt_enable();
|
|
|
|
}
|
|
|
|
|
2009-01-01 07:42:22 +08:00
|
|
|
static cpumask_var_t __read_mostly tracing_buffer_mask;
|
2008-05-13 03:21:00 +08:00
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer. It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are currently mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
/* Define which cpu buffers are currently read in trace_pipe */
|
|
|
|
static cpumask_var_t tracing_reader_cpumask;
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
#define for_each_tracing_cpu(cpu) \
|
2009-01-01 07:42:22 +08:00
|
|
|
for_each_cpu(cpu, tracing_buffer_mask)
|
2008-05-13 03:21:00 +08:00
|
|
|
|
2008-10-24 07:26:08 +08:00
|
|
|
/*
|
|
|
|
* ftrace_dump_on_oops - variable to dump ftrace buffer on oops
|
|
|
|
*
|
|
|
|
* If there is an oops (or kernel panic) and the ftrace_dump_on_oops
|
|
|
|
* is set, then ftrace_dump is called. This will output the contents
|
|
|
|
* of the ftrace buffers to the console. This is very useful for
|
|
|
|
* capturing traces that lead to crashes and outputting it to a
|
|
|
|
* serial console.
|
|
|
|
*
|
|
|
|
* It is default off, but you can enable it with either specifying
|
|
|
|
* "ftrace_dump_on_oops" in the kernel command line, or setting
|
|
|
|
* /proc/sys/kernel/ftrace_dump_on_oops to true.
|
|
|
|
*/
|
|
|
|
int ftrace_dump_on_oops;
|
|
|
|
|
2009-02-03 10:38:32 +08:00
|
|
|
static int tracing_set_tracer(const char *buf);
|
|
|
|
|
|
|
|
#define BOOTUP_TRACER_SIZE 100
|
|
|
|
static char bootup_tracer_buf[BOOTUP_TRACER_SIZE] __initdata;
|
|
|
|
static char *default_bootup_tracer;
|
2008-11-02 02:57:37 +08:00
|
|
|
|
|
|
|
/*
 * Handler for the "ftrace=" kernel command line option.
 *
 * Saves the requested tracer name in bootup_tracer_buf and points
 * default_bootup_tracer at it.
 *
 * @str: the text following "ftrace=" on the command line
 *
 * Returns 1 unconditionally.
 */
static int __init set_ftrace(char *str)
{
	/*
	 * strncpy() does not NUL-terminate the destination when the source
	 * is at least as long as the limit.  Copy at most SIZE - 1 bytes and
	 * terminate explicitly so an over-long argument is truncated rather
	 * than leaving an unterminated string behind.
	 */
	strncpy(bootup_tracer_buf, str, BOOTUP_TRACER_SIZE - 1);
	bootup_tracer_buf[BOOTUP_TRACER_SIZE - 1] = '\0';

	default_bootup_tracer = bootup_tracer_buf;
	return 1;
}
|
2009-02-03 10:38:32 +08:00
|
|
|
__setup("ftrace=", set_ftrace);
|
2008-11-02 02:57:37 +08:00
|
|
|
|
2008-10-24 07:26:08 +08:00
|
|
|
/*
 * Handler for the "ftrace_dump_on_oops" kernel command line option.
 * The option's argument text is not examined; its mere presence
 * switches ftrace_dump_on_oops on.  Returns 1 unconditionally.
 */
static int __init set_ftrace_dump_on_oops(char *str)
{
	const int enabled = 1;

	ftrace_dump_on_oops = enabled;

	return 1;
}
|
|
|
|
__setup("ftrace_dump_on_oops", set_ftrace_dump_on_oops);
|
2008-05-13 03:20:44 +08:00
|
|
|
|
2008-05-24 03:37:28 +08:00
|
|
|
long
|
2008-05-13 03:20:42 +08:00
|
|
|
ns2usecs(cycle_t nsec)
|
|
|
|
{
|
|
|
|
nsec += 500;
|
|
|
|
do_div(nsec, 1000);
|
|
|
|
return nsec;
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
cycle_t ftrace_now(int cpu)
|
2008-05-13 03:20:46 +08:00
|
|
|
{
|
2008-09-30 11:02:41 +08:00
|
|
|
u64 ts = ring_buffer_time_stamp(cpu);
|
|
|
|
ring_buffer_normalize_time_stamp(cpu, &ts);
|
|
|
|
return ts;
|
2008-05-13 03:20:46 +08:00
|
|
|
}
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
/*
|
|
|
|
* The global_trace is the descriptor that holds the tracing
|
|
|
|
* buffers for the live tracing. For each CPU, it contains
|
|
|
|
* a link list of pages that will store trace entries. The
|
|
|
|
* page descriptor of the pages in the memory is used to hold
|
|
|
|
* the link list by linking the lru item in the page descriptor
|
|
|
|
* to each of the pages in the buffer per CPU.
|
|
|
|
*
|
|
|
|
* For each active CPU there is a data field that holds the
|
|
|
|
* pages for the buffer for that CPU. Each CPU has the same number
|
|
|
|
* of pages allocated for its buffer.
|
|
|
|
*/
|
2008-05-13 03:20:42 +08:00
|
|
|
static struct trace_array global_trace;
|
|
|
|
|
|
|
|
static DEFINE_PER_CPU(struct trace_array_cpu, global_trace_cpu);
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
/*
|
|
|
|
* The max_tr is used to snapshot the global_trace when a maximum
|
|
|
|
* latency is reached. Some tracers will use this to store a maximum
|
|
|
|
* trace while it continues examining live traces.
|
|
|
|
*
|
|
|
|
* The buffers for the max_tr are set up the same as the global_trace.
|
|
|
|
* When a snapshot is taken, the link list of the max_tr is swapped
|
|
|
|
* with the link list of the global_trace and the buffers are reset for
|
|
|
|
* the global_trace so the tracing can continue.
|
|
|
|
*/
|
2008-05-13 03:20:42 +08:00
|
|
|
static struct trace_array max_tr;
|
|
|
|
|
|
|
|
static DEFINE_PER_CPU(struct trace_array_cpu, max_data);
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
/* tracer_enabled is used to toggle activation of a tracer */
|
2008-05-13 03:20:48 +08:00
|
|
|
static int tracer_enabled = 1;
|
2008-05-13 03:21:00 +08:00
|
|
|
|
ftrace: restructure tracing start/stop infrastructure
Impact: change where tracing is started up and stopped
Currently, when a new tracer is selected via echo'ing a tracer name into
the current_tracer file, the startup is only done if tracing_enabled is
set to one. If tracing_enabled is changed to zero (by echo'ing 0 into
the tracing_enabled file) a full shutdown is performed.
The full startup and shutdown of a tracer can be expensive and the
user can lose out traces when echo'ing in 0 to the tracing_enabled file,
because the process takes too long. There can also be places that
the user would like to start and stop the tracer several times and
doing the full startup and shutdown of a tracer might be too expensive.
This patch performs the full startup and shutdown when a tracer is
selected. It also adds a way to do a quick start or stop of a tracer.
The quick version is just a flag that prevents the tracing from
taking place, but the overhead of the code is still there.
For example, the startup of a tracer may enable tracepoints, or enable
the function tracer. The stop and start will just set a flag to
have the tracer ignore the calls when the tracepoint or function trace
is called. The overhead of the tracer may still be present when
the tracer is stopped, but no tracing will occur. Setting the tracer
to the 'nop' tracer (or any other tracer) will perform the shutdown
of the tracer which will disable the tracepoint or disable the
function tracer.
The tracing_enabled file will simply start or stop tracing.
This change is all internal. The end result for the user should be the same
as before. If tracing_enabled is not set, no trace will happen.
If tracing_enabled is set, then the trace will happen. The tracing_enabled
variable is static between tracers. Enabling tracing_enabled and
going to another tracer will keep tracing_enabled enabled. Same
is true with disabling tracing_enabled.
This patch will now provide a fast start/stop method to the users
for enabling or disabling tracing.
Note: There were two methods to the struct tracer that were never
used: The methods start and stop. These were to be used as a hook
to the reading of the trace output, but ended up not being
necessary. These two methods are now used to enable the start
and stop of each tracer, in case the tracer needs to do more than
just not write into the buffer. For example, the irqsoff tracer
must stop recording max latencies when tracing is stopped.
Signed-off-by: Steven Rostedt <srostedt@redhat.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-11-06 05:05:44 +08:00
|
|
|
/**
|
|
|
|
* tracing_is_enabled - return tracer_enabled status
|
|
|
|
*
|
|
|
|
* This function is used by other tracers to know the status
|
|
|
|
* of the tracer_enabled flag. Tracers may use this function
|
|
|
|
* to know if it should enable their features when starting
|
|
|
|
* up. See irqsoff tracer for an example (start_irqsoff_tracer).
|
|
|
|
*/
|
|
|
|
int tracing_is_enabled(void)
|
|
|
|
{
|
|
|
|
return tracer_enabled;
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
/*
|
2008-09-30 11:02:41 +08:00
|
|
|
* trace_buf_size is the size in bytes that is allocated
|
|
|
|
* for a buffer. Note, the number of bytes is always rounded
|
|
|
|
* to page size.
|
2008-07-31 10:36:46 +08:00
|
|
|
*
|
|
|
|
* This number is purposely set to a low number of 16384.
|
|
|
|
* If the dump on oops happens, it will be much appreciated
|
|
|
|
* to not have to wait for all that output. Anyway this can be
|
|
|
|
* boot time and run time configurable.
|
2008-05-13 03:21:00 +08:00
|
|
|
*/
|
2008-09-30 11:02:41 +08:00
|
|
|
#define TRACE_BUF_SIZE_DEFAULT 1441792UL /* 16384 * 88 (sizeof(entry)) */
|
2008-07-31 10:36:46 +08:00
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
static unsigned long trace_buf_size = TRACE_BUF_SIZE_DEFAULT;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
/* trace_types holds a link list of available tracers. */
|
2008-05-13 03:20:42 +08:00
|
|
|
static struct tracer *trace_types __read_mostly;
|
2008-05-13 03:21:00 +08:00
|
|
|
|
|
|
|
/* current_trace points to the tracer that is currently active */
|
2008-05-13 03:20:42 +08:00
|
|
|
static struct tracer *current_trace __read_mostly;
|
2008-05-13 03:21:00 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* max_tracer_type_len is used to simplify the allocating of
|
|
|
|
* buffers to read userspace tracer names. We keep track of
|
|
|
|
* the longest tracer name registered.
|
|
|
|
*/
|
2008-05-13 03:20:42 +08:00
|
|
|
static int max_tracer_type_len;
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
/*
|
|
|
|
* trace_types_lock is used to protect the trace_types list.
|
|
|
|
* This lock is also used to keep user access serialized.
|
|
|
|
* Accesses from userspace will grab this lock while userspace
|
|
|
|
* activities happen inside the kernel.
|
|
|
|
*/
|
2008-05-13 03:20:42 +08:00
|
|
|
static DEFINE_MUTEX(trace_types_lock);
|
2008-05-13 03:21:00 +08:00
|
|
|
|
|
|
|
/* trace_wait is a waitqueue for tasks blocked on trace_poll */
|
2008-05-13 03:20:52 +08:00
|
|
|
static DECLARE_WAIT_QUEUE_HEAD(trace_wait);
|
|
|
|
|
2008-11-13 06:52:37 +08:00
|
|
|
/* trace_flags holds trace_options default values */
|
2008-11-13 06:52:38 +08:00
|
|
|
unsigned long trace_flags = TRACE_ITER_PRINT_PARENT | TRACE_ITER_PRINTK |
|
2009-02-03 06:29:21 +08:00
|
|
|
TRACE_ITER_ANNOTATE | TRACE_ITER_CONTEXT_INFO;
|
2008-05-13 03:20:52 +08:00
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
/**
|
|
|
|
* trace_wake_up - wake up tasks waiting for trace input
|
|
|
|
*
|
|
|
|
* Simply wakes up any task that is blocked on the trace_wait
|
|
|
|
* queue. This is used with trace_poll for tasks polling the trace.
|
|
|
|
*/
|
2008-05-13 03:20:52 +08:00
|
|
|
void trace_wake_up(void)
|
|
|
|
{
|
2008-05-13 03:20:52 +08:00
|
|
|
/*
|
|
|
|
* The runqueue_is_locked() can fail, but this is the best we
|
|
|
|
* have for now:
|
|
|
|
*/
|
|
|
|
if (!(trace_flags & TRACE_ITER_BLOCK) && !runqueue_is_locked())
|
2008-05-13 03:20:52 +08:00
|
|
|
wake_up(&trace_wait);
|
|
|
|
}
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
/*
 * Handler for the "trace_buf_size=" kernel command line option.
 *
 * @str: the text following "trace_buf_size="
 *
 * Stores the parsed value in trace_buf_size and returns 1.  Returns 0,
 * leaving trace_buf_size untouched, when @str is NULL, cannot be parsed
 * by strict_strtoul(), or parses to zero.
 */
static int __init set_buf_size(char *str)
{
	unsigned long requested;

	if (!str)
		return 0;

	/* the buffer size can not be zero */
	if (strict_strtoul(str, 0, &requested) < 0 || requested == 0)
		return 0;

	trace_buf_size = requested;

	return 1;
}
|
2008-09-30 11:02:41 +08:00
|
|
|
__setup("trace_buf_size=", set_buf_size);
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-05-13 03:20:44 +08:00
|
|
|
/*
 * Convert nanoseconds to microseconds, truncating any remainder
 * (plain integer division by 1000, no rounding).
 */
unsigned long nsecs_to_usecs(unsigned long nsecs)
{
	const unsigned long nsecs_per_usec = 1000;

	return nsecs / nsecs_per_usec;
}
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
/* These must match the bit positions in trace_iterator_flags */
|
2008-05-13 03:20:42 +08:00
|
|
|
static const char *trace_options[] = {
|
|
|
|
"print-parent",
|
|
|
|
"sym-offset",
|
|
|
|
"sym-addr",
|
|
|
|
"verbose",
|
2008-05-13 03:20:47 +08:00
|
|
|
"raw",
|
2008-05-13 03:20:49 +08:00
|
|
|
"hex",
|
2008-05-13 03:20:47 +08:00
|
|
|
"bin",
|
2008-05-13 03:20:49 +08:00
|
|
|
"block",
|
2008-05-13 03:20:51 +08:00
|
|
|
"stacktrace",
|
2008-05-13 03:20:52 +08:00
|
|
|
"sched-tree",
|
2008-09-04 16:24:14 +08:00
|
|
|
"ftrace_printk",
|
ftrace: function tracer with irqs disabled
Impact: disable interrupts during trace entry creation (as opposed to preempt)
To help with performance, I set the ftracer to not disable interrupts,
and only to disable preemption. If an interrupt occurred, it would not
be traced, because the function tracer protects itself from recursion.
This may be faster, but the trace output might miss some traces.
This patch makes the function trace disable interrupts, but it also
adds a runtime feature to disable preemption instead. It does this by
having two different tracer functions. When the function tracer is
enabled, it will check to see which version is requested (irqs disabled
or preemption disabled). Then it will use the corresponding function
as the tracer.
Irq disabling is the default behaviour, but if the user wants better
performance, with the chance of missing traces, then they can choose
the preempt disabled version.
Running hackbench 3 times with the irqs disabled and 3 times with
the preempt disabled function tracer yielded:
tracing type times entries recorded
------------ -------- ----------------
irq disabled 43.393 166433066
43.282 166172618
43.298 166256704
preempt disabled 38.969 159871710
38.943 159972935
39.325 161056510
Average:
irqs disabled: 43.324 166287462
preempt disabled: 39.079 160300385
preempt is 10.8 percent faster than irqs disabled.
I wrote a patch to count function trace recursion and reran hackbench.
With irq disabled: 1,150 times the function tracer did not trace due to
recursion.
with preempt disabled: 5,117,718 times.
The thousand times with irq disabled could be due to NMIs, or simply a case
where it called a function that was not protected by notrace.
But we also see that a large amount of the trace is lost with the
preempt version.
Signed-off-by: Steven Rostedt <srostedt@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Andrew Morton <akpm@linux-foundation.org>
Cc: Steven Rostedt <srostedt@redhat.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-11-04 12:15:57 +08:00
|
|
|
"ftrace_preempt",
|
2008-11-13 04:24:24 +08:00
|
|
|
"branch",
|
2008-11-13 06:52:38 +08:00
|
|
|
"annotate",
|
2008-11-22 19:28:47 +08:00
|
|
|
"userstacktrace",
|
2008-11-22 19:28:48 +08:00
|
|
|
"sym-userobj",
|
2008-12-14 03:18:13 +08:00
|
|
|
"printk-msg-only",
|
2009-02-03 06:29:21 +08:00
|
|
|
"context-info",
|
2008-05-13 03:20:42 +08:00
|
|
|
NULL
|
|
|
|
};
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
/*
|
|
|
|
* ftrace_max_lock is used to protect the swapping of buffers
|
|
|
|
* when taking a max snapshot. The buffers themselves are
|
|
|
|
* protected by per_cpu spinlocks. But the action of the swap
|
|
|
|
* needs its own lock.
|
|
|
|
*
|
|
|
|
* This is defined as a raw_spinlock_t in order to help
|
|
|
|
* with performance when lockdep debugging is enabled.
|
|
|
|
*/
|
2008-05-13 03:20:55 +08:00
|
|
|
static raw_spinlock_t ftrace_max_lock =
|
|
|
|
(raw_spinlock_t)__RAW_SPIN_LOCK_UNLOCKED;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Copy the new maximum trace into the separate maximum-trace
|
|
|
|
* structure. (this way the maximum trace is permanently saved,
|
|
|
|
* for later retrieval via /debugfs/tracing/latency_trace)
|
|
|
|
*/
|
2008-05-13 03:20:51 +08:00
|
|
|
static void
|
2008-05-13 03:20:42 +08:00
|
|
|
__update_max_tr(struct trace_array *tr, struct task_struct *tsk, int cpu)
|
|
|
|
{
|
|
|
|
struct trace_array_cpu *data = tr->data[cpu];
|
|
|
|
|
|
|
|
max_tr.cpu = cpu;
|
|
|
|
max_tr.time_start = data->preempt_timestamp;
|
|
|
|
|
|
|
|
data = max_tr.data[cpu];
|
|
|
|
data->saved_latency = tracing_max_latency;
|
|
|
|
|
|
|
|
memcpy(data->comm, tsk->comm, TASK_COMM_LEN);
|
|
|
|
data->pid = tsk->pid;
|
2008-11-14 07:39:16 +08:00
|
|
|
data->uid = task_uid(tsk);
|
2008-05-13 03:20:42 +08:00
|
|
|
data->nice = tsk->static_prio - 20 - MAX_RT_PRIO;
|
|
|
|
data->policy = tsk->policy;
|
|
|
|
data->rt_priority = tsk->rt_priority;
|
|
|
|
|
|
|
|
/* record this tasks comm */
|
2009-02-17 14:07:28 +08:00
|
|
|
tracing_record_cmdline(tsk);
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-05-13 03:21:02 +08:00
|
|
|
/*
 * Copy the unread part of a trace_seq to a user space buffer.
 *
 * @s:    the sequence to read from; s->readpos is advanced on success
 * @ubuf: user space destination
 * @cnt:  maximum number of bytes to copy
 *
 * Returns the number of bytes copied, -EBUSY when there is nothing left
 * to read (s->len <= s->readpos), or -EFAULT when copy_to_user() reports
 * a failure.
 */
ssize_t trace_seq_to_user(struct trace_seq *s, char __user *ubuf, size_t cnt)
{
	int len;
	int ret;

	if (s->len <= s->readpos)
		return -EBUSY;

	/* never hand out more than what is still unread */
	len = s->len - s->readpos;
	if (cnt > len)
		cnt = len;

	ret = copy_to_user(ubuf, s->buffer + s->readpos, cnt);
	if (ret)
		return -EFAULT;

	/*
	 * Advance by what was actually copied, not by everything that was
	 * available; otherwise a short read would silently drop the rest
	 * of the buffer.
	 */
	s->readpos += cnt;
	return cnt;
}
|
|
|
|
|
2009-02-09 14:15:56 +08:00
|
|
|
ssize_t trace_seq_to_buffer(struct trace_seq *s, void *buf, size_t cnt)
|
|
|
|
{
|
|
|
|
int len;
|
|
|
|
void *ret;
|
|
|
|
|
|
|
|
if (s->len <= s->readpos)
|
|
|
|
return -EBUSY;
|
|
|
|
|
|
|
|
len = s->len - s->readpos;
|
|
|
|
if (cnt > len)
|
|
|
|
cnt = len;
|
|
|
|
ret = memcpy(buf, s->buffer + s->readpos, cnt);
|
|
|
|
if (!ret)
|
|
|
|
return -EFAULT;
|
|
|
|
|
|
|
|
s->readpos += len;
|
|
|
|
return cnt;
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
static void
|
2008-05-13 03:20:46 +08:00
|
|
|
trace_print_seq(struct seq_file *m, struct trace_seq *s)
|
|
|
|
{
|
|
|
|
int len = s->len >= PAGE_SIZE ? PAGE_SIZE - 1 : s->len;
|
|
|
|
|
|
|
|
s->buffer[len] = 0;
|
|
|
|
seq_puts(m, s->buffer);
|
|
|
|
|
2009-03-03 03:04:40 +08:00
|
|
|
trace_seq_init(s);
|
2008-05-13 03:20:46 +08:00
|
|
|
}
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
/**
|
|
|
|
* update_max_tr - snapshot all trace buffers from global_trace to max_tr
|
|
|
|
* @tr: tracer
|
|
|
|
* @tsk: the task with the latency
|
|
|
|
* @cpu: The cpu that initiated the trace.
|
|
|
|
*
|
|
|
|
* Flip the buffers between the @tr and the max_tr and record information
|
|
|
|
* about which task was the cause of this latency.
|
|
|
|
*/
|
2008-05-13 03:20:51 +08:00
|
|
|
void
|
2008-05-13 03:20:42 +08:00
|
|
|
update_max_tr(struct trace_array *tr, struct task_struct *tsk, int cpu)
|
|
|
|
{
|
2008-09-30 11:02:41 +08:00
|
|
|
struct ring_buffer *buf = tr->buffer;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-05-13 03:20:43 +08:00
|
|
|
WARN_ON_ONCE(!irqs_disabled());
|
2008-05-13 03:20:55 +08:00
|
|
|
__raw_spin_lock(&ftrace_max_lock);
|
2008-09-30 11:02:41 +08:00
|
|
|
|
|
|
|
tr->buffer = max_tr.buffer;
|
|
|
|
max_tr.buffer = buf;
|
|
|
|
|
2008-10-01 12:29:53 +08:00
|
|
|
ftrace_disable_cpu();
|
2008-09-30 11:02:41 +08:00
|
|
|
ring_buffer_reset(tr->buffer);
|
2008-10-01 12:29:53 +08:00
|
|
|
ftrace_enable_cpu();
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
__update_max_tr(tr, tsk, cpu);
|
2008-05-13 03:20:55 +08:00
|
|
|
__raw_spin_unlock(&ftrace_max_lock);
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* update_max_tr_single - only copy one trace over, and reset the rest
|
|
|
|
* @tr - tracer
|
|
|
|
* @tsk - task with the latency
|
|
|
|
* @cpu - the cpu of the buffer to copy.
|
2008-05-13 03:21:00 +08:00
|
|
|
*
|
|
|
|
* Flip the trace of a single CPU buffer between the @tr and the max_tr.
|
2008-05-13 03:20:42 +08:00
|
|
|
*/
|
2008-05-13 03:20:51 +08:00
|
|
|
void
|
2008-05-13 03:20:42 +08:00
|
|
|
update_max_tr_single(struct trace_array *tr, struct task_struct *tsk, int cpu)
|
|
|
|
{
|
2008-09-30 11:02:41 +08:00
|
|
|
int ret;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-05-13 03:20:43 +08:00
|
|
|
WARN_ON_ONCE(!irqs_disabled());
|
2008-05-13 03:20:55 +08:00
|
|
|
__raw_spin_lock(&ftrace_max_lock);
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-10-01 12:29:53 +08:00
|
|
|
ftrace_disable_cpu();
|
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
ring_buffer_reset(max_tr.buffer);
|
|
|
|
ret = ring_buffer_swap_cpu(max_tr.buffer, tr->buffer, cpu);
|
|
|
|
|
2008-10-01 12:29:53 +08:00
|
|
|
ftrace_enable_cpu();
|
|
|
|
|
2009-01-22 04:24:56 +08:00
|
|
|
WARN_ON_ONCE(ret && ret != -EAGAIN);
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
__update_max_tr(tr, tsk, cpu);
|
2008-05-13 03:20:55 +08:00
|
|
|
__raw_spin_unlock(&ftrace_max_lock);
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
/**
|
|
|
|
* register_tracer - register a tracer with the ftrace system.
|
|
|
|
* @type - the plugin for the tracer
|
|
|
|
*
|
|
|
|
* Register a new plugin tracer.
|
|
|
|
*/
|
2008-05-13 03:20:42 +08:00
|
|
|
int register_tracer(struct tracer *type)
|
2009-02-11 02:44:45 +08:00
|
|
|
__releases(kernel_lock)
|
|
|
|
__acquires(kernel_lock)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
|
|
|
struct tracer *t;
|
|
|
|
int len;
|
|
|
|
int ret = 0;
|
|
|
|
|
|
|
|
if (!type->name) {
|
|
|
|
pr_info("Tracer must have a name\n");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
2008-11-19 17:00:15 +08:00
|
|
|
/*
|
|
|
|
* When this gets called we hold the BKL which means that
|
|
|
|
* preemption is disabled. Various trace selftests however
|
|
|
|
* need to disable and enable preemption for successful tests.
|
|
|
|
* So we drop the BKL here and grab it after the tests again.
|
|
|
|
*/
|
|
|
|
unlock_kernel();
|
2008-05-13 03:20:42 +08:00
|
|
|
mutex_lock(&trace_types_lock);
|
2008-11-19 17:00:15 +08:00
|
|
|
|
2008-12-06 10:41:33 +08:00
|
|
|
tracing_selftest_running = true;
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
for (t = trace_types; t; t = t->next) {
|
|
|
|
if (strcmp(type->name, t->name) == 0) {
|
|
|
|
/* already found */
|
|
|
|
pr_info("Trace %s already registered\n",
|
|
|
|
type->name);
|
|
|
|
ret = -1;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2008-11-18 02:23:42 +08:00
|
|
|
if (!type->set_flag)
|
|
|
|
type->set_flag = &dummy_set_flag;
|
|
|
|
if (!type->flags)
|
|
|
|
type->flags = &dummy_tracer_flags;
|
|
|
|
else
|
|
|
|
if (!type->flags->opts)
|
|
|
|
type->flags->opts = dummy_tracer_opt;
|
2009-02-11 09:25:00 +08:00
|
|
|
if (!type->wait_pipe)
|
|
|
|
type->wait_pipe = default_wait_pipe;
|
|
|
|
|
2008-11-18 02:23:42 +08:00
|
|
|
|
2008-05-13 03:20:44 +08:00
|
|
|
#ifdef CONFIG_FTRACE_STARTUP_TEST
|
2009-02-03 10:38:32 +08:00
|
|
|
if (type->selftest && !tracing_selftest_disabled) {
|
2008-05-13 03:20:44 +08:00
|
|
|
struct tracer *saved_tracer = current_trace;
|
|
|
|
struct trace_array *tr = &global_trace;
|
|
|
|
int i;
|
2008-12-05 06:47:35 +08:00
|
|
|
|
2008-05-13 03:20:44 +08:00
|
|
|
/*
|
|
|
|
* Run a selftest on this tracer.
|
|
|
|
* Here we reset the trace buffer, and set the current
|
|
|
|
* tracer to be this tracer. The tracer can then run some
|
|
|
|
* internal tracing to verify that everything is in order.
|
|
|
|
* If we fail, we do not register this tracer.
|
|
|
|
*/
|
2008-11-19 17:00:15 +08:00
|
|
|
for_each_tracing_cpu(i)
|
2008-09-30 11:02:41 +08:00
|
|
|
tracing_reset(tr, i);
|
2008-11-19 17:00:15 +08:00
|
|
|
|
2008-05-13 03:20:44 +08:00
|
|
|
current_trace = type;
|
|
|
|
/* the test is responsible for initializing and enabling */
|
|
|
|
pr_info("Testing tracer %s: ", type->name);
|
|
|
|
ret = type->selftest(type, tr);
|
|
|
|
/* the test is responsible for resetting too */
|
|
|
|
current_trace = saved_tracer;
|
|
|
|
if (ret) {
|
|
|
|
printk(KERN_CONT "FAILED!\n");
|
|
|
|
goto out;
|
|
|
|
}
|
2008-05-13 03:20:45 +08:00
|
|
|
/* Only reset on passing, to avoid touching corrupted buffers */
|
2008-11-19 17:00:15 +08:00
|
|
|
for_each_tracing_cpu(i)
|
2008-09-30 11:02:41 +08:00
|
|
|
tracing_reset(tr, i);
|
2008-11-19 17:00:15 +08:00
|
|
|
|
2008-05-13 03:20:44 +08:00
|
|
|
printk(KERN_CONT "PASSED\n");
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
type->next = trace_types;
|
|
|
|
trace_types = type;
|
|
|
|
len = strlen(type->name);
|
|
|
|
if (len > max_tracer_type_len)
|
|
|
|
max_tracer_type_len = len;
|
2008-05-13 03:20:44 +08:00
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
out:
|
2008-12-06 10:41:33 +08:00
|
|
|
tracing_selftest_running = false;
|
2008-05-13 03:20:42 +08:00
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
|
2009-02-05 14:13:38 +08:00
|
|
|
if (ret || !default_bootup_tracer)
|
|
|
|
goto out_unlock;
|
|
|
|
|
|
|
|
if (strncmp(default_bootup_tracer, type->name, BOOTUP_TRACER_SIZE))
|
|
|
|
goto out_unlock;
|
|
|
|
|
|
|
|
printk(KERN_INFO "Starting tracer '%s'\n", type->name);
|
|
|
|
/* Do we want this tracer to start on bootup? */
|
|
|
|
tracing_set_tracer(type->name);
|
|
|
|
default_bootup_tracer = NULL;
|
|
|
|
/* disable other selftests, since this will break it. */
|
|
|
|
tracing_selftest_disabled = 1;
|
2009-02-03 10:38:32 +08:00
|
|
|
#ifdef CONFIG_FTRACE_STARTUP_TEST
|
2009-02-05 14:13:38 +08:00
|
|
|
printk(KERN_INFO "Disabling FTRACE selftests due to running tracer '%s'\n",
|
|
|
|
type->name);
|
2009-02-03 10:38:32 +08:00
|
|
|
#endif
|
|
|
|
|
2009-02-05 14:13:38 +08:00
|
|
|
out_unlock:
|
2009-02-03 10:38:32 +08:00
|
|
|
lock_kernel();
|
2008-05-13 03:20:42 +08:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
void unregister_tracer(struct tracer *type)
|
|
|
|
{
|
|
|
|
struct tracer **t;
|
|
|
|
int len;
|
|
|
|
|
|
|
|
mutex_lock(&trace_types_lock);
|
|
|
|
for (t = &trace_types; *t; t = &(*t)->next) {
|
|
|
|
if (*t == type)
|
|
|
|
goto found;
|
|
|
|
}
|
|
|
|
pr_info("Trace %s not registered\n", type->name);
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
found:
|
|
|
|
*t = (*t)->next;
|
2009-02-08 04:52:59 +08:00
|
|
|
|
|
|
|
if (type == current_trace && tracer_enabled) {
|
|
|
|
tracer_enabled = 0;
|
|
|
|
tracing_stop();
|
|
|
|
if (current_trace->stop)
|
|
|
|
current_trace->stop(&global_trace);
|
|
|
|
current_trace = &nop_trace;
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
if (strlen(type->name) != max_tracer_type_len)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
max_tracer_type_len = 0;
|
|
|
|
for (t = &trace_types; *t; t = &(*t)->next) {
|
|
|
|
len = strlen((*t)->name);
|
|
|
|
if (len > max_tracer_type_len)
|
|
|
|
max_tracer_type_len = len;
|
|
|
|
}
|
|
|
|
out:
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
}
|
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
void tracing_reset(struct trace_array *tr, int cpu)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
2008-10-01 12:29:53 +08:00
|
|
|
ftrace_disable_cpu();
|
2008-09-30 11:02:41 +08:00
|
|
|
ring_buffer_reset_cpu(tr->buffer, cpu);
|
2008-10-01 12:29:53 +08:00
|
|
|
ftrace_enable_cpu();
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-12-19 18:08:39 +08:00
|
|
|
void tracing_reset_online_cpus(struct trace_array *tr)
|
|
|
|
{
|
|
|
|
int cpu;
|
|
|
|
|
|
|
|
tr->time_start = ftrace_now(tr->cpu);
|
|
|
|
|
|
|
|
for_each_online_cpu(cpu)
|
|
|
|
tracing_reset(tr, cpu);
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
/* Number of task command names kept in the saved_cmdlines cache. */
#define SAVED_CMDLINES 128
|
|
|
|
/* pid -> slot in saved_cmdlines; a value >= SAVED_CMDLINES means "no slot". */
static unsigned map_pid_to_cmdline[PID_MAX_DEFAULT+1];
|
|
|
|
/* slot -> pid using that slot; a value > PID_MAX_DEFAULT means "unused". */
static unsigned map_cmdline_to_pid[SAVED_CMDLINES];
|
|
|
|
/* The cached comm strings, one per slot. */
static char saved_cmdlines[SAVED_CMDLINES][TASK_COMM_LEN];
|
|
|
|
/* Last slot handed out; the next one is (cmdline_idx + 1) % SAVED_CMDLINES. */
static int cmdline_idx;
|
2009-03-04 19:32:55 +08:00
|
|
|
/* Taken with trylock by trace_save_cmdline() while it updates the cache. */
static raw_spinlock_t trace_cmdline_lock = __RAW_SPIN_LOCK_UNLOCKED;
|
2008-05-13 03:21:00 +08:00
|
|
|
|
|
|
|
|
/*
 * Temporarily disable recording: while this is non-zero,
 * tracing_record_cmdline() returns without saving anything.
 */
|
2009-02-11 02:44:12 +08:00
|
|
|
static atomic_t trace_record_cmdline_disabled __read_mostly;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
static void trace_init_cmdlines(void)
|
|
|
|
{
|
|
|
|
memset(&map_pid_to_cmdline, -1, sizeof(map_pid_to_cmdline));
|
|
|
|
memset(&map_cmdline_to_pid, -1, sizeof(map_cmdline_to_pid));
|
|
|
|
cmdline_idx = 0;
|
|
|
|
}
|
|
|
|
|
2008-11-06 05:05:44 +08:00
|
|
|
/* Number of tracing_stop() calls not yet balanced by tracing_start(). */
static int trace_stop_count;
|
|
|
|
/* Held by tracing_start()/tracing_stop() while they update trace_stop_count. */
static DEFINE_SPINLOCK(tracing_start_lock);
|
|
|
|
|
2008-11-22 01:59:38 +08:00
|
|
|
/**
|
|
|
|
* ftrace_off_permanent - disable all ftrace code permanently
|
|
|
|
*
|
|
|
|
* This should only be called when a serious anomally has
|
|
|
|
* been detected. This will turn off the function tracing,
|
|
|
|
* ring buffers, and other tracing utilites. It takes no
|
|
|
|
* locks and can be called from any context.
|
|
|
|
*/
|
|
|
|
void ftrace_off_permanent(void)
|
|
|
|
{
|
|
|
|
tracing_disabled = 1;
|
|
|
|
ftrace_stop();
|
|
|
|
tracing_off_permanent();
|
|
|
|
}
|
|
|
|
|
2008-11-06 05:05:44 +08:00
|
|
|
/**
|
|
|
|
* tracing_start - quick start of the tracer
|
|
|
|
*
|
|
|
|
* If tracing is enabled but was stopped by tracing_stop,
|
|
|
|
* this will start the tracer back up.
|
|
|
|
*/
|
|
|
|
void tracing_start(void)
|
|
|
|
{
|
|
|
|
struct ring_buffer *buffer;
|
|
|
|
unsigned long flags;
|
|
|
|
|
|
|
|
if (tracing_disabled)
|
|
|
|
return;
|
|
|
|
|
|
|
|
spin_lock_irqsave(&tracing_start_lock, flags);
|
2009-01-23 03:26:15 +08:00
|
|
|
if (--trace_stop_count) {
|
|
|
|
if (trace_stop_count < 0) {
|
|
|
|
/* Someone screwed up their debugging */
|
|
|
|
WARN_ON_ONCE(1);
|
|
|
|
trace_stop_count = 0;
|
|
|
|
}
|
2008-11-06 05:05:44 +08:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
buffer = global_trace.buffer;
|
|
|
|
if (buffer)
|
|
|
|
ring_buffer_record_enable(buffer);
|
|
|
|
|
|
|
|
buffer = max_tr.buffer;
|
|
|
|
if (buffer)
|
|
|
|
ring_buffer_record_enable(buffer);
|
|
|
|
|
|
|
|
ftrace_start();
|
|
|
|
out:
|
|
|
|
spin_unlock_irqrestore(&tracing_start_lock, flags);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* tracing_stop - quick stop of the tracer
|
|
|
|
*
|
|
|
|
* Light weight way to stop tracing. Use in conjunction with
|
|
|
|
* tracing_start.
|
|
|
|
*/
|
|
|
|
void tracing_stop(void)
|
|
|
|
{
|
|
|
|
struct ring_buffer *buffer;
|
|
|
|
unsigned long flags;
|
|
|
|
|
|
|
|
ftrace_stop();
|
|
|
|
spin_lock_irqsave(&tracing_start_lock, flags);
|
|
|
|
if (trace_stop_count++)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
buffer = global_trace.buffer;
|
|
|
|
if (buffer)
|
|
|
|
ring_buffer_record_disable(buffer);
|
|
|
|
|
|
|
|
buffer = max_tr.buffer;
|
|
|
|
if (buffer)
|
|
|
|
ring_buffer_record_disable(buffer);
|
|
|
|
|
|
|
|
out:
|
|
|
|
spin_unlock_irqrestore(&tracing_start_lock, flags);
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
void trace_stop_cmdline_recording(void);
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
static void trace_save_cmdline(struct task_struct *tsk)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
|
|
|
unsigned map;
|
|
|
|
unsigned idx;
|
|
|
|
|
|
|
|
if (!tsk->pid || unlikely(tsk->pid > PID_MAX_DEFAULT))
|
|
|
|
return;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* It's not the end of the world if we don't get
|
|
|
|
* the lock, but we also don't want to spin
|
|
|
|
* nor do we want to disable interrupts,
|
|
|
|
* so if we miss here, then better luck next time.
|
|
|
|
*/
|
2009-03-04 19:32:55 +08:00
|
|
|
if (!__raw_spin_trylock(&trace_cmdline_lock))
|
2008-05-13 03:20:42 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
idx = map_pid_to_cmdline[tsk->pid];
|
|
|
|
if (idx >= SAVED_CMDLINES) {
|
|
|
|
idx = (cmdline_idx + 1) % SAVED_CMDLINES;
|
|
|
|
|
|
|
|
map = map_cmdline_to_pid[idx];
|
|
|
|
if (map <= PID_MAX_DEFAULT)
|
|
|
|
map_pid_to_cmdline[map] = (unsigned)-1;
|
|
|
|
|
|
|
|
map_pid_to_cmdline[tsk->pid] = idx;
|
|
|
|
|
|
|
|
cmdline_idx = idx;
|
|
|
|
}
|
|
|
|
|
|
|
|
memcpy(&saved_cmdlines[idx], tsk->comm, TASK_COMM_LEN);
|
|
|
|
|
2009-03-04 19:32:55 +08:00
|
|
|
__raw_spin_unlock(&trace_cmdline_lock);
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-11-26 13:16:26 +08:00
|
|
|
char *trace_find_cmdline(int pid)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
|
|
|
char *cmdline = "<...>";
|
|
|
|
unsigned map;
|
|
|
|
|
|
|
|
if (!pid)
|
|
|
|
return "<idle>";
|
|
|
|
|
|
|
|
if (pid > PID_MAX_DEFAULT)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
map = map_pid_to_cmdline[pid];
|
|
|
|
if (map >= SAVED_CMDLINES)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
cmdline = saved_cmdlines[map];
|
|
|
|
|
|
|
|
out:
|
|
|
|
return cmdline;
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
void tracing_record_cmdline(struct task_struct *tsk)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
|
|
|
if (atomic_read(&trace_record_cmdline_disabled))
|
|
|
|
return;
|
|
|
|
|
|
|
|
trace_save_cmdline(tsk);
|
|
|
|
}
|
|
|
|
|
2008-09-17 02:56:41 +08:00
|
|
|
void
|
2008-10-02 01:14:09 +08:00
|
|
|
tracing_generic_entry_update(struct trace_entry *entry, unsigned long flags,
|
|
|
|
int pc)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
|
|
|
struct task_struct *tsk = current;
|
|
|
|
|
2008-09-30 11:02:42 +08:00
|
|
|
entry->preempt_count = pc & 0xff;
|
|
|
|
entry->pid = (tsk) ? tsk->pid : 0;
|
2008-11-22 19:28:48 +08:00
|
|
|
entry->tgid = (tsk) ? tsk->tgid : 0;
|
2008-09-30 11:02:42 +08:00
|
|
|
entry->flags =
|
2008-10-24 21:42:59 +08:00
|
|
|
#ifdef CONFIG_TRACE_IRQFLAGS_SUPPORT
|
2008-08-02 00:26:40 +08:00
|
|
|
(irqs_disabled_flags(flags) ? TRACE_FLAG_IRQS_OFF : 0) |
|
2008-10-24 21:42:59 +08:00
|
|
|
#else
|
|
|
|
TRACE_FLAG_IRQS_NOSUPPORT |
|
|
|
|
#endif
|
2008-05-13 03:20:42 +08:00
|
|
|
((pc & HARDIRQ_MASK) ? TRACE_FLAG_HARDIRQ : 0) |
|
|
|
|
((pc & SOFTIRQ_MASK) ? TRACE_FLAG_SOFTIRQ : 0) |
|
|
|
|
(need_resched() ? TRACE_FLAG_NEED_RESCHED : 0);
|
|
|
|
}
|
|
|
|
|
tracing: Introduce trace_buffer_{lock_reserve,unlock_commit}
Impact: new API
These new functions do what previously was being open coded, reducing
the number of details ftrace plugin writers have to worry about.
It also standardizes the handling of stacktrace, userstacktrace and
other trace options we may introduce in the future.
With this patch, for instance, the blk tracer (and some others already
in the tree) can use the "userstacktrace" /d/tracing/trace_options
facility.
$ codiff /tmp/vmlinux.before /tmp/vmlinux.after
linux-2.6-tip/kernel/trace/trace.c:
trace_vprintk | -5
trace_graph_return | -22
trace_graph_entry | -26
trace_function | -45
__ftrace_trace_stack | -27
ftrace_trace_userstack | -29
tracing_sched_switch_trace | -66
tracing_stop | +1
trace_seq_to_user | -1
ftrace_trace_special | -63
ftrace_special | +1
tracing_sched_wakeup_trace | -70
tracing_reset_online_cpus | -1
13 functions changed, 2 bytes added, 355 bytes removed, diff: -353
linux-2.6-tip/block/blktrace.c:
__blk_add_trace | -58
1 function changed, 58 bytes removed, diff: -58
linux-2.6-tip/kernel/trace/trace.c:
trace_buffer_lock_reserve | +88
trace_buffer_unlock_commit | +86
2 functions changed, 174 bytes added, diff: +174
/tmp/vmlinux.after:
16 functions changed, 176 bytes added, 413 bytes removed, diff: -237
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Acked-by: Frédéric Weisbecker <fweisbec@gmail.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-06 02:14:13 +08:00
|
|
|
struct ring_buffer_event *trace_buffer_lock_reserve(struct trace_array *tr,
|
|
|
|
unsigned char type,
|
|
|
|
unsigned long len,
|
|
|
|
unsigned long flags, int pc)
|
|
|
|
{
|
|
|
|
struct ring_buffer_event *event;
|
|
|
|
|
|
|
|
event = ring_buffer_lock_reserve(tr->buffer, len);
|
|
|
|
if (event != NULL) {
|
|
|
|
struct trace_entry *ent = ring_buffer_event_data(event);
|
|
|
|
|
|
|
|
tracing_generic_entry_update(ent, flags, pc);
|
|
|
|
ent->type = type;
|
|
|
|
}
|
|
|
|
|
|
|
|
return event;
|
|
|
|
}
|
|
|
|
static void ftrace_trace_stack(struct trace_array *tr,
|
|
|
|
unsigned long flags, int skip, int pc);
|
|
|
|
static void ftrace_trace_userstack(struct trace_array *tr,
|
|
|
|
unsigned long flags, int pc);
|
|
|
|
|
|
|
|
void trace_buffer_unlock_commit(struct trace_array *tr,
|
|
|
|
struct ring_buffer_event *event,
|
|
|
|
unsigned long flags, int pc)
|
|
|
|
{
|
|
|
|
ring_buffer_unlock_commit(tr->buffer, event);
|
|
|
|
|
|
|
|
ftrace_trace_stack(tr, flags, 6, pc);
|
|
|
|
ftrace_trace_userstack(tr, flags, pc);
|
|
|
|
trace_wake_up();
|
|
|
|
}
|
|
|
|
|
2009-02-28 08:38:04 +08:00
|
|
|
struct ring_buffer_event *
|
|
|
|
trace_current_buffer_lock_reserve(unsigned char type, unsigned long len,
|
|
|
|
unsigned long flags, int pc)
|
|
|
|
{
|
|
|
|
return trace_buffer_lock_reserve(&global_trace,
|
|
|
|
type, len, flags, pc);
|
|
|
|
}
|
|
|
|
|
|
|
|
void trace_current_buffer_unlock_commit(struct ring_buffer_event *event,
|
|
|
|
unsigned long flags, int pc)
|
|
|
|
{
|
|
|
|
return trace_buffer_unlock_commit(&global_trace, event, flags, pc);
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
void
|
2009-02-05 14:13:37 +08:00
|
|
|
trace_function(struct trace_array *tr,
|
2008-10-02 01:14:09 +08:00
|
|
|
unsigned long ip, unsigned long parent_ip, unsigned long flags,
|
|
|
|
int pc)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
2008-09-30 11:02:41 +08:00
|
|
|
struct ring_buffer_event *event;
|
2008-09-30 11:02:42 +08:00
|
|
|
struct ftrace_entry *entry;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-10-01 12:29:53 +08:00
|
|
|
/* If we are reading the ring buffer, don't trace */
|
|
|
|
if (unlikely(local_read(&__get_cpu_var(ftrace_cpu_disabled))))
|
|
|
|
return;
|
|
|
|
|
tracing: Introduce trace_buffer_{lock_reserve,unlock_commit}
Impact: new API
These new functions do what previously was being open coded, reducing
the number of details ftrace plugin writers have to worry about.
It also standardizes the handling of stacktrace, userstacktrace and
other trace options we may introduce in the future.
With this patch, for instance, the blk tracer (and some others already
in the tree) can use the "userstacktrace" /d/tracing/trace_options
facility.
$ codiff /tmp/vmlinux.before /tmp/vmlinux.after
linux-2.6-tip/kernel/trace/trace.c:
trace_vprintk | -5
trace_graph_return | -22
trace_graph_entry | -26
trace_function | -45
__ftrace_trace_stack | -27
ftrace_trace_userstack | -29
tracing_sched_switch_trace | -66
tracing_stop | +1
trace_seq_to_user | -1
ftrace_trace_special | -63
ftrace_special | +1
tracing_sched_wakeup_trace | -70
tracing_reset_online_cpus | -1
13 functions changed, 2 bytes added, 355 bytes removed, diff: -353
linux-2.6-tip/block/blktrace.c:
__blk_add_trace | -58
1 function changed, 58 bytes removed, diff: -58
linux-2.6-tip/kernel/trace/trace.c:
trace_buffer_lock_reserve | +88
trace_buffer_unlock_commit | +86
2 functions changed, 174 bytes added, diff: +174
/tmp/vmlinux.after:
16 functions changed, 176 bytes added, 413 bytes removed, diff: -237
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Acked-by: Frédéric Weisbecker <fweisbec@gmail.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-06 02:14:13 +08:00
|
|
|
event = trace_buffer_lock_reserve(tr, TRACE_FN, sizeof(*entry),
|
|
|
|
flags, pc);
|
2008-09-30 11:02:41 +08:00
|
|
|
if (!event)
|
|
|
|
return;
|
|
|
|
entry = ring_buffer_event_data(event);
|
2008-09-30 11:02:42 +08:00
|
|
|
entry->ip = ip;
|
|
|
|
entry->parent_ip = parent_ip;
|
2009-02-06 02:12:56 +08:00
|
|
|
ring_buffer_unlock_commit(tr->buffer, event);
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-11-26 04:07:04 +08:00
|
|
|
#ifdef CONFIG_FUNCTION_GRAPH_TRACER
|
2008-11-26 07:57:25 +08:00
|
|
|
static void __trace_graph_entry(struct trace_array *tr,
|
|
|
|
struct ftrace_graph_ent *trace,
|
|
|
|
unsigned long flags,
|
|
|
|
int pc)
|
|
|
|
{
|
|
|
|
struct ring_buffer_event *event;
|
|
|
|
struct ftrace_graph_ent_entry *entry;
|
|
|
|
|
|
|
|
if (unlikely(local_read(&__get_cpu_var(ftrace_cpu_disabled))))
|
|
|
|
return;
|
|
|
|
|
tracing: Introduce trace_buffer_{lock_reserve,unlock_commit}
Impact: new API
These new functions do what previously was being open coded, reducing
the number of details ftrace plugin writers have to worry about.
It also standardizes the handling of stacktrace, userstacktrace and
other trace options we may introduce in the future.
With this patch, for instance, the blk tracer (and some others already
in the tree) can use the "userstacktrace" /d/tracing/trace_options
facility.
$ codiff /tmp/vmlinux.before /tmp/vmlinux.after
linux-2.6-tip/kernel/trace/trace.c:
trace_vprintk | -5
trace_graph_return | -22
trace_graph_entry | -26
trace_function | -45
__ftrace_trace_stack | -27
ftrace_trace_userstack | -29
tracing_sched_switch_trace | -66
tracing_stop | +1
trace_seq_to_user | -1
ftrace_trace_special | -63
ftrace_special | +1
tracing_sched_wakeup_trace | -70
tracing_reset_online_cpus | -1
13 functions changed, 2 bytes added, 355 bytes removed, diff: -353
linux-2.6-tip/block/blktrace.c:
__blk_add_trace | -58
1 function changed, 58 bytes removed, diff: -58
linux-2.6-tip/kernel/trace/trace.c:
trace_buffer_lock_reserve | +88
trace_buffer_unlock_commit | +86
2 functions changed, 174 bytes added, diff: +174
/tmp/vmlinux.after:
16 functions changed, 176 bytes added, 413 bytes removed, diff: -237
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Acked-by: Frédéric Weisbecker <fweisbec@gmail.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-06 02:14:13 +08:00
|
|
|
event = trace_buffer_lock_reserve(&global_trace, TRACE_GRAPH_ENT,
|
|
|
|
sizeof(*entry), flags, pc);
|
2008-11-26 07:57:25 +08:00
|
|
|
if (!event)
|
|
|
|
return;
|
|
|
|
entry = ring_buffer_event_data(event);
|
|
|
|
entry->graph_ent = *trace;
|
2009-02-06 02:12:56 +08:00
|
|
|
ring_buffer_unlock_commit(global_trace.buffer, event);
|
2008-11-26 07:57:25 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void __trace_graph_return(struct trace_array *tr,
|
2008-11-26 04:07:04 +08:00
|
|
|
struct ftrace_graph_ret *trace,
|
2008-11-11 14:14:25 +08:00
|
|
|
unsigned long flags,
|
|
|
|
int pc)
|
|
|
|
{
|
|
|
|
struct ring_buffer_event *event;
|
2008-11-26 07:57:25 +08:00
|
|
|
struct ftrace_graph_ret_entry *entry;
|
2008-11-11 14:14:25 +08:00
|
|
|
|
|
|
|
if (unlikely(local_read(&__get_cpu_var(ftrace_cpu_disabled))))
|
|
|
|
return;
|
|
|
|
|
tracing: Introduce trace_buffer_{lock_reserve,unlock_commit}
Impact: new API
These new functions do what previously was being open coded, reducing
the number of details ftrace plugin writers have to worry about.
It also standardizes the handling of stacktrace, userstacktrace and
other trace options we may introduce in the future.
With this patch, for instance, the blk tracer (and some others already
in the tree) can use the "userstacktrace" /d/tracing/trace_options
facility.
$ codiff /tmp/vmlinux.before /tmp/vmlinux.after
linux-2.6-tip/kernel/trace/trace.c:
trace_vprintk | -5
trace_graph_return | -22
trace_graph_entry | -26
trace_function | -45
__ftrace_trace_stack | -27
ftrace_trace_userstack | -29
tracing_sched_switch_trace | -66
tracing_stop | +1
trace_seq_to_user | -1
ftrace_trace_special | -63
ftrace_special | +1
tracing_sched_wakeup_trace | -70
tracing_reset_online_cpus | -1
13 functions changed, 2 bytes added, 355 bytes removed, diff: -353
linux-2.6-tip/block/blktrace.c:
__blk_add_trace | -58
1 function changed, 58 bytes removed, diff: -58
linux-2.6-tip/kernel/trace/trace.c:
trace_buffer_lock_reserve | +88
trace_buffer_unlock_commit | +86
2 functions changed, 174 bytes added, diff: +174
/tmp/vmlinux.after:
16 functions changed, 176 bytes added, 413 bytes removed, diff: -237
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Acked-by: Frédéric Weisbecker <fweisbec@gmail.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-06 02:14:13 +08:00
|
|
|
event = trace_buffer_lock_reserve(&global_trace, TRACE_GRAPH_RET,
|
|
|
|
sizeof(*entry), flags, pc);
|
2008-11-11 14:14:25 +08:00
|
|
|
if (!event)
|
|
|
|
return;
|
|
|
|
entry = ring_buffer_event_data(event);
|
2008-11-26 07:57:25 +08:00
|
|
|
entry->ret = *trace;
|
2009-02-06 02:12:56 +08:00
|
|
|
ring_buffer_unlock_commit(global_trace.buffer, event);
|
2008-11-11 14:14:25 +08:00
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
void
|
2008-05-13 03:20:49 +08:00
|
|
|
ftrace(struct trace_array *tr, struct trace_array_cpu *data,
|
2008-10-02 01:14:09 +08:00
|
|
|
unsigned long ip, unsigned long parent_ip, unsigned long flags,
|
|
|
|
int pc)
|
2008-05-13 03:20:49 +08:00
|
|
|
{
|
|
|
|
if (likely(!atomic_read(&data->disabled)))
|
2009-02-05 14:13:37 +08:00
|
|
|
trace_function(tr, ip, parent_ip, flags, pc);
|
2008-05-13 03:20:49 +08:00
|
|
|
}
|
|
|
|
|
2009-01-16 08:12:40 +08:00
|
|
|
/*
 * Record a kernel stack trace event in @tr.
 *
 * @skip is handed to save_stack_trace() through the skip field of the
 * stack_trace descriptor. The caller array of the entry is zeroed
 * before save_stack_trace() fills it with at most FTRACE_STACK_ENTRIES
 * entries. Compiles to an empty function without CONFIG_STACKTRACE.
 */
static void __ftrace_trace_stack(struct trace_array *tr,
				 unsigned long flags,
				 int skip, int pc)
{
#ifdef CONFIG_STACKTRACE
	struct ring_buffer_event *event;
	struct stack_entry *entry;
	struct stack_trace trace;

	event = trace_buffer_lock_reserve(tr, TRACE_STACK,
					  sizeof(*entry), flags, pc);
	if (!event)
		return;

	entry = ring_buffer_event_data(event);
	memset(&entry->caller, 0, sizeof(entry->caller));

	/* Let save_stack_trace() write straight into the event. */
	trace.entries		= entry->caller;
	trace.max_entries	= FTRACE_STACK_ENTRIES;
	trace.nr_entries	= 0;
	trace.skip		= skip;

	save_stack_trace(&trace);
	ring_buffer_unlock_commit(tr->buffer, event);
#endif
}
|
|
|
|
|
2009-01-16 08:12:40 +08:00
|
|
|
static void ftrace_trace_stack(struct trace_array *tr,
|
|
|
|
unsigned long flags,
|
|
|
|
int skip, int pc)
|
|
|
|
{
|
|
|
|
if (!(trace_flags & TRACE_ITER_STACKTRACE))
|
|
|
|
return;
|
|
|
|
|
2009-02-05 14:13:37 +08:00
|
|
|
__ftrace_trace_stack(tr, flags, skip, pc);
|
2009-01-16 08:12:40 +08:00
|
|
|
}
|
|
|
|
|
2008-10-02 01:14:09 +08:00
|
|
|
/*
 * __trace_stack - record a kernel stack trace unconditionally
 *
 * Non-static wrapper around __ftrace_trace_stack(); unlike
 * ftrace_trace_stack() it does not look at trace_flags.
 */
void __trace_stack(struct trace_array *tr,
		   unsigned long flags,
		   int skip, int pc)
{
	__ftrace_trace_stack(tr, flags, skip, pc);
}
|
|
|
|
|
2008-11-22 19:28:47 +08:00
|
|
|
/*
 * Record a user stack trace event in @tr when the
 * TRACE_ITER_USERSTACKTRACE bit is set in trace_flags.
 *
 * The caller array of the entry is zeroed before
 * save_stack_trace_user() fills it with at most FTRACE_STACK_ENTRIES
 * entries. Compiles to an empty function without CONFIG_STACKTRACE.
 */
static void ftrace_trace_userstack(struct trace_array *tr,
				   unsigned long flags, int pc)
{
#ifdef CONFIG_STACKTRACE
	struct ring_buffer_event *event;
	struct userstack_entry *entry;
	struct stack_trace trace;

	if (!(trace_flags & TRACE_ITER_USERSTACKTRACE))
		return;

	event = trace_buffer_lock_reserve(tr, TRACE_USER_STACK,
					  sizeof(*entry), flags, pc);
	if (!event)
		return;

	entry = ring_buffer_event_data(event);
	memset(&entry->caller, 0, sizeof(entry->caller));

	/* Let save_stack_trace_user() write straight into the event. */
	trace.entries		= entry->caller;
	trace.max_entries	= FTRACE_STACK_ENTRIES;
	trace.nr_entries	= 0;
	trace.skip		= 0;

	save_stack_trace_user(&trace);
	ring_buffer_unlock_commit(tr->buffer, event);
#endif
}
|
|
|
|
|
2009-02-11 02:44:12 +08:00
|
|
|
#ifdef UNUSED
|
|
|
|
/*
 * Request a user stack trace for @tr using the current preempt count.
 */
static void __trace_userstack(struct trace_array *tr, unsigned long flags)
{
	int pc = preempt_count();

	ftrace_trace_userstack(tr, flags, pc);
}
|
2009-02-11 02:44:12 +08:00
|
|
|
#endif /* UNUSED */
|
2008-11-22 19:28:47 +08:00
|
|
|
|
2008-10-02 01:14:09 +08:00
|
|
|
static void
|
2009-02-05 14:13:37 +08:00
|
|
|
ftrace_trace_special(void *__tr,
|
2008-10-02 01:14:09 +08:00
|
|
|
unsigned long arg1, unsigned long arg2, unsigned long arg3,
|
|
|
|
int pc)
|
2008-05-13 03:21:02 +08:00
|
|
|
{
|
2008-09-30 11:02:41 +08:00
|
|
|
struct ring_buffer_event *event;
|
2008-05-13 03:21:02 +08:00
|
|
|
struct trace_array *tr = __tr;
|
2008-09-30 11:02:42 +08:00
|
|
|
struct special_entry *entry;
|
2008-05-13 03:21:02 +08:00
|
|
|
|
tracing: Introduce trace_buffer_{lock_reserve,unlock_commit}
Impact: new API
These new functions do what previously was being open coded, reducing
the number of details ftrace plugin writers have to worry about.
It also standardizes the handling of stacktrace, userstacktrace and
other trace options we may introduce in the future.
With this patch, for instance, the blk tracer (and some others already
in the tree) can use the "userstacktrace" /d/tracing/trace_options
facility.
$ codiff /tmp/vmlinux.before /tmp/vmlinux.after
linux-2.6-tip/kernel/trace/trace.c:
trace_vprintk | -5
trace_graph_return | -22
trace_graph_entry | -26
trace_function | -45
__ftrace_trace_stack | -27
ftrace_trace_userstack | -29
tracing_sched_switch_trace | -66
tracing_stop | +1
trace_seq_to_user | -1
ftrace_trace_special | -63
ftrace_special | +1
tracing_sched_wakeup_trace | -70
tracing_reset_online_cpus | -1
13 functions changed, 2 bytes added, 355 bytes removed, diff: -353
linux-2.6-tip/block/blktrace.c:
__blk_add_trace | -58
1 function changed, 58 bytes removed, diff: -58
linux-2.6-tip/kernel/trace/trace.c:
trace_buffer_lock_reserve | +88
trace_buffer_unlock_commit | +86
2 functions changed, 174 bytes added, diff: +174
/tmp/vmlinux.after:
16 functions changed, 176 bytes added, 413 bytes removed, diff: -237
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Acked-by: Frédéric Weisbecker <fweisbec@gmail.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-06 02:14:13 +08:00
|
|
|
event = trace_buffer_lock_reserve(tr, TRACE_SPECIAL,
|
|
|
|
sizeof(*entry), 0, pc);
|
2008-09-30 11:02:41 +08:00
|
|
|
if (!event)
|
|
|
|
return;
|
|
|
|
entry = ring_buffer_event_data(event);
|
2008-09-30 11:02:42 +08:00
|
|
|
entry->arg1 = arg1;
|
|
|
|
entry->arg2 = arg2;
|
|
|
|
entry->arg3 = arg3;
|
tracing: Introduce trace_buffer_{lock_reserve,unlock_commit}
Impact: new API
These new functions do what previously was being open coded, reducing
the number of details ftrace plugin writers have to worry about.
It also standardizes the handling of stacktrace, userstacktrace and
other trace options we may introduce in the future.
With this patch, for instance, the blk tracer (and some others already
in the tree) can use the "userstacktrace" /d/tracing/trace_options
facility.
$ codiff /tmp/vmlinux.before /tmp/vmlinux.after
linux-2.6-tip/kernel/trace/trace.c:
trace_vprintk | -5
trace_graph_return | -22
trace_graph_entry | -26
trace_function | -45
__ftrace_trace_stack | -27
ftrace_trace_userstack | -29
tracing_sched_switch_trace | -66
tracing_stop | +1
trace_seq_to_user | -1
ftrace_trace_special | -63
ftrace_special | +1
tracing_sched_wakeup_trace | -70
tracing_reset_online_cpus | -1
13 functions changed, 2 bytes added, 355 bytes removed, diff: -353
linux-2.6-tip/block/blktrace.c:
__blk_add_trace | -58
1 function changed, 58 bytes removed, diff: -58
linux-2.6-tip/kernel/trace/trace.c:
trace_buffer_lock_reserve | +88
trace_buffer_unlock_commit | +86
2 functions changed, 174 bytes added, diff: +174
/tmp/vmlinux.after:
16 functions changed, 176 bytes added, 413 bytes removed, diff: -237
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Acked-by: Frédéric Weisbecker <fweisbec@gmail.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-06 02:14:13 +08:00
|
|
|
trace_buffer_unlock_commit(tr, event, 0, pc);
|
2008-05-13 03:21:02 +08:00
|
|
|
}
|
|
|
|
|
2008-10-02 01:14:09 +08:00
|
|
|
/*
 * __trace_special - record a special event with the current preempt count
 *
 * @__data is accepted but not used by this function.
 */
void
__trace_special(void *__tr, void *__data,
		unsigned long arg1, unsigned long arg2, unsigned long arg3)
{
	int pc = preempt_count();

	ftrace_trace_special(__tr, arg1, arg2, arg3, pc);
}
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
void
|
2008-05-13 03:20:42 +08:00
|
|
|
tracing_sched_switch_trace(struct trace_array *tr,
|
2008-05-13 03:20:51 +08:00
|
|
|
struct task_struct *prev,
|
|
|
|
struct task_struct *next,
|
2008-10-02 01:14:09 +08:00
|
|
|
unsigned long flags, int pc)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
2008-09-30 11:02:41 +08:00
|
|
|
struct ring_buffer_event *event;
|
2008-09-30 11:02:42 +08:00
|
|
|
struct ctx_switch_entry *entry;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
tracing: Introduce trace_buffer_{lock_reserve,unlock_commit}
Impact: new API
These new functions do what previously was being open coded, reducing
the number of details ftrace plugin writers have to worry about.
It also standardizes the handling of stacktrace, userstacktrace and
other trace options we may introduce in the future.
With this patch, for instance, the blk tracer (and some others already
in the tree) can use the "userstacktrace" /d/tracing/trace_options
facility.
$ codiff /tmp/vmlinux.before /tmp/vmlinux.after
linux-2.6-tip/kernel/trace/trace.c:
trace_vprintk | -5
trace_graph_return | -22
trace_graph_entry | -26
trace_function | -45
__ftrace_trace_stack | -27
ftrace_trace_userstack | -29
tracing_sched_switch_trace | -66
tracing_stop | +1
trace_seq_to_user | -1
ftrace_trace_special | -63
ftrace_special | +1
tracing_sched_wakeup_trace | -70
tracing_reset_online_cpus | -1
13 functions changed, 2 bytes added, 355 bytes removed, diff: -353
linux-2.6-tip/block/blktrace.c:
__blk_add_trace | -58
1 function changed, 58 bytes removed, diff: -58
linux-2.6-tip/kernel/trace/trace.c:
trace_buffer_lock_reserve | +88
trace_buffer_unlock_commit | +86
2 functions changed, 174 bytes added, diff: +174
/tmp/vmlinux.after:
16 functions changed, 176 bytes added, 413 bytes removed, diff: -237
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Acked-by: Frédéric Weisbecker <fweisbec@gmail.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-06 02:14:13 +08:00
|
|
|
event = trace_buffer_lock_reserve(tr, TRACE_CTX,
|
|
|
|
sizeof(*entry), flags, pc);
|
2008-09-30 11:02:41 +08:00
|
|
|
if (!event)
|
|
|
|
return;
|
|
|
|
entry = ring_buffer_event_data(event);
|
2008-09-30 11:02:42 +08:00
|
|
|
entry->prev_pid = prev->pid;
|
|
|
|
entry->prev_prio = prev->prio;
|
|
|
|
entry->prev_state = prev->state;
|
|
|
|
entry->next_pid = next->pid;
|
|
|
|
entry->next_prio = next->prio;
|
|
|
|
entry->next_state = next->state;
|
|
|
|
entry->next_cpu = task_cpu(next);
|
tracing: Introduce trace_buffer_{lock_reserve,unlock_commit}
Impact: new API
These new functions do what previously was being open coded, reducing
the number of details ftrace plugin writers have to worry about.
It also standardizes the handling of stacktrace, userstacktrace and
other trace options we may introduce in the future.
With this patch, for instance, the blk tracer (and some others already
in the tree) can use the "userstacktrace" /d/tracing/trace_options
facility.
$ codiff /tmp/vmlinux.before /tmp/vmlinux.after
linux-2.6-tip/kernel/trace/trace.c:
trace_vprintk | -5
trace_graph_return | -22
trace_graph_entry | -26
trace_function | -45
__ftrace_trace_stack | -27
ftrace_trace_userstack | -29
tracing_sched_switch_trace | -66
tracing_stop | +1
trace_seq_to_user | -1
ftrace_trace_special | -63
ftrace_special | +1
tracing_sched_wakeup_trace | -70
tracing_reset_online_cpus | -1
13 functions changed, 2 bytes added, 355 bytes removed, diff: -353
linux-2.6-tip/block/blktrace.c:
__blk_add_trace | -58
1 function changed, 58 bytes removed, diff: -58
linux-2.6-tip/kernel/trace/trace.c:
trace_buffer_lock_reserve | +88
trace_buffer_unlock_commit | +86
2 functions changed, 174 bytes added, diff: +174
/tmp/vmlinux.after:
16 functions changed, 176 bytes added, 413 bytes removed, diff: -237
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Acked-by: Frédéric Weisbecker <fweisbec@gmail.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-06 02:14:13 +08:00
|
|
|
trace_buffer_unlock_commit(tr, event, flags, pc);
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
void
|
|
|
|
tracing_sched_wakeup_trace(struct trace_array *tr,
|
2008-05-13 03:20:51 +08:00
|
|
|
struct task_struct *wakee,
|
|
|
|
struct task_struct *curr,
|
2008-10-02 01:14:09 +08:00
|
|
|
unsigned long flags, int pc)
|
2008-05-13 03:20:51 +08:00
|
|
|
{
|
2008-09-30 11:02:41 +08:00
|
|
|
struct ring_buffer_event *event;
|
2008-09-30 11:02:42 +08:00
|
|
|
struct ctx_switch_entry *entry;
|
2008-05-13 03:20:51 +08:00
|
|
|
|
tracing: Introduce trace_buffer_{lock_reserve,unlock_commit}
Impact: new API
These new functions do what previously was being open coded, reducing
the number of details ftrace plugin writers have to worry about.
It also standardizes the handling of stacktrace, userstacktrace and
other trace options we may introduce in the future.
With this patch, for instance, the blk tracer (and some others already
in the tree) can use the "userstacktrace" /d/tracing/trace_options
facility.
$ codiff /tmp/vmlinux.before /tmp/vmlinux.after
linux-2.6-tip/kernel/trace/trace.c:
trace_vprintk | -5
trace_graph_return | -22
trace_graph_entry | -26
trace_function | -45
__ftrace_trace_stack | -27
ftrace_trace_userstack | -29
tracing_sched_switch_trace | -66
tracing_stop | +1
trace_seq_to_user | -1
ftrace_trace_special | -63
ftrace_special | +1
tracing_sched_wakeup_trace | -70
tracing_reset_online_cpus | -1
13 functions changed, 2 bytes added, 355 bytes removed, diff: -353
linux-2.6-tip/block/blktrace.c:
__blk_add_trace | -58
1 function changed, 58 bytes removed, diff: -58
linux-2.6-tip/kernel/trace/trace.c:
trace_buffer_lock_reserve | +88
trace_buffer_unlock_commit | +86
2 functions changed, 174 bytes added, diff: +174
/tmp/vmlinux.after:
16 functions changed, 176 bytes added, 413 bytes removed, diff: -237
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Acked-by: Frédéric Weisbecker <fweisbec@gmail.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-06 02:14:13 +08:00
|
|
|
event = trace_buffer_lock_reserve(tr, TRACE_WAKE,
|
|
|
|
sizeof(*entry), flags, pc);
|
2008-09-30 11:02:41 +08:00
|
|
|
if (!event)
|
|
|
|
return;
|
|
|
|
entry = ring_buffer_event_data(event);
|
2008-09-30 11:02:42 +08:00
|
|
|
entry->prev_pid = curr->pid;
|
|
|
|
entry->prev_prio = curr->prio;
|
|
|
|
entry->prev_state = curr->state;
|
|
|
|
entry->next_pid = wakee->pid;
|
|
|
|
entry->next_prio = wakee->prio;
|
|
|
|
entry->next_state = wakee->state;
|
|
|
|
entry->next_cpu = task_cpu(wakee);
|
2009-02-11 09:25:00 +08:00
|
|
|
|
|
|
|
ring_buffer_unlock_commit(tr->buffer, event);
|
|
|
|
ftrace_trace_stack(tr, flags, 6, pc);
|
|
|
|
ftrace_trace_userstack(tr, flags, pc);
|
2008-05-13 03:20:51 +08:00
|
|
|
}
|
|
|
|
|
2008-05-22 12:22:18 +08:00
|
|
|
void
|
|
|
|
ftrace_special(unsigned long arg1, unsigned long arg2, unsigned long arg3)
|
|
|
|
{
|
|
|
|
struct trace_array *tr = &global_trace;
|
|
|
|
struct trace_array_cpu *data;
|
2008-11-11 12:07:30 +08:00
|
|
|
unsigned long flags;
|
2008-05-22 12:22:18 +08:00
|
|
|
int cpu;
|
2008-10-02 01:14:09 +08:00
|
|
|
int pc;
|
2008-05-22 12:22:18 +08:00
|
|
|
|
2008-11-08 11:36:02 +08:00
|
|
|
if (tracing_disabled)
|
2008-05-22 12:22:18 +08:00
|
|
|
return;
|
|
|
|
|
2008-10-02 01:14:09 +08:00
|
|
|
pc = preempt_count();
|
2008-11-11 12:07:30 +08:00
|
|
|
local_irq_save(flags);
|
2008-05-22 12:22:18 +08:00
|
|
|
cpu = raw_smp_processor_id();
|
|
|
|
data = tr->data[cpu];
|
|
|
|
|
2008-11-11 12:07:30 +08:00
|
|
|
if (likely(atomic_inc_return(&data->disabled) == 1))
|
2009-02-05 14:13:37 +08:00
|
|
|
ftrace_trace_special(tr, arg1, arg2, arg3, pc);
|
2008-05-22 12:22:18 +08:00
|
|
|
|
2008-11-11 12:07:30 +08:00
|
|
|
atomic_dec(&data->disabled);
|
|
|
|
local_irq_restore(flags);
|
2008-05-22 12:22:18 +08:00
|
|
|
}
|
|
|
|
|
2008-11-26 04:07:04 +08:00
|
|
|
#ifdef CONFIG_FUNCTION_GRAPH_TRACER
|
2008-12-03 12:50:05 +08:00
|
|
|
int trace_graph_entry(struct ftrace_graph_ent *trace)
|
2008-11-11 14:14:25 +08:00
|
|
|
{
|
|
|
|
struct trace_array *tr = &global_trace;
|
|
|
|
struct trace_array_cpu *data;
|
|
|
|
unsigned long flags;
|
|
|
|
long disabled;
|
|
|
|
int cpu;
|
|
|
|
int pc;
|
|
|
|
|
2008-12-04 04:36:59 +08:00
|
|
|
if (!ftrace_trace_task(current))
|
|
|
|
return 0;
|
|
|
|
|
2008-12-04 04:36:57 +08:00
|
|
|
if (!ftrace_graph_addr(trace->func))
|
|
|
|
return 0;
|
|
|
|
|
2008-12-03 04:34:05 +08:00
|
|
|
local_irq_save(flags);
|
2008-11-11 14:14:25 +08:00
|
|
|
cpu = raw_smp_processor_id();
|
|
|
|
data = tr->data[cpu];
|
|
|
|
disabled = atomic_inc_return(&data->disabled);
|
|
|
|
if (likely(disabled == 1)) {
|
|
|
|
pc = preempt_count();
|
2009-02-05 14:13:37 +08:00
|
|
|
__trace_graph_entry(tr, trace, flags, pc);
|
2008-11-26 07:57:25 +08:00
|
|
|
}
|
2008-12-04 04:36:57 +08:00
|
|
|
/* Only do the atomic if it is not already set */
|
|
|
|
if (!test_tsk_trace_graph(current))
|
|
|
|
set_tsk_trace_graph(current);
|
2008-11-26 07:57:25 +08:00
|
|
|
atomic_dec(&data->disabled);
|
2008-12-03 04:34:05 +08:00
|
|
|
local_irq_restore(flags);
|
2008-12-03 12:50:05 +08:00
|
|
|
|
|
|
|
return 1;
|
2008-11-26 07:57:25 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void trace_graph_return(struct ftrace_graph_ret *trace)
|
|
|
|
{
|
|
|
|
struct trace_array *tr = &global_trace;
|
|
|
|
struct trace_array_cpu *data;
|
|
|
|
unsigned long flags;
|
|
|
|
long disabled;
|
|
|
|
int cpu;
|
|
|
|
int pc;
|
|
|
|
|
2008-12-03 04:34:05 +08:00
|
|
|
local_irq_save(flags);
|
2008-11-26 07:57:25 +08:00
|
|
|
cpu = raw_smp_processor_id();
|
|
|
|
data = tr->data[cpu];
|
|
|
|
disabled = atomic_inc_return(&data->disabled);
|
|
|
|
if (likely(disabled == 1)) {
|
|
|
|
pc = preempt_count();
|
2009-02-05 14:13:37 +08:00
|
|
|
__trace_graph_return(tr, trace, flags, pc);
|
2008-11-11 14:14:25 +08:00
|
|
|
}
|
2008-12-04 04:36:57 +08:00
|
|
|
if (!trace->depth)
|
|
|
|
clear_tsk_trace_graph(current);
|
2008-11-11 14:14:25 +08:00
|
|
|
atomic_dec(&data->disabled);
|
2008-12-03 04:34:05 +08:00
|
|
|
local_irq_restore(flags);
|
2008-11-11 14:14:25 +08:00
|
|
|
}
|
2008-11-26 04:07:04 +08:00
|
|
|
#endif /* CONFIG_FUNCTION_GRAPH_TRACER */
|
2008-11-11 14:14:25 +08:00
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
/*
 * Per-file output options.
 * NOTE(review): the values 1 and 2 look like independent bit flags that
 * can be OR-ed together -- confirm against the users of this enum.
 */
enum trace_file_type {
	TRACE_FILE_LAT_FMT	= 0x1,
	TRACE_FILE_ANNOTATE	= 0x2,
};
|
|
|
|
|
2008-11-12 19:59:32 +08:00
|
|
|
static void trace_iterator_increment(struct trace_iterator *iter)
|
2008-09-04 05:42:51 +08:00
|
|
|
{
|
2008-10-01 12:29:53 +08:00
|
|
|
/* Don't allow ftrace to trace into the ring buffers */
|
|
|
|
ftrace_disable_cpu();
|
|
|
|
|
2008-09-04 05:42:51 +08:00
|
|
|
iter->idx++;
|
2008-10-01 12:29:53 +08:00
|
|
|
if (iter->buffer_iter[iter->cpu])
|
|
|
|
ring_buffer_read(iter->buffer_iter[iter->cpu], NULL);
|
|
|
|
|
|
|
|
ftrace_enable_cpu();
|
2008-09-04 05:42:51 +08:00
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
static struct trace_entry *
|
2008-09-30 11:02:41 +08:00
|
|
|
peek_next_entry(struct trace_iterator *iter, int cpu, u64 *ts)
|
2008-08-02 00:26:41 +08:00
|
|
|
{
|
2008-09-30 11:02:41 +08:00
|
|
|
struct ring_buffer_event *event;
|
|
|
|
struct ring_buffer_iter *buf_iter = iter->buffer_iter[cpu];
|
2008-08-02 00:26:41 +08:00
|
|
|
|
2008-10-01 12:29:53 +08:00
|
|
|
/* Don't allow ftrace to trace into the ring buffers */
|
|
|
|
ftrace_disable_cpu();
|
|
|
|
|
|
|
|
if (buf_iter)
|
|
|
|
event = ring_buffer_iter_peek(buf_iter, ts);
|
|
|
|
else
|
|
|
|
event = ring_buffer_peek(iter->tr->buffer, cpu, ts);
|
|
|
|
|
|
|
|
ftrace_enable_cpu();
|
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
return event ? ring_buffer_event_data(event) : NULL;
|
2008-08-02 00:26:41 +08:00
|
|
|
}
|
2008-10-01 12:29:53 +08:00
|
|
|
|
2008-08-02 00:26:41 +08:00
|
|
|
static struct trace_entry *
|
2008-09-30 11:02:41 +08:00
|
|
|
__find_next_entry(struct trace_iterator *iter, int *ent_cpu, u64 *ent_ts)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
2008-09-30 11:02:41 +08:00
|
|
|
struct ring_buffer *buffer = iter->tr->buffer;
|
2008-05-13 03:20:42 +08:00
|
|
|
struct trace_entry *ent, *next = NULL;
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
int cpu_file = iter->cpu_file;
|
2008-09-30 11:02:41 +08:00
|
|
|
u64 next_ts = 0, ts;
|
2008-05-13 03:20:42 +08:00
|
|
|
int next_cpu = -1;
|
|
|
|
int cpu;
|
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
/*
|
|
|
|
* If we are in a per_cpu trace file, don't bother by iterating over
|
|
|
|
* all cpu and peek directly.
|
|
|
|
*/
|
|
|
|
if (cpu_file > TRACE_PIPE_ALL_CPU) {
|
|
|
|
if (ring_buffer_empty_cpu(buffer, cpu_file))
|
|
|
|
return NULL;
|
|
|
|
ent = peek_next_entry(iter, cpu_file, ent_ts);
|
|
|
|
if (ent_cpu)
|
|
|
|
*ent_cpu = cpu_file;
|
|
|
|
|
|
|
|
return ent;
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
for_each_tracing_cpu(cpu) {
|
2008-08-02 00:26:41 +08:00
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
if (ring_buffer_empty_cpu(buffer, cpu))
|
|
|
|
continue;
|
2008-08-02 00:26:41 +08:00
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
ent = peek_next_entry(iter, cpu, &ts);
|
2008-08-02 00:26:41 +08:00
|
|
|
|
2008-05-13 03:20:46 +08:00
|
|
|
/*
|
|
|
|
* Pick the entry with the smallest timestamp:
|
|
|
|
*/
|
2008-09-30 11:02:41 +08:00
|
|
|
if (ent && (!next || ts < next_ts)) {
|
2008-05-13 03:20:42 +08:00
|
|
|
next = ent;
|
|
|
|
next_cpu = cpu;
|
2008-09-30 11:02:41 +08:00
|
|
|
next_ts = ts;
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (ent_cpu)
|
|
|
|
*ent_cpu = next_cpu;
|
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
if (ent_ts)
|
|
|
|
*ent_ts = next_ts;
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
return next;
|
|
|
|
}
|
|
|
|
|
2008-08-02 00:26:41 +08:00
|
|
|
/* Find the next real entry, without updating the iterator itself */
|
2009-02-03 06:29:21 +08:00
|
|
|
struct trace_entry *trace_find_next_entry(struct trace_iterator *iter,
|
|
|
|
int *ent_cpu, u64 *ent_ts)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
2008-09-30 11:02:41 +08:00
|
|
|
return __find_next_entry(iter, ent_cpu, ent_ts);
|
2008-08-02 00:26:41 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Find the next real entry, and increment the iterator to the next entry */
|
|
|
|
static void *find_next_entry_inc(struct trace_iterator *iter)
|
|
|
|
{
|
2008-09-30 11:02:41 +08:00
|
|
|
iter->ent = __find_next_entry(iter, &iter->cpu, &iter->ts);
|
2008-08-02 00:26:41 +08:00
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
if (iter->ent)
|
2008-11-12 19:59:32 +08:00
|
|
|
trace_iterator_increment(iter);
|
2008-08-02 00:26:41 +08:00
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
return iter->ent ? iter : NULL;
|
2008-05-13 03:20:46 +08:00
|
|
|
}
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
static void trace_consume(struct trace_iterator *iter)
|
2008-05-13 03:20:46 +08:00
|
|
|
{
|
2008-10-01 12:29:53 +08:00
|
|
|
/* Don't allow ftrace to trace into the ring buffers */
|
|
|
|
ftrace_disable_cpu();
|
2008-09-30 11:02:41 +08:00
|
|
|
ring_buffer_consume(iter->tr->buffer, iter->cpu, &iter->ts);
|
2008-10-01 12:29:53 +08:00
|
|
|
ftrace_enable_cpu();
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
/*
 * seq_file ->next callback: move the trace iterator forward until its
 * index reaches the position passed in, and bump *pos by one.
 *
 * @v is not used; the iterator comes from m->private.
 *
 * Returns the iterator while entries are available, NULL when the
 * requested position lies behind the iterator or the entries ran out.
 */
static void *s_next(struct seq_file *m, void *v, loff_t *pos)
{
	struct trace_iterator *iter = m->private;
	int target = (int)*pos;
	void *cur;

	(*pos)++;

	/* can't go backwards */
	if (iter->idx > target)
		return NULL;

	/* A negative index means nothing has been fetched yet. */
	cur = (iter->idx < 0) ? find_next_entry_inc(iter) : iter;

	while (cur && iter->idx < target)
		cur = find_next_entry_inc(iter);

	iter->pos = *pos;

	return cur;
}
|
|
|
|
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the same
time, we want the read/splice callbacks for tracing files to be
reentrant.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
/*
|
|
|
|
* No necessary locking here. The worst thing which can
|
|
|
|
* happen is loosing events consumed at the same time
|
|
|
|
* by a trace_pipe reader.
|
|
|
|
* Other than that, we don't risk to crash the ring buffer
|
|
|
|
* because it serializes the readers.
|
|
|
|
*
|
|
|
|
* The current tracer is copied to avoid a global locking
|
|
|
|
* all around.
|
|
|
|
*/
|
2008-05-13 03:20:42 +08:00
|
|
|
static void *s_start(struct seq_file *m, loff_t *pos)
|
|
|
|
{
|
|
|
|
struct trace_iterator *iter = m->private;
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
static struct tracer *old_tracer;
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
int cpu_file = iter->cpu_file;
|
2008-05-13 03:20:42 +08:00
|
|
|
void *p = NULL;
|
|
|
|
loff_t l = 0;
|
2008-09-30 11:02:41 +08:00
|
|
|
int cpu;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
/* copy the tracer to avoid using a global lock all around */
|
2008-05-13 03:20:42 +08:00
|
|
|
mutex_lock(&trace_types_lock);
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
if (unlikely(old_tracer != current_trace && current_trace)) {
|
|
|
|
old_tracer = current_trace;
|
|
|
|
*iter->trace = *current_trace;
|
2008-05-13 03:20:56 +08:00
|
|
|
}
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
mutex_unlock(&trace_types_lock);
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
atomic_inc(&trace_record_cmdline_disabled);
|
|
|
|
|
|
|
|
if (*pos != iter->pos) {
|
|
|
|
iter->ent = NULL;
|
|
|
|
iter->cpu = 0;
|
|
|
|
iter->idx = -1;
|
|
|
|
|
2008-10-01 12:29:53 +08:00
|
|
|
ftrace_disable_cpu();
|
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
if (cpu_file == TRACE_PIPE_ALL_CPU) {
|
|
|
|
for_each_tracing_cpu(cpu)
|
|
|
|
ring_buffer_iter_reset(iter->buffer_iter[cpu]);
|
|
|
|
} else
|
|
|
|
ring_buffer_iter_reset(iter->buffer_iter[cpu_file]);
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-10-01 12:29:53 +08:00
|
|
|
ftrace_enable_cpu();
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
for (p = iter; p && l < *pos; p = s_next(m, p, &l))
|
|
|
|
;
|
|
|
|
|
|
|
|
} else {
|
2008-05-13 03:20:43 +08:00
|
|
|
l = *pos - 1;
|
2008-05-13 03:20:42 +08:00
|
|
|
p = s_next(m, p, &l);
|
|
|
|
}
|
|
|
|
|
|
|
|
return p;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void s_stop(struct seq_file *m, void *p)
|
|
|
|
{
|
|
|
|
atomic_dec(&trace_record_cmdline_disabled);
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
/*
 * Write the latency-format column legend into @m.
 *
 * Every legend row is emitted with its own seq_puts() call, top to bottom.
 * NOTE(review): the padding inside these literals is reproduced exactly as
 * it appears in this view; confirm the column alignment against real
 * output.
 */
static void print_lat_help_header(struct seq_file *m)
{
	static const char * const legend[] = {
		"# _------=> CPU# \n",
		"# / _-----=> irqs-off \n",
		"# | / _----=> need-resched \n",
		"# || / _---=> hardirq/softirq \n",
		"# ||| / _--=> preempt-depth \n",
		"# |||| / \n",
		"# ||||| delay \n",
		"# cmd pid ||||| time | caller \n",
		"# \\ / ||||| \\ | / \n",
	};
	unsigned int row;

	for (row = 0; row < sizeof(legend) / sizeof(legend[0]); row++)
		seq_puts(m, legend[row]);
}
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
/*
 * Write the two-row column legend for the default trace format into @m.
 *
 * Each row goes out through a separate seq_puts() call.
 * NOTE(review): the padding inside these literals is reproduced exactly as
 * it appears in this view; confirm the column alignment against real
 * output.
 */
static void print_func_help_header(struct seq_file *m)
{
	static const char * const legend[] = {
		"# TASK-PID CPU# TIMESTAMP FUNCTION\n",
		"# | | | | |\n",
	};
	unsigned int row;

	for (row = 0; row < sizeof(legend) / sizeof(legend[0]); row++)
		seq_puts(m, legend[row]);
}
|
|
|
|
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
static void
|
2008-05-13 03:20:42 +08:00
|
|
|
print_trace_header(struct seq_file *m, struct trace_iterator *iter)
|
|
|
|
{
|
|
|
|
unsigned long sym_flags = (trace_flags & TRACE_ITER_SYM_MASK);
|
|
|
|
struct trace_array *tr = iter->tr;
|
|
|
|
struct trace_array_cpu *data = tr->data[tr->cpu];
|
|
|
|
struct tracer *type = current_trace;
|
2008-09-30 11:02:41 +08:00
|
|
|
unsigned long total;
|
|
|
|
unsigned long entries;
|
2008-05-13 03:20:42 +08:00
|
|
|
const char *name = "preemption";
|
|
|
|
|
|
|
|
if (type)
|
|
|
|
name = type->name;
|
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
entries = ring_buffer_entries(iter->tr->buffer);
|
|
|
|
total = entries +
|
|
|
|
ring_buffer_overruns(iter->tr->buffer);
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
seq_printf(m, "%s latency trace v1.1.5 on %s\n",
|
|
|
|
name, UTS_RELEASE);
|
|
|
|
seq_puts(m, "-----------------------------------"
|
|
|
|
"---------------------------------\n");
|
|
|
|
seq_printf(m, " latency: %lu us, #%lu/%lu, CPU#%d |"
|
|
|
|
" (M:%s VP:%d, KP:%d, SP:%d HP:%d",
|
2008-05-13 03:20:44 +08:00
|
|
|
nsecs_to_usecs(data->saved_latency),
|
2008-05-13 03:20:42 +08:00
|
|
|
entries,
|
2008-05-13 03:20:43 +08:00
|
|
|
total,
|
2008-05-13 03:20:42 +08:00
|
|
|
tr->cpu,
|
|
|
|
#if defined(CONFIG_PREEMPT_NONE)
|
|
|
|
"server",
|
|
|
|
#elif defined(CONFIG_PREEMPT_VOLUNTARY)
|
|
|
|
"desktop",
|
2008-07-11 08:58:12 +08:00
|
|
|
#elif defined(CONFIG_PREEMPT)
|
2008-05-13 03:20:42 +08:00
|
|
|
"preempt",
|
|
|
|
#else
|
|
|
|
"unknown",
|
|
|
|
#endif
|
|
|
|
/* These are reserved for later use */
|
|
|
|
0, 0, 0, 0);
|
|
|
|
#ifdef CONFIG_SMP
|
|
|
|
seq_printf(m, " #P:%d)\n", num_online_cpus());
|
|
|
|
#else
|
|
|
|
seq_puts(m, ")\n");
|
|
|
|
#endif
|
|
|
|
seq_puts(m, " -----------------\n");
|
|
|
|
seq_printf(m, " | task: %.16s-%d "
|
|
|
|
"(uid:%d nice:%ld policy:%ld rt_prio:%ld)\n",
|
|
|
|
data->comm, data->pid, data->uid, data->nice,
|
|
|
|
data->policy, data->rt_priority);
|
|
|
|
seq_puts(m, " -----------------\n");
|
|
|
|
|
|
|
|
if (data->critical_start) {
|
|
|
|
seq_puts(m, " => started at: ");
|
2008-05-13 03:20:46 +08:00
|
|
|
seq_print_ip_sym(&iter->seq, data->critical_start, sym_flags);
|
|
|
|
trace_print_seq(m, &iter->seq);
|
2008-05-13 03:20:42 +08:00
|
|
|
seq_puts(m, "\n => ended at: ");
|
2008-05-13 03:20:46 +08:00
|
|
|
seq_print_ip_sym(&iter->seq, data->critical_end, sym_flags);
|
|
|
|
trace_print_seq(m, &iter->seq);
|
2008-05-13 03:20:42 +08:00
|
|
|
seq_puts(m, "\n");
|
|
|
|
}
|
|
|
|
|
|
|
|
seq_puts(m, "\n");
|
|
|
|
}
|
|
|
|
|
2008-11-08 11:36:02 +08:00
|
|
|
static void test_cpu_buff_start(struct trace_iterator *iter)
|
|
|
|
{
|
|
|
|
struct trace_seq *s = &iter->seq;
|
|
|
|
|
2008-11-13 06:52:38 +08:00
|
|
|
if (!(trace_flags & TRACE_ITER_ANNOTATE))
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (!(iter->iter_flags & TRACE_FILE_ANNOTATE))
|
|
|
|
return;
|
|
|
|
|
2009-01-01 07:42:23 +08:00
|
|
|
if (cpumask_test_cpu(iter->cpu, iter->started))
|
2008-11-08 11:36:02 +08:00
|
|
|
return;
|
|
|
|
|
2009-01-01 07:42:23 +08:00
|
|
|
cpumask_set_cpu(iter->cpu, iter->started);
|
2008-11-08 11:36:02 +08:00
|
|
|
trace_seq_printf(s, "##### CPU %u buffer started ####\n", iter->cpu);
|
|
|
|
}
|
|
|
|
|
2009-02-03 06:29:21 +08:00
|
|
|
static enum print_line_t print_lat_fmt(struct trace_iterator *iter)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
2008-05-13 03:20:46 +08:00
|
|
|
struct trace_seq *s = &iter->seq;
|
2008-05-13 03:20:42 +08:00
|
|
|
unsigned long sym_flags = (trace_flags & TRACE_ITER_SYM_MASK);
|
2008-12-24 12:24:13 +08:00
|
|
|
struct trace_event *event;
|
2008-05-13 03:20:42 +08:00
|
|
|
struct trace_entry *entry = iter->ent;
|
2008-08-02 00:26:41 +08:00
|
|
|
|
2008-11-08 11:36:02 +08:00
|
|
|
test_cpu_buff_start(iter);
|
|
|
|
|
2009-02-03 06:29:21 +08:00
|
|
|
event = ftrace_find_event(entry->type);
|
|
|
|
|
|
|
|
if (trace_flags & TRACE_ITER_CONTEXT_INFO) {
|
2009-02-04 06:20:41 +08:00
|
|
|
if (!trace_print_lat_context(iter))
|
|
|
|
goto partial;
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
2008-09-30 11:02:42 +08:00
|
|
|
|
2009-02-05 06:16:39 +08:00
|
|
|
if (event)
|
2009-02-04 06:20:41 +08:00
|
|
|
return event->latency_trace(iter, sym_flags);
|
|
|
|
|
|
|
|
if (!trace_seq_printf(s, "Unknown type %d\n", entry->type))
|
|
|
|
goto partial;
|
2008-11-22 19:28:47 +08:00
|
|
|
|
2008-09-30 02:18:34 +08:00
|
|
|
return TRACE_TYPE_HANDLED;
|
2009-02-04 06:20:41 +08:00
|
|
|
partial:
|
|
|
|
return TRACE_TYPE_PARTIAL_LINE;
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-09-30 02:18:34 +08:00
|
|
|
static enum print_line_t print_trace_fmt(struct trace_iterator *iter)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
2008-05-13 03:20:46 +08:00
|
|
|
struct trace_seq *s = &iter->seq;
|
2008-05-13 03:20:42 +08:00
|
|
|
unsigned long sym_flags = (trace_flags & TRACE_ITER_SYM_MASK);
|
2008-05-13 03:20:45 +08:00
|
|
|
struct trace_entry *entry;
|
2008-12-24 12:24:13 +08:00
|
|
|
struct trace_event *event;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-05-13 03:20:45 +08:00
|
|
|
entry = iter->ent;
|
2008-08-02 00:26:41 +08:00
|
|
|
|
2008-11-08 11:36:02 +08:00
|
|
|
test_cpu_buff_start(iter);
|
|
|
|
|
2009-02-03 06:29:21 +08:00
|
|
|
event = ftrace_find_event(entry->type);
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2009-02-03 06:29:21 +08:00
|
|
|
if (trace_flags & TRACE_ITER_CONTEXT_INFO) {
|
2009-02-04 06:20:41 +08:00
|
|
|
if (!trace_print_context(iter))
|
|
|
|
goto partial;
|
2009-02-03 06:29:21 +08:00
|
|
|
}
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2009-02-05 06:16:39 +08:00
|
|
|
if (event)
|
2009-02-04 06:20:41 +08:00
|
|
|
return event->trace(iter, sym_flags);
|
|
|
|
|
|
|
|
if (!trace_seq_printf(s, "Unknown type %d\n", entry->type))
|
|
|
|
goto partial;
|
2008-11-22 19:28:47 +08:00
|
|
|
|
2008-09-30 02:18:34 +08:00
|
|
|
return TRACE_TYPE_HANDLED;
|
2009-02-04 06:20:41 +08:00
|
|
|
partial:
|
|
|
|
return TRACE_TYPE_PARTIAL_LINE;
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-09-30 02:18:34 +08:00
|
|
|
static enum print_line_t print_raw_fmt(struct trace_iterator *iter)
|
2008-05-13 03:20:47 +08:00
|
|
|
{
|
|
|
|
struct trace_seq *s = &iter->seq;
|
|
|
|
struct trace_entry *entry;
|
2008-12-24 12:24:13 +08:00
|
|
|
struct trace_event *event;
|
2008-05-13 03:20:47 +08:00
|
|
|
|
|
|
|
entry = iter->ent;
|
2008-08-02 00:26:41 +08:00
|
|
|
|
2009-02-03 06:29:21 +08:00
|
|
|
if (trace_flags & TRACE_ITER_CONTEXT_INFO) {
|
2009-02-04 06:20:41 +08:00
|
|
|
if (!trace_seq_printf(s, "%d %d %llu ",
|
|
|
|
entry->pid, iter->cpu, iter->ts))
|
|
|
|
goto partial;
|
2009-02-03 06:29:21 +08:00
|
|
|
}
|
2008-05-13 03:20:47 +08:00
|
|
|
|
2008-12-24 12:24:13 +08:00
|
|
|
event = ftrace_find_event(entry->type);
|
2009-02-05 06:16:39 +08:00
|
|
|
if (event)
|
2009-02-04 06:20:41 +08:00
|
|
|
return event->raw(iter, 0);
|
|
|
|
|
|
|
|
if (!trace_seq_printf(s, "%d ?\n", entry->type))
|
|
|
|
goto partial;
|
2008-09-30 11:02:42 +08:00
|
|
|
|
2008-09-30 02:18:34 +08:00
|
|
|
return TRACE_TYPE_HANDLED;
|
2009-02-04 06:20:41 +08:00
|
|
|
partial:
|
|
|
|
return TRACE_TYPE_PARTIAL_LINE;
|
2008-05-13 03:20:47 +08:00
|
|
|
}
|
|
|
|
|
2008-09-30 02:18:34 +08:00
|
|
|
static enum print_line_t print_hex_fmt(struct trace_iterator *iter)
|
2008-05-13 03:20:49 +08:00
|
|
|
{
|
|
|
|
struct trace_seq *s = &iter->seq;
|
|
|
|
unsigned char newline = '\n';
|
|
|
|
struct trace_entry *entry;
|
2008-12-24 12:24:13 +08:00
|
|
|
struct trace_event *event;
|
2008-05-13 03:20:49 +08:00
|
|
|
|
|
|
|
entry = iter->ent;
|
2008-08-02 00:26:41 +08:00
|
|
|
|
2009-02-03 06:29:21 +08:00
|
|
|
if (trace_flags & TRACE_ITER_CONTEXT_INFO) {
|
|
|
|
SEQ_PUT_HEX_FIELD_RET(s, entry->pid);
|
|
|
|
SEQ_PUT_HEX_FIELD_RET(s, iter->cpu);
|
|
|
|
SEQ_PUT_HEX_FIELD_RET(s, iter->ts);
|
|
|
|
}
|
2008-05-13 03:20:49 +08:00
|
|
|
|
2008-12-24 12:24:13 +08:00
|
|
|
event = ftrace_find_event(entry->type);
|
2009-02-05 06:16:39 +08:00
|
|
|
if (event) {
|
2009-02-04 08:05:50 +08:00
|
|
|
enum print_line_t ret = event->hex(iter, 0);
|
2009-02-04 06:20:41 +08:00
|
|
|
if (ret != TRACE_TYPE_HANDLED)
|
|
|
|
return ret;
|
|
|
|
}
|
2008-10-01 22:52:51 +08:00
|
|
|
|
2008-05-13 03:20:49 +08:00
|
|
|
SEQ_PUT_FIELD_RET(s, newline);
|
|
|
|
|
2008-09-30 02:18:34 +08:00
|
|
|
return TRACE_TYPE_HANDLED;
|
2008-05-13 03:20:49 +08:00
|
|
|
}
|
|
|
|
|
2008-12-14 03:18:13 +08:00
|
|
|
static enum print_line_t print_printk_msg_only(struct trace_iterator *iter)
|
|
|
|
{
|
|
|
|
struct trace_seq *s = &iter->seq;
|
|
|
|
struct trace_entry *entry = iter->ent;
|
|
|
|
struct print_entry *field;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
trace_assign_type(field, entry);
|
|
|
|
|
2009-02-03 06:29:21 +08:00
|
|
|
ret = trace_seq_printf(s, "%s", field->buf);
|
2008-12-14 03:18:13 +08:00
|
|
|
if (!ret)
|
|
|
|
return TRACE_TYPE_PARTIAL_LINE;
|
|
|
|
|
|
|
|
return TRACE_TYPE_HANDLED;
|
|
|
|
}
|
|
|
|
|
2008-09-30 02:18:34 +08:00
|
|
|
static enum print_line_t print_bin_fmt(struct trace_iterator *iter)
|
2008-05-13 03:20:47 +08:00
|
|
|
{
|
|
|
|
struct trace_seq *s = &iter->seq;
|
|
|
|
struct trace_entry *entry;
|
2008-12-24 12:24:13 +08:00
|
|
|
struct trace_event *event;
|
2008-05-13 03:20:47 +08:00
|
|
|
|
|
|
|
entry = iter->ent;
|
2008-08-02 00:26:41 +08:00
|
|
|
|
2009-02-03 06:29:21 +08:00
|
|
|
if (trace_flags & TRACE_ITER_CONTEXT_INFO) {
|
|
|
|
SEQ_PUT_FIELD_RET(s, entry->pid);
|
2009-02-08 08:38:43 +08:00
|
|
|
SEQ_PUT_FIELD_RET(s, iter->cpu);
|
2009-02-03 06:29:21 +08:00
|
|
|
SEQ_PUT_FIELD_RET(s, iter->ts);
|
|
|
|
}
|
2008-05-13 03:20:47 +08:00
|
|
|
|
2008-12-24 12:24:13 +08:00
|
|
|
event = ftrace_find_event(entry->type);
|
2009-02-05 06:16:39 +08:00
|
|
|
return event ? event->binary(iter, 0) : TRACE_TYPE_HANDLED;
|
2008-05-13 03:20:47 +08:00
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
static int trace_empty(struct trace_iterator *iter)
|
|
|
|
{
|
|
|
|
int cpu;
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
for_each_tracing_cpu(cpu) {
|
2008-10-01 12:29:53 +08:00
|
|
|
if (iter->buffer_iter[cpu]) {
|
|
|
|
if (!ring_buffer_iter_empty(iter->buffer_iter[cpu]))
|
|
|
|
return 0;
|
|
|
|
} else {
|
|
|
|
if (!ring_buffer_empty_cpu(iter->tr->buffer, cpu))
|
|
|
|
return 0;
|
|
|
|
}
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
2008-10-01 12:29:53 +08:00
|
|
|
|
2008-10-01 00:13:45 +08:00
|
|
|
return 1;
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-09-30 02:18:34 +08:00
|
|
|
static enum print_line_t print_trace_line(struct trace_iterator *iter)
|
2008-05-13 03:20:47 +08:00
|
|
|
{
|
2008-09-30 02:18:34 +08:00
|
|
|
enum print_line_t ret;
|
|
|
|
|
|
|
|
if (iter->trace && iter->trace->print_line) {
|
|
|
|
ret = iter->trace->print_line(iter);
|
|
|
|
if (ret != TRACE_TYPE_UNHANDLED)
|
|
|
|
return ret;
|
|
|
|
}
|
2008-05-24 03:37:28 +08:00
|
|
|
|
2008-12-14 03:18:13 +08:00
|
|
|
if (iter->ent->type == TRACE_PRINT &&
|
|
|
|
trace_flags & TRACE_ITER_PRINTK &&
|
|
|
|
trace_flags & TRACE_ITER_PRINTK_MSGONLY)
|
|
|
|
return print_printk_msg_only(iter);
|
|
|
|
|
2008-05-13 03:20:47 +08:00
|
|
|
if (trace_flags & TRACE_ITER_BIN)
|
|
|
|
return print_bin_fmt(iter);
|
|
|
|
|
2008-05-13 03:20:49 +08:00
|
|
|
if (trace_flags & TRACE_ITER_HEX)
|
|
|
|
return print_hex_fmt(iter);
|
|
|
|
|
2008-05-13 03:20:47 +08:00
|
|
|
if (trace_flags & TRACE_ITER_RAW)
|
|
|
|
return print_raw_fmt(iter);
|
|
|
|
|
|
|
|
if (iter->iter_flags & TRACE_FILE_LAT_FMT)
|
2009-02-03 06:29:21 +08:00
|
|
|
return print_lat_fmt(iter);
|
2008-05-13 03:20:47 +08:00
|
|
|
|
|
|
|
return print_trace_fmt(iter);
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
static int s_show(struct seq_file *m, void *v)
|
|
|
|
{
|
|
|
|
struct trace_iterator *iter = v;
|
|
|
|
|
|
|
|
if (iter->ent == NULL) {
|
|
|
|
if (iter->tr) {
|
|
|
|
seq_printf(m, "# tracer: %s\n", iter->trace->name);
|
|
|
|
seq_puts(m, "#\n");
|
|
|
|
}
|
2008-11-25 16:12:31 +08:00
|
|
|
if (iter->trace && iter->trace->print_header)
|
|
|
|
iter->trace->print_header(m);
|
|
|
|
else if (iter->iter_flags & TRACE_FILE_LAT_FMT) {
|
2008-05-13 03:20:42 +08:00
|
|
|
/* print nothing if the buffers are empty */
|
|
|
|
if (trace_empty(iter))
|
|
|
|
return 0;
|
|
|
|
print_trace_header(m, iter);
|
|
|
|
if (!(trace_flags & TRACE_ITER_VERBOSE))
|
|
|
|
print_lat_help_header(m);
|
|
|
|
} else {
|
|
|
|
if (!(trace_flags & TRACE_ITER_VERBOSE))
|
|
|
|
print_func_help_header(m);
|
|
|
|
}
|
|
|
|
} else {
|
2008-05-13 03:20:47 +08:00
|
|
|
print_trace_line(iter);
|
2008-05-13 03:20:46 +08:00
|
|
|
trace_print_seq(m, &iter->seq);
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct seq_operations tracer_seq_ops = {
|
2008-05-13 03:20:46 +08:00
|
|
|
.start = s_start,
|
|
|
|
.next = s_next,
|
|
|
|
.stop = s_stop,
|
|
|
|
.show = s_show,
|
2008-05-13 03:20:42 +08:00
|
|
|
};
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
static struct trace_iterator *
|
2009-02-27 13:12:38 +08:00
|
|
|
__tracing_open(struct inode *inode, struct file *file)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, in the tracing debugfs directory, three files are
available to the user for extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are currently mixed up
inside these files. Sometimes this muddles the information,
sometimes it's useful, depending on what the tracer
captures.
The tracing_cpumask file is useful to filter the output and
select only the traces captured on a custom-defined set of cpus.
But it is still not powerful enough to extract one trace buffer
per cpu at the same time.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
long cpu_file = (long) inode->i_private;
|
2009-02-27 13:12:38 +08:00
|
|
|
void *fail_ret = ERR_PTR(-ENOMEM);
|
2008-05-13 03:20:42 +08:00
|
|
|
struct trace_iterator *iter;
|
2008-09-30 11:02:41 +08:00
|
|
|
struct seq_file *m;
|
2009-02-27 13:12:38 +08:00
|
|
|
int cpu, ret;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2009-02-27 13:12:38 +08:00
|
|
|
if (tracing_disabled)
|
|
|
|
return ERR_PTR(-ENODEV);
|
2008-05-13 03:20:44 +08:00
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
iter = kzalloc(sizeof(*iter), GFP_KERNEL);
|
2009-02-27 13:12:38 +08:00
|
|
|
if (!iter)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
2008-05-13 03:20:42 +08:00
|
|
|
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same time, we want the read/splice callbacks for tracing files
to be reentrant.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
/*
|
|
|
|
* We make a copy of the current tracer to avoid concurrent
|
|
|
|
* changes on it while we are reading.
|
|
|
|
*/
|
2008-05-13 03:20:42 +08:00
|
|
|
mutex_lock(&trace_types_lock);
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
iter->trace = kzalloc(sizeof(*iter->trace), GFP_KERNEL);
|
2009-02-27 13:12:38 +08:00
|
|
|
if (!iter->trace)
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
goto fail;
|
2009-02-27 13:12:38 +08:00
|
|
|
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
if (current_trace)
|
|
|
|
*iter->trace = *current_trace;
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
if (current_trace && current_trace->print_max)
|
|
|
|
iter->tr = &max_tr;
|
|
|
|
else
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
iter->tr = &global_trace;
|
2008-05-13 03:20:42 +08:00
|
|
|
iter->pos = -1;
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
mutex_init(&iter->mutex);
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
iter->cpu_file = cpu_file;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-11-25 16:12:31 +08:00
|
|
|
/* Notify the tracer early; before we stop tracing. */
|
|
|
|
if (iter->trace && iter->trace->open)
|
2008-12-11 20:53:26 +08:00
|
|
|
iter->trace->open(iter);
|
2008-11-25 16:12:31 +08:00
|
|
|
|
2008-11-13 06:52:38 +08:00
|
|
|
/* Annotate start of buffers if we had overruns */
|
|
|
|
if (ring_buffer_overruns(iter->tr->buffer))
|
|
|
|
iter->iter_flags |= TRACE_FILE_ANNOTATE;
|
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
information such as preempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are currently mixed up
inside these files. Sometimes this garbles the information,
sometimes it's useful, depending on what the tracer
captures.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
if (iter->cpu_file == TRACE_PIPE_ALL_CPU) {
|
|
|
|
for_each_tracing_cpu(cpu) {
|
2008-11-13 06:52:38 +08:00
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
information such as preempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are currently mixed up
inside these files. Sometimes this garbles the information,
sometimes it's useful, depending on what the tracer
captures.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
iter->buffer_iter[cpu] =
|
|
|
|
ring_buffer_read_start(iter->tr->buffer, cpu);
|
2008-10-01 12:29:53 +08:00
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
information such as preempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are currently mixed up
inside these files. Sometimes this garbles the information,
sometimes it's useful, depending on what the tracer
captures.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
if (!iter->buffer_iter[cpu])
|
|
|
|
goto fail_buffer;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
cpu = iter->cpu_file;
|
2008-09-30 11:02:41 +08:00
|
|
|
iter->buffer_iter[cpu] =
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
information such as preempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are currently mixed up
inside these files. Sometimes this garbles the information,
sometimes it's useful, depending on what the tracer
captures.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
ring_buffer_read_start(iter->tr->buffer, cpu);
|
2008-10-01 12:29:53 +08:00
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
if (!iter->buffer_iter[cpu])
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
information such as preempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are currently mixed up
inside these files. Sometimes this garbles the information,
sometimes it's useful, depending on what the tracer
captures.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
goto fail;
|
2008-09-30 11:02:41 +08:00
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
/* TODO stop tracer */
|
2009-02-27 13:12:38 +08:00
|
|
|
ret = seq_open(file, &tracer_seq_ops);
|
|
|
|
if (ret < 0) {
|
|
|
|
fail_ret = ERR_PTR(ret);
|
2008-09-30 11:02:41 +08:00
|
|
|
goto fail_buffer;
|
2009-02-27 13:12:38 +08:00
|
|
|
}
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
m = file->private_data;
|
|
|
|
m->private = iter;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
/* stop the trace while dumping */
|
ftrace: restructure tracing start/stop infrastructure
Impact: change where tracing is started up and stopped
Currently, when a new tracer is selected via echo'ing a tracer name into
the current_tracer file, the startup is only done if tracing_enabled is
set to one. If tracing_enabled is changed to zero (by echo'ing 0 into
the tracing_enabled file) a full shutdown is performed.
The full startup and shutdown of a tracer can be expensive and the
user can lose out traces when echo'ing in 0 to the tracing_enabled file,
because the process takes too long. There can also be places that
the user would like to start and stop the tracer several times and
doing the full startup and shutdown of a tracer might be too expensive.
This patch performs the full startup and shutdown when a tracer is
selected. It also adds a way to do a quick start or stop of a tracer.
The quick version is just a flag that prevents the tracing from
taking place, but the overhead of the code is still there.
For example, the startup of a tracer may enable tracepoints, or enable
the function tracer. The stop and start will just set a flag to
have the tracer ignore the calls when the tracepoint or function trace
is called. The overhead of the tracer may still be present when
the tracer is stopped, but no tracing will occur. Setting the tracer
to the 'nop' tracer (or any other tracer) will perform the shutdown
of the tracer which will disable the tracepoint or disable the
function tracer.
The tracing_enabled file will simply start or stop tracing.
This change is all internal. The end result for the user should be the same
as before. If tracing_enabled is not set, no trace will happen.
If tracing_enabled is set, then the trace will happen. The tracing_enabled
variable is static between tracers. Enabling tracing_enabled and
going to another tracer will keep tracing_enabled enabled. Same
is true with disabling tracing_enabled.
This patch will now provide a fast start/stop method to the users
for enabling or disabling tracing.
Note: There were two methods to the struct tracer that were never
used: The methods start and stop. These were to be used as a hook
to the reading of the trace output, but ended up not being
necessary. These two methods are now used to enable the start
and stop of each tracer, in case the tracer needs to do more than
just not write into the buffer. For example, the irqsoff tracer
must stop recording max latencies when tracing is stopped.
Signed-off-by: Steven Rostedt <srostedt@redhat.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-11-06 05:05:44 +08:00
|
|
|
tracing_stop();
|
2008-09-30 11:02:41 +08:00
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
|
|
|
|
return iter;
|
2008-09-30 11:02:41 +08:00
|
|
|
|
|
|
|
fail_buffer:
|
|
|
|
for_each_tracing_cpu(cpu) {
|
|
|
|
if (iter->buffer_iter[cpu])
|
|
|
|
ring_buffer_read_finish(iter->buffer_iter[cpu]);
|
|
|
|
}
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
fail:
|
2008-09-30 11:02:41 +08:00
|
|
|
mutex_unlock(&trace_types_lock);
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
kfree(iter->trace);
|
2008-11-15 02:05:31 +08:00
|
|
|
kfree(iter);
|
2008-09-30 11:02:41 +08:00
|
|
|
|
2009-02-27 13:12:38 +08:00
|
|
|
return fail_ret;
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
int tracing_open_generic(struct inode *inode, struct file *filp)
|
|
|
|
{
|
2008-05-13 03:20:44 +08:00
|
|
|
if (tracing_disabled)
|
|
|
|
return -ENODEV;
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
filp->private_data = inode->i_private;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2009-02-11 02:44:12 +08:00
|
|
|
static int tracing_release(struct inode *inode, struct file *file)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
|
|
|
struct seq_file *m = (struct seq_file *)file->private_data;
|
|
|
|
struct trace_iterator *iter = m->private;
|
2008-09-30 11:02:41 +08:00
|
|
|
int cpu;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
mutex_lock(&trace_types_lock);
|
2008-09-30 11:02:41 +08:00
|
|
|
for_each_tracing_cpu(cpu) {
|
|
|
|
if (iter->buffer_iter[cpu])
|
|
|
|
ring_buffer_read_finish(iter->buffer_iter[cpu]);
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
if (iter->trace && iter->trace->close)
|
|
|
|
iter->trace->close(iter);
|
|
|
|
|
|
|
|
/* reenable tracing if it was previously enabled */
|
ftrace: restructure tracing start/stop infrastructure
Impact: change where tracing is started up and stopped
Currently, when a new tracer is selected via echo'ing a tracer name into
the current_tracer file, the startup is only done if tracing_enabled is
set to one. If tracing_enabled is changed to zero (by echo'ing 0 into
the tracing_enabled file) a full shutdown is performed.
The full startup and shutdown of a tracer can be expensive and the
user can lose out traces when echo'ing in 0 to the tracing_enabled file,
because the process takes too long. There can also be places that
the user would like to start and stop the tracer several times and
doing the full startup and shutdown of a tracer might be too expensive.
This patch performs the full startup and shutdown when a tracer is
selected. It also adds a way to do a quick start or stop of a tracer.
The quick version is just a flag that prevents the tracing from
taking place, but the overhead of the code is still there.
For example, the startup of a tracer may enable tracepoints, or enable
the function tracer. The stop and start will just set a flag to
have the tracer ignore the calls when the tracepoint or function trace
is called. The overhead of the tracer may still be present when
the tracer is stopped, but no tracing will occur. Setting the tracer
to the 'nop' tracer (or any other tracer) will perform the shutdown
of the tracer which will disable the tracepoint or disable the
function tracer.
The tracing_enabled file will simply start or stop tracing.
This change is all internal. The end result for the user should be the same
as before. If tracing_enabled is not set, no trace will happen.
If tracing_enabled is set, then the trace will happen. The tracing_enabled
variable is static between tracers. Enabling tracing_enabled and
going to another tracer will keep tracing_enabled enabled. Same
is true with disabling tracing_enabled.
This patch will now provide a fast start/stop method to the users
for enabling or disabling tracing.
Note: There were two methods to the struct tracer that were never
used: The methods start and stop. These were to be used as a hook
to the reading of the trace output, but ended up not being
necessary. These two methods are now used to enable the start
and stop of each tracer, in case the tracer needs to do more than
just not write into the buffer. For example, the irqsoff tracer
must stop recording max latencies when tracing is stopped.
Signed-off-by: Steven Rostedt <srostedt@redhat.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-11-06 05:05:44 +08:00
|
|
|
tracing_start();
|
2008-05-13 03:20:42 +08:00
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
|
|
|
|
seq_release(inode, file);
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
mutex_destroy(&iter->mutex);
|
|
|
|
kfree(iter->trace);
|
2008-05-13 03:20:42 +08:00
|
|
|
kfree(iter);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Open handler built on __tracing_open().
 *
 * Returns 0 when an iterator was set up, otherwise the error code that
 * __tracing_open() encoded in its returned pointer.
 */
static int tracing_open(struct inode *inode, struct file *file)
{
	struct trace_iterator *iter = __tracing_open(inode, file);

	if (IS_ERR(iter))
		return PTR_ERR(iter);

	return 0;
}
|
|
|
|
|
|
|
|
static int tracing_lt_open(struct inode *inode, struct file *file)
|
|
|
|
{
|
|
|
|
struct trace_iterator *iter;
|
2009-02-27 13:12:38 +08:00
|
|
|
int ret = 0;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2009-02-27 13:12:38 +08:00
|
|
|
iter = __tracing_open(inode, file);
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2009-02-27 13:12:38 +08:00
|
|
|
if (IS_ERR(iter))
|
|
|
|
ret = PTR_ERR(iter);
|
|
|
|
else
|
2008-05-13 03:20:42 +08:00
|
|
|
iter->iter_flags |= TRACE_FILE_LAT_FMT;
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2008-05-13 03:20:51 +08:00
|
|
|
static void *
|
2008-05-13 03:20:42 +08:00
|
|
|
t_next(struct seq_file *m, void *v, loff_t *pos)
|
|
|
|
{
|
|
|
|
struct tracer *t = m->private;
|
|
|
|
|
|
|
|
(*pos)++;
|
|
|
|
|
|
|
|
if (t)
|
|
|
|
t = t->next;
|
|
|
|
|
|
|
|
m->private = t;
|
|
|
|
|
|
|
|
return t;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * seq_file ->start callback: take trace_types_lock and step forward from
 * the tracer stored in m->private until *pos entries have been skipped or
 * the list runs out.
 *
 * Returns the tracer reached, or NULL. The lock is still held on return;
 * t_stop() releases it.
 */
static void *t_start(struct seq_file *m, loff_t *pos)
{
	struct tracer *cur = m->private;
	loff_t idx = 0;

	mutex_lock(&trace_types_lock);

	while (cur && idx < *pos)
		cur = t_next(m, cur, &idx);

	return cur;
}
|
|
|
|
|
|
|
|
static void t_stop(struct seq_file *m, void *p)
|
|
|
|
{
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int t_show(struct seq_file *m, void *v)
|
|
|
|
{
|
|
|
|
struct tracer *t = v;
|
|
|
|
|
|
|
|
if (!t)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
seq_printf(m, "%s", t->name);
|
|
|
|
if (t->next)
|
|
|
|
seq_putc(m, ' ');
|
|
|
|
else
|
|
|
|
seq_putc(m, '\n');
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct seq_operations show_traces_seq_ops = {
|
2008-05-13 03:20:46 +08:00
|
|
|
.start = t_start,
|
|
|
|
.next = t_next,
|
|
|
|
.stop = t_stop,
|
|
|
|
.show = t_show,
|
2008-05-13 03:20:42 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
static int show_traces_open(struct inode *inode, struct file *file)
|
|
|
|
{
|
|
|
|
int ret;
|
|
|
|
|
2008-05-13 03:20:44 +08:00
|
|
|
if (tracing_disabled)
|
|
|
|
return -ENODEV;
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
ret = seq_open(file, &show_traces_seq_ops);
|
|
|
|
if (!ret) {
|
|
|
|
struct seq_file *m = file->private_data;
|
|
|
|
m->private = trace_types;
|
|
|
|
}
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct file_operations tracing_fops = {
|
2008-05-13 03:20:46 +08:00
|
|
|
.open = tracing_open,
|
|
|
|
.read = seq_read,
|
|
|
|
.llseek = seq_lseek,
|
|
|
|
.release = tracing_release,
|
2008-05-13 03:20:42 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
static struct file_operations tracing_lt_fops = {
|
2008-05-13 03:20:46 +08:00
|
|
|
.open = tracing_lt_open,
|
|
|
|
.read = seq_read,
|
|
|
|
.llseek = seq_lseek,
|
|
|
|
.release = tracing_release,
|
2008-05-13 03:20:42 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
static struct file_operations show_traces_fops = {
|
2008-05-13 03:20:52 +08:00
|
|
|
.open = show_traces_open,
|
|
|
|
.read = seq_read,
|
|
|
|
.release = seq_release,
|
|
|
|
};
|
|
|
|
|
2008-05-13 03:20:52 +08:00
|
|
|
/*
|
|
|
|
* Only trace on a CPU if the bitmask is set:
|
|
|
|
*/
|
2009-01-01 07:42:22 +08:00
|
|
|
static cpumask_var_t tracing_cpumask;
|
2008-05-13 03:20:52 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* The tracer itself will not take this lock, but still we want
|
|
|
|
* to provide a consistent cpumask to user-space:
|
|
|
|
*/
|
|
|
|
static DEFINE_MUTEX(tracing_cpumask_update_lock);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Temporary storage for the character representation of the
|
|
|
|
* CPU bitmask (and one more byte for the newline):
|
|
|
|
*/
|
|
|
|
static char mask_str[NR_CPUS + 1];
|
|
|
|
|
2008-05-13 03:20:52 +08:00
|
|
|
static ssize_t
|
|
|
|
tracing_cpumask_read(struct file *filp, char __user *ubuf,
|
|
|
|
size_t count, loff_t *ppos)
|
|
|
|
{
|
2008-05-13 03:20:52 +08:00
|
|
|
int len;
|
2008-05-13 03:20:52 +08:00
|
|
|
|
|
|
|
mutex_lock(&tracing_cpumask_update_lock);
|
2008-05-13 03:20:52 +08:00
|
|
|
|
2009-01-01 07:42:22 +08:00
|
|
|
len = cpumask_scnprintf(mask_str, count, tracing_cpumask);
|
2008-05-13 03:20:52 +08:00
|
|
|
if (count - len < 2) {
|
|
|
|
count = -EINVAL;
|
|
|
|
goto out_err;
|
|
|
|
}
|
|
|
|
len += sprintf(mask_str + len, "\n");
|
|
|
|
count = simple_read_from_buffer(ubuf, count, ppos, mask_str, NR_CPUS+1);
|
|
|
|
|
|
|
|
out_err:
|
2008-05-13 03:20:52 +08:00
|
|
|
mutex_unlock(&tracing_cpumask_update_lock);
|
|
|
|
|
|
|
|
return count;
|
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
tracing_cpumask_write(struct file *filp, const char __user *ubuf,
|
|
|
|
size_t count, loff_t *ppos)
|
|
|
|
{
|
2008-05-13 03:20:52 +08:00
|
|
|
int err, cpu;
|
2009-01-01 07:42:22 +08:00
|
|
|
cpumask_var_t tracing_cpumask_new;
|
|
|
|
|
|
|
|
if (!alloc_cpumask_var(&tracing_cpumask_new, GFP_KERNEL))
|
|
|
|
return -ENOMEM;
|
2008-05-13 03:20:52 +08:00
|
|
|
|
|
|
|
mutex_lock(&tracing_cpumask_update_lock);
|
2009-01-01 07:42:22 +08:00
|
|
|
err = cpumask_parse_user(ubuf, count, tracing_cpumask_new);
|
2008-05-13 03:20:52 +08:00
|
|
|
if (err)
|
2008-05-13 03:20:52 +08:00
|
|
|
goto err_unlock;
|
|
|
|
|
2008-12-03 04:34:05 +08:00
|
|
|
local_irq_disable();
|
2008-05-13 03:20:55 +08:00
|
|
|
__raw_spin_lock(&ftrace_max_lock);
|
2008-05-13 03:21:00 +08:00
|
|
|
for_each_tracing_cpu(cpu) {
|
2008-05-13 03:20:52 +08:00
|
|
|
/*
|
|
|
|
* Increase/decrease the disabled counter if we are
|
|
|
|
* about to flip a bit in the cpumask:
|
|
|
|
*/
|
2009-01-01 07:42:22 +08:00
|
|
|
if (cpumask_test_cpu(cpu, tracing_cpumask) &&
|
|
|
|
!cpumask_test_cpu(cpu, tracing_cpumask_new)) {
|
2008-05-13 03:20:52 +08:00
|
|
|
atomic_inc(&global_trace.data[cpu]->disabled);
|
|
|
|
}
|
2009-01-01 07:42:22 +08:00
|
|
|
if (!cpumask_test_cpu(cpu, tracing_cpumask) &&
|
|
|
|
cpumask_test_cpu(cpu, tracing_cpumask_new)) {
|
2008-05-13 03:20:52 +08:00
|
|
|
atomic_dec(&global_trace.data[cpu]->disabled);
|
|
|
|
}
|
|
|
|
}
|
2008-05-13 03:20:55 +08:00
|
|
|
__raw_spin_unlock(&ftrace_max_lock);
|
2008-12-03 04:34:05 +08:00
|
|
|
local_irq_enable();
|
2008-05-13 03:20:52 +08:00
|
|
|
|
2009-01-01 07:42:22 +08:00
|
|
|
cpumask_copy(tracing_cpumask, tracing_cpumask_new);
|
2008-05-13 03:20:52 +08:00
|
|
|
|
|
|
|
mutex_unlock(&tracing_cpumask_update_lock);
|
2009-01-01 07:42:22 +08:00
|
|
|
free_cpumask_var(tracing_cpumask_new);
|
2008-05-13 03:20:52 +08:00
|
|
|
|
|
|
|
return count;
|
2008-05-13 03:20:52 +08:00
|
|
|
|
|
|
|
err_unlock:
|
|
|
|
mutex_unlock(&tracing_cpumask_update_lock);
|
2009-01-01 07:42:22 +08:00
|
|
|
free_cpumask_var(tracing_cpumask);
|
2008-05-13 03:20:52 +08:00
|
|
|
|
|
|
|
return err;
|
2008-05-13 03:20:52 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static struct file_operations tracing_cpumask_fops = {
|
|
|
|
.open = tracing_open_generic,
|
|
|
|
.read = tracing_cpumask_read,
|
|
|
|
.write = tracing_cpumask_write,
|
2008-05-13 03:20:42 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
static ssize_t
|
2008-11-13 06:52:37 +08:00
|
|
|
tracing_trace_options_read(struct file *filp, char __user *ubuf,
|
2008-05-13 03:20:42 +08:00
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
2009-02-27 12:55:58 +08:00
|
|
|
struct tracer_opt *trace_opts;
|
|
|
|
u32 tracer_flags;
|
|
|
|
int len = 0;
|
2008-05-13 03:20:42 +08:00
|
|
|
char *buf;
|
|
|
|
int r = 0;
|
2009-02-27 12:55:58 +08:00
|
|
|
int i;
|
2008-11-18 02:23:42 +08:00
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2009-02-10 14:03:18 +08:00
|
|
|
/* calculate max size */
|
2008-05-13 03:20:42 +08:00
|
|
|
for (i = 0; trace_options[i]; i++) {
|
|
|
|
len += strlen(trace_options[i]);
|
2009-02-27 13:22:21 +08:00
|
|
|
len += 3; /* "no" and newline */
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2009-02-27 12:55:58 +08:00
|
|
|
mutex_lock(&trace_types_lock);
|
|
|
|
tracer_flags = current_trace->flags->val;
|
|
|
|
trace_opts = current_trace->flags->opts;
|
|
|
|
|
2008-11-18 02:23:42 +08:00
|
|
|
/*
|
|
|
|
* Increase the size with names of options specific
|
|
|
|
* of the current tracer.
|
|
|
|
*/
|
|
|
|
for (i = 0; trace_opts[i].name; i++) {
|
|
|
|
len += strlen(trace_opts[i].name);
|
2009-02-27 13:22:21 +08:00
|
|
|
len += 3; /* "no" and newline */
|
2008-11-18 02:23:42 +08:00
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
/* +2 for \n and \0 */
|
|
|
|
buf = kmalloc(len + 2, GFP_KERNEL);
|
2009-02-27 12:55:58 +08:00
|
|
|
if (!buf) {
|
|
|
|
mutex_unlock(&trace_types_lock);
|
2008-05-13 03:20:42 +08:00
|
|
|
return -ENOMEM;
|
2009-02-27 12:55:58 +08:00
|
|
|
}
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
for (i = 0; trace_options[i]; i++) {
|
|
|
|
if (trace_flags & (1 << i))
|
2009-02-27 13:22:21 +08:00
|
|
|
r += sprintf(buf + r, "%s\n", trace_options[i]);
|
2008-05-13 03:20:42 +08:00
|
|
|
else
|
2009-02-27 13:22:21 +08:00
|
|
|
r += sprintf(buf + r, "no%s\n", trace_options[i]);
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-11-18 02:23:42 +08:00
|
|
|
for (i = 0; trace_opts[i].name; i++) {
|
|
|
|
if (tracer_flags & trace_opts[i].bit)
|
2009-02-27 13:22:21 +08:00
|
|
|
r += sprintf(buf + r, "%s\n",
|
2008-11-18 02:23:42 +08:00
|
|
|
trace_opts[i].name);
|
|
|
|
else
|
2009-02-27 13:22:21 +08:00
|
|
|
r += sprintf(buf + r, "no%s\n",
|
2008-11-18 02:23:42 +08:00
|
|
|
trace_opts[i].name);
|
|
|
|
}
|
2009-02-27 12:55:58 +08:00
|
|
|
mutex_unlock(&trace_types_lock);
|
2008-11-18 02:23:42 +08:00
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
WARN_ON(r >= len + 2);
|
|
|
|
|
2008-05-13 03:20:52 +08:00
|
|
|
r = simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
kfree(buf);
|
|
|
|
return r;
|
|
|
|
}
|
|
|
|
|
2008-11-18 02:23:42 +08:00
|
|
|
/* Try to assign a tracer specific option */
|
|
|
|
static int set_tracer_option(struct tracer *trace, char *cmp, int neg)
|
|
|
|
{
|
|
|
|
struct tracer_flags *trace_flags = trace->flags;
|
|
|
|
struct tracer_opt *opts = NULL;
|
|
|
|
int ret = 0, i = 0;
|
|
|
|
int len;
|
|
|
|
|
|
|
|
for (i = 0; trace_flags->opts[i].name; i++) {
|
|
|
|
opts = &trace_flags->opts[i];
|
|
|
|
len = strlen(opts->name);
|
|
|
|
|
|
|
|
if (strncmp(cmp, opts->name, len) == 0) {
|
|
|
|
ret = trace->set_flag(trace_flags->val,
|
|
|
|
opts->bit, !neg);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/* Not found */
|
|
|
|
if (!trace_flags->opts[i].name)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
/* Refused to handle */
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
|
|
|
|
if (neg)
|
|
|
|
trace_flags->val &= ~opts->bit;
|
|
|
|
else
|
|
|
|
trace_flags->val |= opts->bit;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
static ssize_t
|
2008-11-13 06:52:37 +08:00
|
|
|
tracing_trace_options_write(struct file *filp, const char __user *ubuf,
|
2008-05-13 03:20:42 +08:00
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
|
|
|
char buf[64];
|
|
|
|
char *cmp = buf;
|
|
|
|
int neg = 0;
|
2008-11-18 02:23:42 +08:00
|
|
|
int ret;
|
2008-05-13 03:20:42 +08:00
|
|
|
int i;
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
if (cnt >= sizeof(buf))
|
|
|
|
return -EINVAL;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
if (copy_from_user(&buf, ubuf, cnt))
|
|
|
|
return -EFAULT;
|
|
|
|
|
|
|
|
buf[cnt] = 0;
|
|
|
|
|
|
|
|
if (strncmp(buf, "no", 2) == 0) {
|
|
|
|
neg = 1;
|
|
|
|
cmp += 2;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; trace_options[i]; i++) {
|
|
|
|
int len = strlen(trace_options[i]);
|
|
|
|
|
|
|
|
if (strncmp(cmp, trace_options[i], len) == 0) {
|
|
|
|
if (neg)
|
|
|
|
trace_flags &= ~(1 << i);
|
|
|
|
else
|
|
|
|
trace_flags |= (1 << i);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2008-11-18 02:23:42 +08:00
|
|
|
|
|
|
|
/* If no option could be set, test the specific tracer options */
|
|
|
|
if (!trace_options[i]) {
|
2009-02-27 12:55:58 +08:00
|
|
|
mutex_lock(&trace_types_lock);
|
2008-11-18 02:23:42 +08:00
|
|
|
ret = set_tracer_option(current_trace, cmp, neg);
|
2009-02-27 12:55:58 +08:00
|
|
|
mutex_unlock(&trace_types_lock);
|
2008-11-18 02:23:42 +08:00
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
}
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
filp->f_pos += cnt;
|
|
|
|
|
|
|
|
return cnt;
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct file_operations tracing_iter_fops = {
|
2008-05-13 03:20:52 +08:00
|
|
|
.open = tracing_open_generic,
|
2008-11-13 06:52:37 +08:00
|
|
|
.read = tracing_trace_options_read,
|
|
|
|
.write = tracing_trace_options_write,
|
2008-05-13 03:20:42 +08:00
|
|
|
};
|
|
|
|
|
2008-05-13 03:20:45 +08:00
|
|
|
/*
 * Text of the tracing mini-HOWTO, returned as-is by tracing_readme_read().
 * Lines starting with "# " are shell commands; the other lines are sample
 * output of the preceding command.
 */
static const char readme_msg[] =
	"tracing mini-HOWTO:\n\n"
	"# mkdir /debug\n"
	"# mount -t debugfs nodev /debug\n\n"
	"# cat /debug/tracing/available_tracers\n"
	"wakeup preemptirqsoff preemptoff irqsoff ftrace sched_switch none\n\n"
	"# cat /debug/tracing/current_tracer\n"
	"none\n"
	"# echo sched_switch > /debug/tracing/current_tracer\n"
	"# cat /debug/tracing/current_tracer\n"
	"sched_switch\n"
	"# cat /debug/tracing/trace_options\n"
	"noprint-parent nosym-offset nosym-addr noverbose\n"
	"# echo print-parent > /debug/tracing/trace_options\n"
	"# echo 1 > /debug/tracing/tracing_enabled\n"
	"# cat /debug/tracing/trace > /tmp/trace.txt\n"
	"# echo 0 > /debug/tracing/tracing_enabled\n"
;
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
tracing_readme_read(struct file *filp, char __user *ubuf,
|
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
|
|
|
return simple_read_from_buffer(ubuf, cnt, ppos,
|
|
|
|
readme_msg, strlen(readme_msg));
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct file_operations tracing_readme_fops = {
|
2008-05-13 03:20:52 +08:00
|
|
|
.open = tracing_open_generic,
|
|
|
|
.read = tracing_readme_read,
|
2008-05-13 03:20:45 +08:00
|
|
|
};
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
static ssize_t
|
|
|
|
tracing_ctrl_read(struct file *filp, char __user *ubuf,
|
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
|
|
|
char buf[64];
|
|
|
|
int r;
|
|
|
|
|
ftrace: restructure tracing start/stop infrastructure
Impact: change where tracing is started up and stopped
Currently, when a new tracer is selected via echo'ing a tracer name into
the current_tracer file, the startup is only done if tracing_enabled is
set to one. If tracing_enabled is changed to zero (by echo'ing 0 into
the tracing_enabled file) a full shutdown is performed.
The full startup and shutdown of a tracer can be expensive and the
user can lose out traces when echo'ing in 0 to the tracing_enabled file,
because the process takes too long. There can also be places that
the user would like to start and stop the tracer several times and
doing the full startup and shutdown of a tracer might be too expensive.
This patch performs the full startup and shutdown when a tracer is
selected. It also adds a way to do a quick start or stop of a tracer.
The quick version is just a flag that prevents the tracing from
taking place, but the overhead of the code is still there.
For example, the startup of a tracer may enable tracepoints, or enable
the function tracer. The stop and start will just set a flag to
have the tracer ignore the calls when the tracepoint or function trace
is called. The overhead of the tracer may still be present when
the tracer is stopped, but no tracing will occur. Setting the tracer
to the 'nop' tracer (or any other tracer) will perform the shutdown
of the tracer which will disable the tracepoint or disable the
function tracer.
The tracing_enabled file will simply start or stop tracing.
This change is all internal. The end result for the user should be the same
as before. If tracing_enabled is not set, no trace will happen.
If tracing_enabled is set, then the trace will happen. The tracing_enabled
variable is static between tracers. Enabling tracing_enabled and
going to another tracer will keep tracing_enabled enabled. Same
is true with disabling tracing_enabled.
This patch will now provide a fast start/stop method to the users
for enabling or disabling tracing.
Note: There were two methods to the struct tracer that were never
used: The methods start and stop. These were to be used as a hook
to the reading of the trace output, but ended up not being
necessary. These two methods are now used to enable the start
and stop of each tracer, in case the tracer needs to do more than
just not write into the buffer. For example, the irqsoff tracer
must stop recording max latencies when tracing is stopped.
Signed-off-by: Steven Rostedt <srostedt@redhat.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-11-06 05:05:44 +08:00
|
|
|
r = sprintf(buf, "%u\n", tracer_enabled);
|
2008-05-13 03:20:45 +08:00
|
|
|
return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
tracing_ctrl_write(struct file *filp, const char __user *ubuf,
|
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
|
|
|
struct trace_array *tr = filp->private_data;
|
|
|
|
char buf[64];
|
2009-02-11 02:44:34 +08:00
|
|
|
unsigned long val;
|
2008-05-13 03:21:00 +08:00
|
|
|
int ret;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
if (cnt >= sizeof(buf))
|
|
|
|
return -EINVAL;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
if (copy_from_user(&buf, ubuf, cnt))
|
|
|
|
return -EFAULT;
|
|
|
|
|
|
|
|
buf[cnt] = 0;
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
ret = strict_strtoul(buf, 10, &val);
|
|
|
|
if (ret < 0)
|
|
|
|
return ret;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
val = !!val;
|
|
|
|
|
|
|
|
mutex_lock(&trace_types_lock);
|
ftrace: restructure tracing start/stop infrastructure
Impact: change where tracing is started up and stopped
Currently, when a new tracer is selected via echo'ing a tracer name into
the current_tracer file, the startup is only done if tracing_enabled is
set to one. If tracing_enabled is changed to zero (by echo'ing 0 into
the tracing_enabled file) a full shutdown is performed.
The full startup and shutdown of a tracer can be expensive and the
user can lose out traces when echo'ing in 0 to the tracing_enabled file,
because the process takes too long. There can also be places that
the user would like to start and stop the tracer several times and
doing the full startup and shutdown of a tracer might be too expensive.
This patch performs the full startup and shutdown when a tracer is
selected. It also adds a way to do a quick start or stop of a tracer.
The quick version is just a flag that prevents the tracing from
taking place, but the overhead of the code is still there.
For example, the startup of a tracer may enable tracepoints, or enable
the function tracer. The stop and start will just set a flag to
have the tracer ignore the calls when the tracepoint or function trace
is called. The overhead of the tracer may still be present when
the tracer is stopped, but no tracing will occur. Setting the tracer
to the 'nop' tracer (or any other tracer) will perform the shutdown
of the tracer which will disable the tracepoint or disable the
function tracer.
The tracing_enabled file will simply start or stop tracing.
This change is all internal. The end result for the user should be the same
as before. If tracing_enabled is not set, no trace will happen.
If tracing_enabled is set, then the trace will happen. The tracing_enabled
variable is static between tracers. Enabling tracing_enabled and
going to another tracer will keep tracing_enabled enabled. Same
is true with disabling tracing_enabled.
This patch will now provide a fast start/stop method to the users
for enabling or disabling tracing.
Note: There were two methods to the struct tracer that were never
used: The methods start and stop. These were to be used as a hook
to the reading of the trace output, but ended up not being
necessary. These two methods are now used to enable the start
and stop of each tracer, in case the tracer needs to do more than
just not write into the buffer. For example, the irqsoff tracer
must stop recording max latencies when tracing is stopped.
Signed-off-by: Steven Rostedt <srostedt@redhat.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-11-06 05:05:44 +08:00
|
|
|
if (tracer_enabled ^ val) {
|
|
|
|
if (val) {
|
2008-05-13 03:20:42 +08:00
|
|
|
tracer_enabled = 1;
|
ftrace: restructure tracing start/stop infrastructure
Impact: change where tracing is started up and stopped
Currently, when a new tracer is selected via echo'ing a tracer name into
the current_tracer file, the startup is only done if tracing_enabled is
set to one. If tracing_enabled is changed to zero (by echo'ing 0 into
the tracing_enabled file) a full shutdown is performed.
The full startup and shutdown of a tracer can be expensive and the
user can lose out traces when echo'ing in 0 to the tracing_enabled file,
because the process takes too long. There can also be places that
the user would like to start and stop the tracer several times and
doing the full startup and shutdown of a tracer might be too expensive.
This patch performs the full startup and shutdown when a tracer is
selected. It also adds a way to do a quick start or stop of a tracer.
The quick version is just a flag that prevents the tracing from
taking place, but the overhead of the code is still there.
For example, the startup of a tracer may enable tracepoints, or enable
the function tracer. The stop and start will just set a flag to
have the tracer ignore the calls when the tracepoint or function trace
is called. The overhead of the tracer may still be present when
the tracer is stopped, but no tracing will occur. Setting the tracer
to the 'nop' tracer (or any other tracer) will perform the shutdown
of the tracer which will disable the tracepoint or disable the
function tracer.
The tracing_enabled file will simply start or stop tracing.
This change is all internal. The end result for the user should be the same
as before. If tracing_enabled is not set, no trace will happen.
If tracing_enabled is set, then the trace will happen. The tracing_enabled
variable is static between tracers. Enabling tracing_enabled and
going to another tracer will keep tracing_enabled enabled. Same
is true with disabling tracing_enabled.
This patch will now provide a fast start/stop method to the users
for enabling or disabling tracing.
Note: There were two methods to the struct tracer that were never
used: The methods start and stop. These were to be used as a hook
to the reading of the trace output, but ended up not being
necessary. These two methods are now used to enable the start
and stop of each tracer, in case the tracer needs to do more than
just not write into the buffer. For example, the irqsoff tracer
must stop recording max latencies when tracing is stopped.
Signed-off-by: Steven Rostedt <srostedt@redhat.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-11-06 05:05:44 +08:00
|
|
|
if (current_trace->start)
|
|
|
|
current_trace->start(tr);
|
|
|
|
tracing_start();
|
|
|
|
} else {
|
2008-05-13 03:20:42 +08:00
|
|
|
tracer_enabled = 0;
|
ftrace: restructure tracing start/stop infrastructure
Impact: change where tracing is started up and stopped
Currently, when a new tracer is selected via echo'ing a tracer name into
the current_tracer file, the startup is only done if tracing_enabled is
set to one. If tracing_enabled is changed to zero (by echo'ing 0 into
the tracing_enabled file) a full shutdown is performed.
The full startup and shutdown of a tracer can be expensive and the
user can lose out traces when echo'ing in 0 to the tracing_enabled file,
because the process takes too long. There can also be places that
the user would like to start and stop the tracer several times and
doing the full startup and shutdown of a tracer might be too expensive.
This patch performs the full startup and shutdown when a tracer is
selected. It also adds a way to do a quick start or stop of a tracer.
The quick version is just a flag that prevents the tracing from
taking place, but the overhead of the code is still there.
For example, the startup of a tracer may enable tracepoints, or enable
the function tracer. The stop and start will just set a flag to
have the tracer ignore the calls when the tracepoint or function trace
is called. The overhead of the tracer may still be present when
the tracer is stopped, but no tracing will occur. Setting the tracer
to the 'nop' tracer (or any other tracer) will perform the shutdown
of the tracer which will disable the tracepoint or disable the
function tracer.
The tracing_enabled file will simply start or stop tracing.
This change is all internal. The end result for the user should be the same
as before. If tracing_enabled is not set, no trace will happen.
If tracing_enabled is set, then the trace will happen. The tracing_enabled
variable is static between tracers. Enabling tracing_enabled and
going to another tracer will keep tracing_enabled enabled. Same
is true with disabling tracing_enabled.
This patch will now provide a fast start/stop method to the users
for enabling or disabling tracing.
Note: There were two methods to the struct tracer that were never
used: The methods start and stop. These were to be used as a hook
to the reading of the trace output, but ended up not being
necessary. These two methods are now used to enable the start
and stop of each tracer, in case the tracer needs to do more than
just not write into the buffer. For example, the irqsoff tracer
must stop recording max latencies when tracing is stopped.
Signed-off-by: Steven Rostedt <srostedt@redhat.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-11-06 05:05:44 +08:00
|
|
|
tracing_stop();
|
|
|
|
if (current_trace->stop)
|
|
|
|
current_trace->stop(tr);
|
|
|
|
}
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
|
|
|
|
filp->f_pos += cnt;
|
|
|
|
|
|
|
|
return cnt;
|
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
tracing_set_trace_read(struct file *filp, char __user *ubuf,
|
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
|
|
|
char buf[max_tracer_type_len+2];
|
|
|
|
int r;
|
|
|
|
|
|
|
|
mutex_lock(&trace_types_lock);
|
|
|
|
if (current_trace)
|
|
|
|
r = sprintf(buf, "%s\n", current_trace->name);
|
|
|
|
else
|
|
|
|
r = sprintf(buf, "\n");
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
|
2008-05-13 03:20:46 +08:00
|
|
|
return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2009-02-06 04:02:00 +08:00
|
|
|
int tracer_init(struct tracer *t, struct trace_array *tr)
|
|
|
|
{
|
|
|
|
tracing_reset_online_cpus(tr);
|
|
|
|
return t->init(tr);
|
|
|
|
}
|
|
|
|
|
2009-02-27 12:43:05 +08:00
|
|
|
struct trace_option_dentry;
|
|
|
|
|
|
|
|
static struct trace_option_dentry *
|
|
|
|
create_trace_option_files(struct tracer *tracer);
|
|
|
|
|
|
|
|
static void
|
|
|
|
destroy_trace_option_files(struct trace_option_dentry *topts);
|
|
|
|
|
2009-02-03 10:38:32 +08:00
|
|
|
static int tracing_set_tracer(const char *buf)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
2009-02-27 12:43:05 +08:00
|
|
|
static struct trace_option_dentry *topts;
|
2008-05-13 03:20:42 +08:00
|
|
|
struct trace_array *tr = &global_trace;
|
|
|
|
struct tracer *t;
|
2008-11-02 02:57:37 +08:00
|
|
|
int ret = 0;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
mutex_lock(&trace_types_lock);
|
|
|
|
for (t = trace_types; t; t = t->next) {
|
|
|
|
if (strcmp(t->name, buf) == 0)
|
|
|
|
break;
|
|
|
|
}
|
2008-10-05 04:04:44 +08:00
|
|
|
if (!t) {
|
|
|
|
ret = -EINVAL;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
if (t == current_trace)
|
2008-05-13 03:20:42 +08:00
|
|
|
goto out;
|
|
|
|
|
2008-11-13 04:24:24 +08:00
|
|
|
trace_branch_disable();
|
2008-05-13 03:20:42 +08:00
|
|
|
if (current_trace && current_trace->reset)
|
|
|
|
current_trace->reset(tr);
|
|
|
|
|
2009-02-27 12:43:05 +08:00
|
|
|
destroy_trace_option_files(topts);
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
current_trace = t;
|
2009-02-27 12:43:05 +08:00
|
|
|
|
|
|
|
topts = create_trace_option_files(current_trace);
|
|
|
|
|
2008-11-16 12:57:26 +08:00
|
|
|
if (t->init) {
|
2009-02-06 04:02:00 +08:00
|
|
|
ret = tracer_init(t, tr);
|
2008-11-16 12:57:26 +08:00
|
|
|
if (ret)
|
|
|
|
goto out;
|
|
|
|
}
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-11-13 04:24:24 +08:00
|
|
|
trace_branch_enable(tr);
|
2008-05-13 03:20:42 +08:00
|
|
|
out:
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
|
2008-11-02 02:57:37 +08:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
tracing_set_trace_write(struct file *filp, const char __user *ubuf,
|
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
|
|
|
char buf[max_tracer_type_len+1];
|
|
|
|
int i;
|
|
|
|
size_t ret;
|
2008-11-16 12:53:19 +08:00
|
|
|
int err;
|
|
|
|
|
|
|
|
ret = cnt;
|
2008-11-02 02:57:37 +08:00
|
|
|
|
|
|
|
if (cnt > max_tracer_type_len)
|
|
|
|
cnt = max_tracer_type_len;
|
|
|
|
|
|
|
|
if (copy_from_user(&buf, ubuf, cnt))
|
|
|
|
return -EFAULT;
|
|
|
|
|
|
|
|
buf[cnt] = 0;
|
|
|
|
|
|
|
|
/* strip ending whitespace. */
|
|
|
|
for (i = cnt - 1; i > 0 && isspace(buf[i]); i--)
|
|
|
|
buf[i] = 0;
|
|
|
|
|
2008-11-16 12:53:19 +08:00
|
|
|
err = tracing_set_tracer(buf);
|
|
|
|
if (err)
|
|
|
|
return err;
|
2008-11-02 02:57:37 +08:00
|
|
|
|
2008-11-16 12:53:19 +08:00
|
|
|
filp->f_pos += ret;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-10-05 04:04:44 +08:00
|
|
|
return ret;
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
tracing_max_lat_read(struct file *filp, char __user *ubuf,
|
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
|
|
|
unsigned long *ptr = filp->private_data;
|
|
|
|
char buf[64];
|
|
|
|
int r;
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
r = snprintf(buf, sizeof(buf), "%ld\n",
|
2008-05-13 03:20:42 +08:00
|
|
|
*ptr == (unsigned long)-1 ? -1 : nsecs_to_usecs(*ptr));
|
2008-05-13 03:21:00 +08:00
|
|
|
if (r > sizeof(buf))
|
|
|
|
r = sizeof(buf);
|
2008-05-13 03:20:46 +08:00
|
|
|
return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
tracing_max_lat_write(struct file *filp, const char __user *ubuf,
|
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
2009-02-11 02:44:34 +08:00
|
|
|
unsigned long *ptr = filp->private_data;
|
2008-05-13 03:20:42 +08:00
|
|
|
char buf[64];
|
2009-02-11 02:44:34 +08:00
|
|
|
unsigned long val;
|
2008-05-13 03:21:00 +08:00
|
|
|
int ret;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
if (cnt >= sizeof(buf))
|
|
|
|
return -EINVAL;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
if (copy_from_user(&buf, ubuf, cnt))
|
|
|
|
return -EFAULT;
|
|
|
|
|
|
|
|
buf[cnt] = 0;
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
ret = strict_strtoul(buf, 10, &val);
|
|
|
|
if (ret < 0)
|
|
|
|
return ret;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
*ptr = val * 1000;
|
|
|
|
|
|
|
|
return cnt;
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:46 +08:00
|
|
|
static int tracing_open_pipe(struct inode *inode, struct file *filp)
|
|
|
|
{
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
long cpu_file = (long) inode->i_private;
|
2008-05-13 03:20:46 +08:00
|
|
|
struct trace_iterator *iter;
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
int ret = 0;
|
2008-05-13 03:20:46 +08:00
|
|
|
|
|
|
|
if (tracing_disabled)
|
|
|
|
return -ENODEV;
|
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
mutex_lock(&trace_types_lock);
|
|
|
|
|
|
|
|
/* We only allow one reader per cpu */
|
|
|
|
if (cpu_file == TRACE_PIPE_ALL_CPU) {
|
|
|
|
if (!cpumask_empty(tracing_reader_cpumask)) {
|
|
|
|
ret = -EBUSY;
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
cpumask_setall(tracing_reader_cpumask);
|
|
|
|
} else {
|
|
|
|
if (!cpumask_test_cpu(cpu_file, tracing_reader_cpumask))
|
|
|
|
cpumask_set_cpu(cpu_file, tracing_reader_cpumask);
|
|
|
|
else {
|
|
|
|
ret = -EBUSY;
|
|
|
|
goto out;
|
|
|
|
}
|
2008-05-13 03:20:46 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* create a buffer to store the information to pass to userspace */
|
|
|
|
iter = kzalloc(sizeof(*iter), GFP_KERNEL);
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
if (!iter) {
|
|
|
|
ret = -ENOMEM;
|
|
|
|
goto out;
|
|
|
|
}
|
2008-05-13 03:20:46 +08:00
|
|
|
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
/*
|
|
|
|
* We make a copy of the current tracer to avoid concurrent
|
|
|
|
* changes on it while we are reading.
|
|
|
|
*/
|
|
|
|
iter->trace = kmalloc(sizeof(*iter->trace), GFP_KERNEL);
|
|
|
|
if (!iter->trace) {
|
|
|
|
ret = -ENOMEM;
|
|
|
|
goto fail;
|
|
|
|
}
|
|
|
|
if (current_trace)
|
|
|
|
*iter->trace = *current_trace;
|
|
|
|
|
2009-01-01 07:42:23 +08:00
|
|
|
if (!alloc_cpumask_var(&iter->started, GFP_KERNEL)) {
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
ret = -ENOMEM;
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
goto fail;
|
2009-01-01 07:42:23 +08:00
|
|
|
}
|
|
|
|
|
2008-11-08 11:36:02 +08:00
|
|
|
/* trace pipe does not show start of buffer */
|
2009-01-01 07:42:23 +08:00
|
|
|
cpumask_setall(iter->started);
|
2008-11-08 11:36:02 +08:00
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
iter->cpu_file = cpu_file;
|
2008-05-13 03:20:46 +08:00
|
|
|
iter->tr = &global_trace;
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
mutex_init(&iter->mutex);
|
2008-05-13 03:20:46 +08:00
|
|
|
filp->private_data = iter;
|
|
|
|
|
2008-05-13 03:21:01 +08:00
|
|
|
if (iter->trace->pipe_open)
|
|
|
|
iter->trace->pipe_open(iter);
|
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
out:
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
return ret;
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
|
|
|
|
fail:
|
|
|
|
kfree(iter->trace);
|
|
|
|
kfree(iter);
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
return ret;
|
2008-05-13 03:20:46 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static int tracing_release_pipe(struct inode *inode, struct file *file)
|
|
|
|
{
|
|
|
|
struct trace_iterator *iter = file->private_data;
|
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
mutex_lock(&trace_types_lock);
|
|
|
|
|
|
|
|
if (iter->cpu_file == TRACE_PIPE_ALL_CPU)
|
|
|
|
cpumask_clear(tracing_reader_cpumask);
|
|
|
|
else
|
|
|
|
cpumask_clear_cpu(iter->cpu_file, tracing_reader_cpumask);
|
|
|
|
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
|
2009-01-01 07:42:23 +08:00
|
|
|
free_cpumask_var(iter->started);
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
mutex_destroy(&iter->mutex);
|
|
|
|
kfree(iter->trace);
|
2008-05-13 03:20:46 +08:00
|
|
|
kfree(iter);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:49 +08:00
|
|
|
static unsigned int
|
|
|
|
tracing_poll_pipe(struct file *filp, poll_table *poll_table)
|
|
|
|
{
|
|
|
|
struct trace_iterator *iter = filp->private_data;
|
|
|
|
|
|
|
|
if (trace_flags & TRACE_ITER_BLOCK) {
|
|
|
|
/*
|
|
|
|
* Always select as readable when in blocking mode
|
|
|
|
*/
|
|
|
|
return POLLIN | POLLRDNORM;
|
2008-05-13 03:21:00 +08:00
|
|
|
} else {
|
2008-05-13 03:20:49 +08:00
|
|
|
if (!trace_empty(iter))
|
|
|
|
return POLLIN | POLLRDNORM;
|
|
|
|
poll_wait(filp, &trace_wait, poll_table);
|
|
|
|
if (!trace_empty(iter))
|
|
|
|
return POLLIN | POLLRDNORM;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2009-02-11 09:25:00 +08:00
|
|
|
|
|
|
|
void default_wait_pipe(struct trace_iterator *iter)
|
|
|
|
{
|
|
|
|
DEFINE_WAIT(wait);
|
|
|
|
|
|
|
|
prepare_to_wait(&trace_wait, &wait, TASK_INTERRUPTIBLE);
|
|
|
|
|
|
|
|
if (trace_empty(iter))
|
|
|
|
schedule();
|
|
|
|
|
|
|
|
finish_wait(&trace_wait, &wait);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This is a make-shift waitqueue.
|
|
|
|
* A tracer might use this callback on some rare cases:
|
|
|
|
*
|
|
|
|
* 1) the current tracer might hold the runqueue lock when it wakes up
|
|
|
|
* a reader, hence a deadlock (sched, function, and function graph tracers)
|
|
|
|
* 2) the function tracers, trace all functions, we don't want
|
|
|
|
* the overhead of calling wake_up and friends
|
|
|
|
* (and tracing them too)
|
|
|
|
*
|
|
|
|
* Anyway, this is really very primitive wakeup.
|
|
|
|
*/
|
|
|
|
void poll_wait_pipe(struct trace_iterator *iter)
|
|
|
|
{
|
|
|
|
set_current_state(TASK_INTERRUPTIBLE);
|
|
|
|
/* sleep for 100 msecs, and try again. */
|
|
|
|
schedule_timeout(HZ / 10);
|
|
|
|
}
|
|
|
|
|
2009-02-09 14:15:55 +08:00
|
|
|
/* Must be called with trace_types_lock mutex held. */
|
|
|
|
static int tracing_wait_pipe(struct file *filp)
|
2008-05-13 03:20:46 +08:00
|
|
|
{
|
|
|
|
struct trace_iterator *iter = filp->private_data;
|
|
|
|
|
|
|
|
while (trace_empty(iter)) {
|
2008-05-13 03:20:58 +08:00
|
|
|
|
2008-05-13 03:21:01 +08:00
|
|
|
if ((filp->f_flags & O_NONBLOCK)) {
|
2009-02-09 14:15:55 +08:00
|
|
|
return -EAGAIN;
|
2008-05-13 03:21:01 +08:00
|
|
|
}
|
2008-05-13 03:20:58 +08:00
|
|
|
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
mutex_unlock(&iter->mutex);
|
2008-05-13 03:21:01 +08:00
|
|
|
|
2009-02-11 09:25:00 +08:00
|
|
|
iter->trace->wait_pipe(iter);
|
2008-05-13 03:20:46 +08:00
|
|
|
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
mutex_lock(&iter->mutex);
|
2008-05-13 03:21:01 +08:00
|
|
|
|
2009-02-11 09:25:00 +08:00
|
|
|
if (signal_pending(current))
|
2009-02-09 14:15:55 +08:00
|
|
|
return -EINTR;
|
2008-05-13 03:20:46 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* We block until we read something and tracing is disabled.
|
|
|
|
* We still block if tracing is disabled, but we have never
|
|
|
|
* read anything. This allows a user to cat this file, and
|
|
|
|
* then enable tracing. But after we have read something,
|
|
|
|
* we give an EOF when tracing is again disabled.
|
|
|
|
*
|
|
|
|
* iter->pos will be 0 if we haven't read anything.
|
|
|
|
*/
|
|
|
|
if (!tracer_enabled && iter->pos)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2009-02-09 14:15:55 +08:00
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Consumer reader.
|
|
|
|
*/
|
|
|
|
static ssize_t
|
|
|
|
tracing_read_pipe(struct file *filp, char __user *ubuf,
|
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
|
|
|
struct trace_iterator *iter = filp->private_data;
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
static struct tracer *old_tracer;
|
2009-02-09 14:15:55 +08:00
|
|
|
ssize_t sret;
|
|
|
|
|
|
|
|
/* return any leftover data */
|
|
|
|
sret = trace_seq_to_user(&iter->seq, ubuf, cnt);
|
|
|
|
if (sret != -EBUSY)
|
|
|
|
return sret;
|
|
|
|
|
2009-03-03 03:04:40 +08:00
|
|
|
trace_seq_init(&iter->seq);
|
2009-02-09 14:15:55 +08:00
|
|
|
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
/* copy the tracer to avoid using a global lock all around */
|
2009-02-09 14:15:55 +08:00
|
|
|
mutex_lock(&trace_types_lock);
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
if (unlikely(old_tracer != current_trace && current_trace)) {
|
|
|
|
old_tracer = current_trace;
|
|
|
|
*iter->trace = *current_trace;
|
|
|
|
}
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Avoid more than one consumer on a single file descriptor
|
|
|
|
* This is just a matter of traces coherency, the ring buffer itself
|
|
|
|
* is protected.
|
|
|
|
*/
|
|
|
|
mutex_lock(&iter->mutex);
|
2009-02-09 14:15:55 +08:00
|
|
|
if (iter->trace->read) {
|
|
|
|
sret = iter->trace->read(iter, filp, ubuf, cnt, ppos);
|
|
|
|
if (sret)
|
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
|
|
|
waitagain:
|
|
|
|
sret = tracing_wait_pipe(filp);
|
|
|
|
if (sret <= 0)
|
|
|
|
goto out;
|
|
|
|
|
2008-05-13 03:20:46 +08:00
|
|
|
/* stop when tracing is finished */
|
2009-02-09 14:15:55 +08:00
|
|
|
if (trace_empty(iter)) {
|
|
|
|
sret = 0;
|
2008-05-13 03:21:01 +08:00
|
|
|
goto out;
|
2009-02-09 14:15:55 +08:00
|
|
|
}
|
2008-05-13 03:20:46 +08:00
|
|
|
|
|
|
|
if (cnt >= PAGE_SIZE)
|
|
|
|
cnt = PAGE_SIZE - 1;
|
|
|
|
|
2008-05-13 03:21:01 +08:00
|
|
|
/* reset all but tr, trace, and overruns */
|
|
|
|
memset(&iter->seq, 0,
|
|
|
|
sizeof(struct trace_iterator) -
|
|
|
|
offsetof(struct trace_iterator, seq));
|
2008-05-13 03:21:01 +08:00
|
|
|
iter->pos = -1;
|
2008-05-13 03:20:46 +08:00
|
|
|
|
2008-05-13 03:20:48 +08:00
|
|
|
while (find_next_entry_inc(iter) != NULL) {
|
2008-09-30 02:18:34 +08:00
|
|
|
enum print_line_t ret;
|
2008-05-13 03:20:48 +08:00
|
|
|
int len = iter->seq.len;
|
|
|
|
|
2008-05-13 03:20:47 +08:00
|
|
|
ret = print_trace_line(iter);
|
2008-09-30 02:18:34 +08:00
|
|
|
if (ret == TRACE_TYPE_PARTIAL_LINE) {
|
2008-05-13 03:20:48 +08:00
|
|
|
/* don't print partial lines */
|
|
|
|
iter->seq.len = len;
|
2008-05-13 03:20:46 +08:00
|
|
|
break;
|
2008-05-13 03:20:48 +08:00
|
|
|
}
|
2009-02-07 01:30:44 +08:00
|
|
|
if (ret != TRACE_TYPE_NO_CONSUME)
|
|
|
|
trace_consume(iter);
|
2008-05-13 03:20:46 +08:00
|
|
|
|
|
|
|
if (iter->seq.len >= cnt)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Now copy what we have to the user */
|
2008-05-13 03:21:02 +08:00
|
|
|
sret = trace_seq_to_user(&iter->seq, ubuf, cnt);
|
|
|
|
if (iter->seq.readpos >= iter->seq.len)
|
2009-03-03 03:04:40 +08:00
|
|
|
trace_seq_init(&iter->seq);
|
2008-09-30 02:23:48 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* If there was nothing to send to user, inspite of consuming trace
|
|
|
|
* entries, go back to wait for more entries.
|
|
|
|
*/
|
2008-05-13 03:21:02 +08:00
|
|
|
if (sret == -EBUSY)
|
2008-09-30 02:23:48 +08:00
|
|
|
goto waitagain;
|
2008-05-13 03:20:46 +08:00
|
|
|
|
2008-05-13 03:21:01 +08:00
|
|
|
out:
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
mutex_unlock(&iter->mutex);
|
2008-05-13 03:21:01 +08:00
|
|
|
|
2008-05-13 03:21:02 +08:00
|
|
|
return sret;
|
2008-05-13 03:20:46 +08:00
|
|
|
}
|
|
|
|
|
2009-02-09 14:15:56 +08:00
|
|
|
static void tracing_pipe_buf_release(struct pipe_inode_info *pipe,
|
|
|
|
struct pipe_buffer *buf)
|
|
|
|
{
|
|
|
|
__free_page(buf->page);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void tracing_spd_release_pipe(struct splice_pipe_desc *spd,
|
|
|
|
unsigned int idx)
|
|
|
|
{
|
|
|
|
__free_page(spd->pages[idx]);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct pipe_buf_operations tracing_pipe_buf_ops = {
|
2009-02-10 01:06:29 +08:00
|
|
|
.can_merge = 0,
|
|
|
|
.map = generic_pipe_buf_map,
|
|
|
|
.unmap = generic_pipe_buf_unmap,
|
|
|
|
.confirm = generic_pipe_buf_confirm,
|
|
|
|
.release = tracing_pipe_buf_release,
|
|
|
|
.steal = generic_pipe_buf_steal,
|
|
|
|
.get = generic_pipe_buf_get,
|
2009-02-09 14:15:56 +08:00
|
|
|
};
|
|
|
|
|
2009-02-10 01:06:29 +08:00
|
|
|
static size_t
|
2009-02-11 09:51:30 +08:00
|
|
|
tracing_fill_pipe_page(size_t rem, struct trace_iterator *iter)
|
2009-02-10 01:06:29 +08:00
|
|
|
{
|
|
|
|
size_t count;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
/* Seq buffer is page-sized, exactly what we need. */
|
|
|
|
for (;;) {
|
|
|
|
count = iter->seq.len;
|
|
|
|
ret = print_trace_line(iter);
|
|
|
|
count = iter->seq.len - count;
|
|
|
|
if (rem < count) {
|
|
|
|
rem = 0;
|
|
|
|
iter->seq.len -= count;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
if (ret == TRACE_TYPE_PARTIAL_LINE) {
|
|
|
|
iter->seq.len -= count;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
trace_consume(iter);
|
|
|
|
rem -= count;
|
|
|
|
if (!find_next_entry_inc(iter)) {
|
|
|
|
rem = 0;
|
|
|
|
iter->ent = NULL;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return rem;
|
|
|
|
}
|
|
|
|
|
2009-02-09 14:15:56 +08:00
|
|
|
static ssize_t tracing_splice_read_pipe(struct file *filp,
|
|
|
|
loff_t *ppos,
|
|
|
|
struct pipe_inode_info *pipe,
|
|
|
|
size_t len,
|
|
|
|
unsigned int flags)
|
|
|
|
{
|
|
|
|
struct page *pages[PIPE_BUFFERS];
|
|
|
|
struct partial_page partial[PIPE_BUFFERS];
|
|
|
|
struct trace_iterator *iter = filp->private_data;
|
|
|
|
struct splice_pipe_desc spd = {
|
2009-02-10 01:06:29 +08:00
|
|
|
.pages = pages,
|
|
|
|
.partial = partial,
|
|
|
|
.nr_pages = 0, /* This gets updated below. */
|
|
|
|
.flags = flags,
|
|
|
|
.ops = &tracing_pipe_buf_ops,
|
|
|
|
.spd_release = tracing_spd_release_pipe,
|
2009-02-09 14:15:56 +08:00
|
|
|
};
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
static struct tracer *old_tracer;
|
2009-02-09 14:15:56 +08:00
|
|
|
ssize_t ret;
|
2009-02-10 01:06:29 +08:00
|
|
|
size_t rem;
|
2009-02-09 14:15:56 +08:00
|
|
|
unsigned int i;
|
|
|
|
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
/* copy the tracer to avoid using a global lock all around */
|
2009-02-09 14:15:56 +08:00
|
|
|
mutex_lock(&trace_types_lock);
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
if (unlikely(old_tracer != current_trace && current_trace)) {
|
|
|
|
old_tracer = current_trace;
|
|
|
|
*iter->trace = *current_trace;
|
|
|
|
}
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
|
|
|
|
mutex_lock(&iter->mutex);
|
2009-02-09 14:15:56 +08:00
|
|
|
|
|
|
|
if (iter->trace->splice_read) {
|
|
|
|
ret = iter->trace->splice_read(iter, filp,
|
|
|
|
ppos, pipe, len, flags);
|
|
|
|
if (ret)
|
2009-02-10 01:06:29 +08:00
|
|
|
goto out_err;
|
2009-02-09 14:15:56 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
ret = tracing_wait_pipe(filp);
|
|
|
|
if (ret <= 0)
|
2009-02-10 01:06:29 +08:00
|
|
|
goto out_err;
|
2009-02-09 14:15:56 +08:00
|
|
|
|
|
|
|
if (!iter->ent && !find_next_entry_inc(iter)) {
|
|
|
|
ret = -EFAULT;
|
2009-02-10 01:06:29 +08:00
|
|
|
goto out_err;
|
2009-02-09 14:15:56 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Fill as many pages as possible. */
|
|
|
|
for (i = 0, rem = len; i < PIPE_BUFFERS && rem; i++) {
|
|
|
|
pages[i] = alloc_page(GFP_KERNEL);
|
2009-02-10 01:06:29 +08:00
|
|
|
if (!pages[i])
|
|
|
|
break;
|
2009-02-09 14:15:56 +08:00
|
|
|
|
2009-02-11 09:51:30 +08:00
|
|
|
rem = tracing_fill_pipe_page(rem, iter);
|
2009-02-09 14:15:56 +08:00
|
|
|
|
|
|
|
/* Copy the data into the page, so we can start over. */
|
|
|
|
ret = trace_seq_to_buffer(&iter->seq,
|
|
|
|
page_address(pages[i]),
|
|
|
|
iter->seq.len);
|
|
|
|
if (ret < 0) {
|
|
|
|
__free_page(pages[i]);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
partial[i].offset = 0;
|
|
|
|
partial[i].len = iter->seq.len;
|
|
|
|
|
2009-03-03 03:04:40 +08:00
|
|
|
trace_seq_init(&iter->seq);
|
2009-02-09 14:15:56 +08:00
|
|
|
}
|
|
|
|
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
mutex_unlock(&iter->mutex);
|
2009-02-09 14:15:56 +08:00
|
|
|
|
|
|
|
spd.nr_pages = i;
|
|
|
|
|
|
|
|
return splice_to_pipe(pipe, &spd);
|
|
|
|
|
2009-02-10 01:06:29 +08:00
|
|
|
out_err:
|
tracing/core: make the read callbacks reentrants
Now that several per-cpu files can be read or spliced at the
same, we want the read/splice callbacks for tracing files to be
reentrants.
Until now, a single global mutex (trace_types_lock) serialized
the access to tracing_read_pipe(), tracing_splice_read_pipe(),
and the seq helpers.
Ie: it means that if a user tries to read trace_pipe0 and
trace_pipe1 at the same time, the access to the function
tracing_read_pipe() is contended and one reader must wait for
the other to finish its read call.
The trace_type_lock mutex is mostly here to serialize the access
to the global current tracer (current_trace), which can be
changed concurrently. Although the iter struct keeps a private
pointer to this tracer, its callbacks can be changed by another
function.
The method used here is to not keep anymore private reference to
the tracer inside the iterator but to make a copy of it inside
the iterator. Then it checks on subsequents read calls if the
tracer has changed. This is not costly because the current
tracer is not expected to be changed often, so we use a branch
prediction for that.
Moreover, we add a private mutex to the iterator (there is one
iterator per file descriptor) to serialize the accesses in case
of multiple consumers per file descriptor (which would be a
silly idea from the user). Note that this is not to protect the
ring buffer, since the ring buffer already serializes the
readers accesses. This is to prevent from traces weirdness in
case of concurrent consumers. But these mutexes can be dropped
anyway, that would not result in any crash. Just tell me what
you think about it.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 13:13:16 +08:00
|
|
|
mutex_unlock(&iter->mutex);
|
2009-02-09 14:15:56 +08:00
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:59 +08:00
|
|
|
static ssize_t
|
|
|
|
tracing_entries_read(struct file *filp, char __user *ubuf,
|
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
|
|
|
struct trace_array *tr = filp->private_data;
|
|
|
|
char buf[64];
|
|
|
|
int r;
|
|
|
|
|
2008-11-13 13:09:35 +08:00
|
|
|
r = sprintf(buf, "%lu\n", tr->entries >> 10);
|
2008-05-13 03:20:59 +08:00
|
|
|
return simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
|
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
tracing_entries_write(struct file *filp, const char __user *ubuf,
|
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
|
|
|
unsigned long val;
|
|
|
|
char buf[64];
|
2008-11-11 10:46:00 +08:00
|
|
|
int ret, cpu;
|
2008-05-13 03:20:59 +08:00
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
if (cnt >= sizeof(buf))
|
|
|
|
return -EINVAL;
|
2008-05-13 03:20:59 +08:00
|
|
|
|
|
|
|
if (copy_from_user(&buf, ubuf, cnt))
|
|
|
|
return -EFAULT;
|
|
|
|
|
|
|
|
buf[cnt] = 0;
|
|
|
|
|
2008-05-13 03:21:00 +08:00
|
|
|
ret = strict_strtoul(buf, 10, &val);
|
|
|
|
if (ret < 0)
|
|
|
|
return ret;
|
2008-05-13 03:20:59 +08:00
|
|
|
|
|
|
|
/* must have at least 1 entry */
|
|
|
|
if (!val)
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
mutex_lock(&trace_types_lock);
|
|
|
|
|
2008-11-08 11:36:02 +08:00
|
|
|
tracing_stop();
|
2008-05-13 03:20:59 +08:00
|
|
|
|
2008-11-11 10:46:00 +08:00
|
|
|
/* disable all cpu buffers */
|
|
|
|
for_each_tracing_cpu(cpu) {
|
|
|
|
if (global_trace.data[cpu])
|
|
|
|
atomic_inc(&global_trace.data[cpu]->disabled);
|
|
|
|
if (max_tr.data[cpu])
|
|
|
|
atomic_inc(&max_tr.data[cpu]->disabled);
|
|
|
|
}
|
|
|
|
|
2008-11-13 13:09:35 +08:00
|
|
|
/* value is in KB */
|
|
|
|
val <<= 10;
|
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
if (val != global_trace.entries) {
|
|
|
|
ret = ring_buffer_resize(global_trace.buffer, val);
|
|
|
|
if (ret < 0) {
|
|
|
|
cnt = ret;
|
2008-05-13 03:21:04 +08:00
|
|
|
goto out;
|
|
|
|
}
|
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
ret = ring_buffer_resize(max_tr.buffer, val);
|
|
|
|
if (ret < 0) {
|
|
|
|
int r;
|
|
|
|
cnt = ret;
|
|
|
|
r = ring_buffer_resize(global_trace.buffer,
|
|
|
|
global_trace.entries);
|
|
|
|
if (r < 0) {
|
|
|
|
/* AARGH! We are left with different
|
|
|
|
* size max buffer!!!! */
|
|
|
|
WARN_ON(1);
|
|
|
|
tracing_disabled = 1;
|
2008-05-13 03:20:59 +08:00
|
|
|
}
|
2008-09-30 11:02:41 +08:00
|
|
|
goto out;
|
2008-05-13 03:20:59 +08:00
|
|
|
}
|
2008-05-13 03:21:04 +08:00
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
global_trace.entries = val;
|
2008-05-13 03:20:59 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
filp->f_pos += cnt;
|
|
|
|
|
2008-05-22 12:22:16 +08:00
|
|
|
/* If check pages failed, return ENOMEM */
|
|
|
|
if (tracing_disabled)
|
|
|
|
cnt = -ENOMEM;
|
2008-05-13 03:20:59 +08:00
|
|
|
out:
|
2008-11-11 10:46:00 +08:00
|
|
|
for_each_tracing_cpu(cpu) {
|
|
|
|
if (global_trace.data[cpu])
|
|
|
|
atomic_dec(&global_trace.data[cpu]->disabled);
|
|
|
|
if (max_tr.data[cpu])
|
|
|
|
atomic_dec(&max_tr.data[cpu]->disabled);
|
|
|
|
}
|
|
|
|
|
2008-11-08 11:36:02 +08:00
|
|
|
tracing_start();
|
2008-05-13 03:20:59 +08:00
|
|
|
max_tr.entries = global_trace.entries;
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
|
|
|
|
return cnt;
|
|
|
|
}
|
|
|
|
|
2008-09-17 03:06:42 +08:00
|
|
|
/*
 * printf-style front end for trace_vprintk(): forwards @fmt and the
 * variable arguments and returns whatever trace_vprintk() returned.
 */
static int mark_printk(const char *fmt, ...)
{
	va_list ap;
	int printed;

	va_start(ap, fmt);
	printed = trace_vprintk(0, -1, fmt, ap);
	va_end(ap);

	return printed;
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
tracing_mark_write(struct file *filp, const char __user *ubuf,
|
|
|
|
size_t cnt, loff_t *fpos)
|
|
|
|
{
|
|
|
|
char *buf;
|
|
|
|
char *end;
|
|
|
|
|
2008-11-08 11:36:02 +08:00
|
|
|
if (tracing_disabled)
|
2008-09-17 03:06:42 +08:00
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
if (cnt > TRACE_BUF_SIZE)
|
|
|
|
cnt = TRACE_BUF_SIZE;
|
|
|
|
|
|
|
|
buf = kmalloc(cnt + 1, GFP_KERNEL);
|
|
|
|
if (buf == NULL)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
|
|
|
if (copy_from_user(buf, ubuf, cnt)) {
|
|
|
|
kfree(buf);
|
|
|
|
return -EFAULT;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Cut from the first nil or newline. */
|
|
|
|
buf[cnt] = '\0';
|
|
|
|
end = strchr(buf, '\n');
|
|
|
|
if (end)
|
|
|
|
*end = '\0';
|
|
|
|
|
|
|
|
cnt = mark_printk("%s\n", buf);
|
|
|
|
kfree(buf);
|
|
|
|
*fpos += cnt;
|
|
|
|
|
|
|
|
return cnt;
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
static struct file_operations tracing_max_lat_fops = {
|
2008-05-13 03:20:46 +08:00
|
|
|
.open = tracing_open_generic,
|
|
|
|
.read = tracing_max_lat_read,
|
|
|
|
.write = tracing_max_lat_write,
|
2008-05-13 03:20:42 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
static struct file_operations tracing_ctrl_fops = {
|
2008-05-13 03:20:46 +08:00
|
|
|
.open = tracing_open_generic,
|
|
|
|
.read = tracing_ctrl_read,
|
|
|
|
.write = tracing_ctrl_write,
|
2008-05-13 03:20:42 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
static struct file_operations set_tracer_fops = {
|
2008-05-13 03:20:46 +08:00
|
|
|
.open = tracing_open_generic,
|
|
|
|
.read = tracing_set_trace_read,
|
|
|
|
.write = tracing_set_trace_write,
|
2008-05-13 03:20:42 +08:00
|
|
|
};
|
|
|
|
|
2008-05-13 03:20:46 +08:00
|
|
|
static struct file_operations tracing_pipe_fops = {
|
2008-05-13 03:20:46 +08:00
|
|
|
.open = tracing_open_pipe,
|
2008-05-13 03:20:49 +08:00
|
|
|
.poll = tracing_poll_pipe,
|
2008-05-13 03:20:46 +08:00
|
|
|
.read = tracing_read_pipe,
|
2009-02-09 14:15:56 +08:00
|
|
|
.splice_read = tracing_splice_read_pipe,
|
2008-05-13 03:20:46 +08:00
|
|
|
.release = tracing_release_pipe,
|
2008-05-13 03:20:46 +08:00
|
|
|
};
|
|
|
|
|
2008-05-13 03:20:59 +08:00
|
|
|
static struct file_operations tracing_entries_fops = {
|
|
|
|
.open = tracing_open_generic,
|
|
|
|
.read = tracing_entries_read,
|
|
|
|
.write = tracing_entries_write,
|
|
|
|
};
|
|
|
|
|
2008-09-17 03:06:42 +08:00
|
|
|
static struct file_operations tracing_mark_fops = {
|
2008-09-22 02:16:30 +08:00
|
|
|
.open = tracing_open_generic,
|
2008-09-17 03:06:42 +08:00
|
|
|
.write = tracing_mark_write,
|
|
|
|
};
|
|
|
|
|
2008-12-02 11:20:19 +08:00
|
|
|
/*
 * Per-open state of a raw per-cpu buffer file; allocated in
 * tracing_buffers_open() and freed in tracing_buffers_release().
 */
struct ftrace_buffer_info {
	/* trace array being read; tracing_buffers_open() sets it to &global_trace */
	struct trace_array *tr;
	/* page obtained from ring_buffer_alloc_read_page(), filled by reads */
	void *spare;
	/* cpu number taken from inode->i_private at open time */
	int cpu;
	/*
	 * offset into @spare already copied to user space; a value of
	 * PAGE_SIZE or more (open uses (unsigned int)-1) forces a fresh
	 * ring buffer read
	 */
	unsigned int read;
};
|
|
|
|
|
|
|
|
static int tracing_buffers_open(struct inode *inode, struct file *filp)
|
|
|
|
{
|
|
|
|
int cpu = (int)(long)inode->i_private;
|
|
|
|
struct ftrace_buffer_info *info;
|
|
|
|
|
|
|
|
if (tracing_disabled)
|
|
|
|
return -ENODEV;
|
|
|
|
|
|
|
|
info = kzalloc(sizeof(*info), GFP_KERNEL);
|
|
|
|
if (!info)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
|
|
|
info->tr = &global_trace;
|
|
|
|
info->cpu = cpu;
|
|
|
|
info->spare = ring_buffer_alloc_read_page(info->tr->buffer);
|
|
|
|
/* Force reading ring buffer for first read */
|
|
|
|
info->read = (unsigned int)-1;
|
|
|
|
if (!info->spare)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
filp->private_data = info;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
out:
|
|
|
|
kfree(info);
|
|
|
|
return -ENOMEM;
|
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
tracing_buffers_read(struct file *filp, char __user *ubuf,
|
|
|
|
size_t count, loff_t *ppos)
|
|
|
|
{
|
|
|
|
struct ftrace_buffer_info *info = filp->private_data;
|
|
|
|
unsigned int pos;
|
|
|
|
ssize_t ret;
|
|
|
|
size_t size;
|
|
|
|
|
|
|
|
/* Do we have previous read data to read? */
|
|
|
|
if (info->read < PAGE_SIZE)
|
|
|
|
goto read;
|
|
|
|
|
|
|
|
info->read = 0;
|
|
|
|
|
|
|
|
ret = ring_buffer_read_page(info->tr->buffer,
|
|
|
|
&info->spare,
|
|
|
|
count,
|
|
|
|
info->cpu, 0);
|
|
|
|
if (ret < 0)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
pos = ring_buffer_page_len(info->spare);
|
|
|
|
|
|
|
|
if (pos < PAGE_SIZE)
|
|
|
|
memset(info->spare + pos, 0, PAGE_SIZE - pos);
|
|
|
|
|
|
|
|
read:
|
|
|
|
size = PAGE_SIZE - info->read;
|
|
|
|
if (size > count)
|
|
|
|
size = count;
|
|
|
|
|
|
|
|
ret = copy_to_user(ubuf, info->spare + info->read, size);
|
|
|
|
if (ret)
|
|
|
|
return -EFAULT;
|
|
|
|
*ppos += size;
|
|
|
|
info->read += size;
|
|
|
|
|
|
|
|
return size;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int tracing_buffers_release(struct inode *inode, struct file *file)
|
|
|
|
{
|
|
|
|
struct ftrace_buffer_info *info = file->private_data;
|
|
|
|
|
|
|
|
ring_buffer_free_read_page(info->tr->buffer, info->spare);
|
|
|
|
kfree(info);
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Reference-counted handle on one ring-buffer read page that has been
 * handed to a pipe by tracing_buffers_splice_read().
 */
struct buffer_ref {
	/* ring buffer the page must be returned to */
	struct ring_buffer	*buffer;
	/* page obtained from ring_buffer_alloc_read_page() */
	void			*page;
	/* reference count; the page is freed when it drops to zero */
	int			ref;
};
|
|
|
|
|
|
|
|
static void buffer_pipe_buf_release(struct pipe_inode_info *pipe,
|
|
|
|
struct pipe_buffer *buf)
|
|
|
|
{
|
|
|
|
struct buffer_ref *ref = (struct buffer_ref *)buf->private;
|
|
|
|
|
|
|
|
if (--ref->ref)
|
|
|
|
return;
|
|
|
|
|
|
|
|
ring_buffer_free_read_page(ref->buffer, ref->page);
|
|
|
|
kfree(ref);
|
|
|
|
buf->private = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * pipe_buf_operations ->steal callback.  Unconditionally returns 1 and
 * touches neither the pipe nor the buffer.
 * NOTE(review): presumably a non-zero return tells the pipe code the page
 * cannot be stolen - confirm against the pipe_buf_operations contract.
 */
static int buffer_pipe_buf_steal(struct pipe_inode_info *pipe,
				 struct pipe_buffer *buf)
{
	return 1;
}
|
|
|
|
|
|
|
|
static void buffer_pipe_buf_get(struct pipe_inode_info *pipe,
|
|
|
|
struct pipe_buffer *buf)
|
|
|
|
{
|
|
|
|
struct buffer_ref *ref = (struct buffer_ref *)buf->private;
|
|
|
|
|
|
|
|
ref->ref++;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Pipe buffer operations for a buffer. */
|
|
|
|
static struct pipe_buf_operations buffer_pipe_buf_ops = {
|
|
|
|
.can_merge = 0,
|
|
|
|
.map = generic_pipe_buf_map,
|
|
|
|
.unmap = generic_pipe_buf_unmap,
|
|
|
|
.confirm = generic_pipe_buf_confirm,
|
|
|
|
.release = buffer_pipe_buf_release,
|
|
|
|
.steal = buffer_pipe_buf_steal,
|
|
|
|
.get = buffer_pipe_buf_get,
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Callback from splice_to_pipe(), if we need to release some pages
|
|
|
|
* at the end of the spd in case we error'ed out in filling the pipe.
|
|
|
|
*/
|
|
|
|
static void buffer_spd_release(struct splice_pipe_desc *spd, unsigned int i)
|
|
|
|
{
|
|
|
|
struct buffer_ref *ref =
|
|
|
|
(struct buffer_ref *)spd->partial[i].private;
|
|
|
|
|
|
|
|
if (--ref->ref)
|
|
|
|
return;
|
|
|
|
|
|
|
|
ring_buffer_free_read_page(ref->buffer, ref->page);
|
|
|
|
kfree(ref);
|
|
|
|
spd->partial[i].private = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
tracing_buffers_splice_read(struct file *file, loff_t *ppos,
|
|
|
|
struct pipe_inode_info *pipe, size_t len,
|
|
|
|
unsigned int flags)
|
|
|
|
{
|
|
|
|
struct ftrace_buffer_info *info = file->private_data;
|
|
|
|
struct partial_page partial[PIPE_BUFFERS];
|
|
|
|
struct page *pages[PIPE_BUFFERS];
|
|
|
|
struct splice_pipe_desc spd = {
|
|
|
|
.pages = pages,
|
|
|
|
.partial = partial,
|
|
|
|
.flags = flags,
|
|
|
|
.ops = &buffer_pipe_buf_ops,
|
|
|
|
.spd_release = buffer_spd_release,
|
|
|
|
};
|
|
|
|
struct buffer_ref *ref;
|
|
|
|
int size, i;
|
|
|
|
size_t ret;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* We can't seek on a buffer input
|
|
|
|
*/
|
|
|
|
if (unlikely(*ppos))
|
|
|
|
return -ESPIPE;
|
|
|
|
|
|
|
|
|
|
|
|
for (i = 0; i < PIPE_BUFFERS && len; i++, len -= size) {
|
|
|
|
struct page *page;
|
|
|
|
int r;
|
|
|
|
|
|
|
|
ref = kzalloc(sizeof(*ref), GFP_KERNEL);
|
|
|
|
if (!ref)
|
|
|
|
break;
|
|
|
|
|
|
|
|
ref->buffer = info->tr->buffer;
|
|
|
|
ref->page = ring_buffer_alloc_read_page(ref->buffer);
|
|
|
|
if (!ref->page) {
|
|
|
|
kfree(ref);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
r = ring_buffer_read_page(ref->buffer, &ref->page,
|
|
|
|
len, info->cpu, 0);
|
|
|
|
if (r < 0) {
|
|
|
|
ring_buffer_free_read_page(ref->buffer,
|
|
|
|
ref->page);
|
|
|
|
kfree(ref);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* zero out any left over data, this is going to
|
|
|
|
* user land.
|
|
|
|
*/
|
|
|
|
size = ring_buffer_page_len(ref->page);
|
|
|
|
if (size < PAGE_SIZE)
|
|
|
|
memset(ref->page + size, 0, PAGE_SIZE - size);
|
|
|
|
|
|
|
|
page = virt_to_page(ref->page);
|
|
|
|
|
|
|
|
spd.pages[i] = page;
|
|
|
|
spd.partial[i].len = PAGE_SIZE;
|
|
|
|
spd.partial[i].offset = 0;
|
|
|
|
spd.partial[i].private = (unsigned long)ref;
|
|
|
|
spd.nr_pages++;
|
|
|
|
}
|
|
|
|
|
|
|
|
spd.nr_pages = i;
|
|
|
|
|
|
|
|
/* did we read anything? */
|
|
|
|
if (!spd.nr_pages) {
|
|
|
|
if (flags & SPLICE_F_NONBLOCK)
|
|
|
|
ret = -EAGAIN;
|
|
|
|
else
|
|
|
|
ret = 0;
|
|
|
|
/* TODO: block */
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
ret = splice_to_pipe(pipe, &spd);
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct file_operations tracing_buffers_fops = {
|
|
|
|
.open = tracing_buffers_open,
|
|
|
|
.read = tracing_buffers_read,
|
|
|
|
.release = tracing_buffers_release,
|
|
|
|
.splice_read = tracing_buffers_splice_read,
|
|
|
|
.llseek = no_llseek,
|
|
|
|
};
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
#ifdef CONFIG_DYNAMIC_FTRACE
|
|
|
|
|
2008-10-31 04:08:33 +08:00
|
|
|
/*
 * Weak default: writes nothing into @buf and reports 0 bytes.  Being
 * __weak, another definition of this symbol may replace it at link time.
 */
int __weak ftrace_arch_read_dyn_info(char *buf, int size)
{
	return 0;
}
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
static ssize_t
|
2008-10-31 04:08:33 +08:00
|
|
|
tracing_read_dyn_info(struct file *filp, char __user *ubuf,
|
2008-05-13 03:20:42 +08:00
|
|
|
size_t cnt, loff_t *ppos)
|
|
|
|
{
|
2008-10-31 12:03:22 +08:00
|
|
|
static char ftrace_dyn_info_buffer[1024];
|
|
|
|
static DEFINE_MUTEX(dyn_info_mutex);
|
2008-05-13 03:20:42 +08:00
|
|
|
unsigned long *p = filp->private_data;
|
2008-10-31 04:08:33 +08:00
|
|
|
char *buf = ftrace_dyn_info_buffer;
|
2008-10-31 12:03:22 +08:00
|
|
|
int size = ARRAY_SIZE(ftrace_dyn_info_buffer);
|
2008-05-13 03:20:42 +08:00
|
|
|
int r;
|
|
|
|
|
2008-10-31 04:08:33 +08:00
|
|
|
mutex_lock(&dyn_info_mutex);
|
|
|
|
r = sprintf(buf, "%ld ", *p);
|
2008-05-13 03:20:46 +08:00
|
|
|
|
2008-10-31 12:03:22 +08:00
|
|
|
r += ftrace_arch_read_dyn_info(buf+r, (size-1)-r);
|
2008-10-31 04:08:33 +08:00
|
|
|
buf[r++] = '\n';
|
|
|
|
|
|
|
|
r = simple_read_from_buffer(ubuf, cnt, ppos, buf, r);
|
|
|
|
|
|
|
|
mutex_unlock(&dyn_info_mutex);
|
|
|
|
|
|
|
|
return r;
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-10-31 04:08:33 +08:00
|
|
|
static struct file_operations tracing_dyn_info_fops = {
|
2008-05-13 03:20:46 +08:00
|
|
|
.open = tracing_open_generic,
|
2008-10-31 04:08:33 +08:00
|
|
|
.read = tracing_read_dyn_info,
|
2008-05-13 03:20:42 +08:00
|
|
|
};
|
|
|
|
#endif
|
|
|
|
|
|
|
|
static struct dentry *d_tracer;
|
|
|
|
|
|
|
|
struct dentry *tracing_init_dentry(void)
|
|
|
|
{
|
|
|
|
static int once;
|
|
|
|
|
|
|
|
if (d_tracer)
|
|
|
|
return d_tracer;
|
|
|
|
|
|
|
|
d_tracer = debugfs_create_dir("tracing", NULL);
|
|
|
|
|
|
|
|
if (!d_tracer && !once) {
|
|
|
|
once = 1;
|
|
|
|
pr_warning("Could not create debugfs directory 'tracing'\n");
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
return d_tracer;
|
|
|
|
}
|
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
information such as preempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are currently mixed up
inside these files. Sometimes it messes up the information,
sometimes it's useful, depending on what the tracer
captures.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
static struct dentry *d_percpu;
|
|
|
|
|
|
|
|
struct dentry *tracing_dentry_percpu(void)
|
|
|
|
{
|
|
|
|
static int once;
|
|
|
|
struct dentry *d_tracer;
|
|
|
|
|
|
|
|
if (d_percpu)
|
|
|
|
return d_percpu;
|
|
|
|
|
|
|
|
d_tracer = tracing_init_dentry();
|
|
|
|
|
|
|
|
if (!d_tracer)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
d_percpu = debugfs_create_dir("per_cpu", d_tracer);
|
|
|
|
|
|
|
|
if (!d_percpu && !once) {
|
|
|
|
once = 1;
|
|
|
|
pr_warning("Could not create debugfs directory 'per_cpu'\n");
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
return d_percpu;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void tracing_init_debugfs_percpu(long cpu)
|
|
|
|
{
|
|
|
|
struct dentry *d_percpu = tracing_dentry_percpu();
|
2009-02-26 07:41:38 +08:00
|
|
|
struct dentry *entry, *d_cpu;
|
|
|
|
/* strlen(cpu) + MAX(log10(cpu)) + '\0' */
|
|
|
|
char cpu_dir[7];
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
|
|
|
|
if (cpu > 999 || cpu < 0)
|
|
|
|
return;
|
|
|
|
|
2009-02-26 07:41:38 +08:00
|
|
|
sprintf(cpu_dir, "cpu%ld", cpu);
|
|
|
|
d_cpu = debugfs_create_dir(cpu_dir, d_percpu);
|
|
|
|
if (!d_cpu) {
|
|
|
|
pr_warning("Could not create debugfs '%s' entry\n", cpu_dir);
|
|
|
|
return;
|
|
|
|
}
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
|
2009-02-26 07:41:38 +08:00
|
|
|
/* per cpu trace_pipe */
|
|
|
|
entry = debugfs_create_file("trace_pipe", 0444, d_cpu,
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
(void *) cpu, &tracing_pipe_fops);
|
|
|
|
if (!entry)
|
2009-02-26 07:41:38 +08:00
|
|
|
pr_warning("Could not create debugfs 'trace_pipe' entry\n");
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
|
|
|
|
/* per cpu trace */
|
2009-02-26 07:41:38 +08:00
|
|
|
entry = debugfs_create_file("trace", 0444, d_cpu,
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
(void *) cpu, &tracing_fops);
|
|
|
|
if (!entry)
|
2009-02-26 07:41:38 +08:00
|
|
|
pr_warning("Could not create debugfs 'trace' entry\n");
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:44 +08:00
|
|
|
#ifdef CONFIG_FTRACE_SELFTEST
|
|
|
|
/* Let selftest have access to static functions in this file */
|
|
|
|
#include "trace_selftest.c"
|
|
|
|
#endif
|
|
|
|
|
2009-02-27 12:43:05 +08:00
|
|
|
/*
 * Binds one tracer option to its debugfs file; used as private data of
 * the file created in create_trace_option_file().
 */
struct trace_option_dentry {
	/* option served by the file (supplies the name and the flag bit) */
	struct tracer_opt	*opt;
	/* flag word in which opt->bit is tested, set and cleared */
	struct tracer_flags	*flags;
	/* debugfs file, removed in destroy_trace_option_files() */
	struct dentry		*entry;
};
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
trace_options_read(struct file *filp, char __user *ubuf, size_t cnt,
|
|
|
|
loff_t *ppos)
|
|
|
|
{
|
|
|
|
struct trace_option_dentry *topt = filp->private_data;
|
|
|
|
char *buf;
|
|
|
|
|
|
|
|
if (topt->flags->val & topt->opt->bit)
|
|
|
|
buf = "1\n";
|
|
|
|
else
|
|
|
|
buf = "0\n";
|
|
|
|
|
|
|
|
return simple_read_from_buffer(ubuf, cnt, ppos, buf, 2);
|
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
trace_options_write(struct file *filp, const char __user *ubuf, size_t cnt,
|
|
|
|
loff_t *ppos)
|
|
|
|
{
|
|
|
|
struct trace_option_dentry *topt = filp->private_data;
|
|
|
|
unsigned long val;
|
|
|
|
char buf[64];
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
if (cnt >= sizeof(buf))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
if (copy_from_user(&buf, ubuf, cnt))
|
|
|
|
return -EFAULT;
|
|
|
|
|
|
|
|
buf[cnt] = 0;
|
|
|
|
|
|
|
|
ret = strict_strtoul(buf, 10, &val);
|
|
|
|
if (ret < 0)
|
|
|
|
return ret;
|
|
|
|
|
|
|
|
ret = 0;
|
|
|
|
switch (val) {
|
|
|
|
case 0:
|
|
|
|
/* do nothing if already cleared */
|
|
|
|
if (!(topt->flags->val & topt->opt->bit))
|
|
|
|
break;
|
|
|
|
|
|
|
|
mutex_lock(&trace_types_lock);
|
|
|
|
if (current_trace->set_flag)
|
|
|
|
ret = current_trace->set_flag(topt->flags->val,
|
|
|
|
topt->opt->bit, 0);
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
topt->flags->val &= ~topt->opt->bit;
|
|
|
|
break;
|
|
|
|
case 1:
|
|
|
|
/* do nothing if already set */
|
|
|
|
if (topt->flags->val & topt->opt->bit)
|
|
|
|
break;
|
|
|
|
|
|
|
|
mutex_lock(&trace_types_lock);
|
|
|
|
if (current_trace->set_flag)
|
|
|
|
ret = current_trace->set_flag(topt->flags->val,
|
|
|
|
topt->opt->bit, 1);
|
|
|
|
mutex_unlock(&trace_types_lock);
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
topt->flags->val |= topt->opt->bit;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
*ppos += cnt;
|
|
|
|
|
|
|
|
return cnt;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static const struct file_operations trace_options_fops = {
|
|
|
|
.open = tracing_open_generic,
|
|
|
|
.read = trace_options_read,
|
|
|
|
.write = trace_options_write,
|
|
|
|
};
|
|
|
|
|
2009-02-27 11:19:12 +08:00
|
|
|
static ssize_t
|
|
|
|
trace_options_core_read(struct file *filp, char __user *ubuf, size_t cnt,
|
|
|
|
loff_t *ppos)
|
|
|
|
{
|
|
|
|
long index = (long)filp->private_data;
|
|
|
|
char *buf;
|
|
|
|
|
|
|
|
if (trace_flags & (1 << index))
|
|
|
|
buf = "1\n";
|
|
|
|
else
|
|
|
|
buf = "0\n";
|
|
|
|
|
|
|
|
return simple_read_from_buffer(ubuf, cnt, ppos, buf, 2);
|
|
|
|
}
|
|
|
|
|
|
|
|
static ssize_t
|
|
|
|
trace_options_core_write(struct file *filp, const char __user *ubuf, size_t cnt,
|
|
|
|
loff_t *ppos)
|
|
|
|
{
|
|
|
|
long index = (long)filp->private_data;
|
|
|
|
char buf[64];
|
|
|
|
unsigned long val;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
if (cnt >= sizeof(buf))
|
|
|
|
return -EINVAL;
|
|
|
|
|
|
|
|
if (copy_from_user(&buf, ubuf, cnt))
|
|
|
|
return -EFAULT;
|
|
|
|
|
|
|
|
buf[cnt] = 0;
|
|
|
|
|
|
|
|
ret = strict_strtoul(buf, 10, &val);
|
|
|
|
if (ret < 0)
|
|
|
|
return ret;
|
|
|
|
|
|
|
|
switch (val) {
|
|
|
|
case 0:
|
|
|
|
trace_flags &= ~(1 << index);
|
|
|
|
break;
|
|
|
|
case 1:
|
|
|
|
trace_flags |= 1 << index;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
*ppos += cnt;
|
|
|
|
|
|
|
|
return cnt;
|
|
|
|
}
|
|
|
|
|
|
|
|
static const struct file_operations trace_options_core_fops = {
|
|
|
|
.open = tracing_open_generic,
|
|
|
|
.read = trace_options_core_read,
|
|
|
|
.write = trace_options_core_write,
|
|
|
|
};
|
|
|
|
|
|
|
|
static struct dentry *trace_options_init_dentry(void)
|
|
|
|
{
|
|
|
|
struct dentry *d_tracer;
|
|
|
|
static struct dentry *t_options;
|
|
|
|
|
|
|
|
if (t_options)
|
|
|
|
return t_options;
|
|
|
|
|
|
|
|
d_tracer = tracing_init_dentry();
|
|
|
|
if (!d_tracer)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
t_options = debugfs_create_dir("options", d_tracer);
|
|
|
|
if (!t_options) {
|
|
|
|
pr_warning("Could not create debugfs directory 'options'\n");
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
return t_options;
|
|
|
|
}
|
|
|
|
|
2009-02-27 12:43:05 +08:00
|
|
|
static void
|
|
|
|
create_trace_option_file(struct trace_option_dentry *topt,
|
|
|
|
struct tracer_flags *flags,
|
|
|
|
struct tracer_opt *opt)
|
|
|
|
{
|
|
|
|
struct dentry *t_options;
|
|
|
|
struct dentry *entry;
|
|
|
|
|
|
|
|
t_options = trace_options_init_dentry();
|
|
|
|
if (!t_options)
|
|
|
|
return;
|
|
|
|
|
|
|
|
topt->flags = flags;
|
|
|
|
topt->opt = opt;
|
|
|
|
|
|
|
|
entry = debugfs_create_file(opt->name, 0644, t_options, topt,
|
|
|
|
&trace_options_fops);
|
|
|
|
|
|
|
|
topt->entry = entry;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct trace_option_dentry *
|
|
|
|
create_trace_option_files(struct tracer *tracer)
|
|
|
|
{
|
|
|
|
struct trace_option_dentry *topts;
|
|
|
|
struct tracer_flags *flags;
|
|
|
|
struct tracer_opt *opts;
|
|
|
|
int cnt;
|
|
|
|
|
|
|
|
if (!tracer)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
flags = tracer->flags;
|
|
|
|
|
|
|
|
if (!flags || !flags->opts)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
opts = flags->opts;
|
|
|
|
|
|
|
|
for (cnt = 0; opts[cnt].name; cnt++)
|
|
|
|
;
|
|
|
|
|
2009-02-27 23:51:10 +08:00
|
|
|
topts = kcalloc(cnt + 1, sizeof(*topts), GFP_KERNEL);
|
2009-02-27 12:43:05 +08:00
|
|
|
if (!topts)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
for (cnt = 0; opts[cnt].name; cnt++)
|
|
|
|
create_trace_option_file(&topts[cnt], flags,
|
|
|
|
&opts[cnt]);
|
|
|
|
|
|
|
|
return topts;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
destroy_trace_option_files(struct trace_option_dentry *topts)
|
|
|
|
{
|
|
|
|
int cnt;
|
|
|
|
|
|
|
|
if (!topts)
|
|
|
|
return;
|
|
|
|
|
|
|
|
for (cnt = 0; topts[cnt].opt; cnt++) {
|
|
|
|
if (topts[cnt].entry)
|
|
|
|
debugfs_remove(topts[cnt].entry);
|
|
|
|
}
|
|
|
|
|
|
|
|
kfree(topts);
|
|
|
|
}
|
|
|
|
|
2009-02-27 11:19:12 +08:00
|
|
|
static struct dentry *
|
|
|
|
create_trace_option_core_file(const char *option, long index)
|
|
|
|
{
|
|
|
|
struct dentry *t_options;
|
|
|
|
struct dentry *entry;
|
|
|
|
|
|
|
|
t_options = trace_options_init_dentry();
|
|
|
|
if (!t_options)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
entry = debugfs_create_file(option, 0644, t_options, (void *)index,
|
|
|
|
&trace_options_core_fops);
|
|
|
|
|
|
|
|
return entry;
|
|
|
|
}
|
|
|
|
|
|
|
|
static __init void create_trace_options_dir(void)
|
|
|
|
{
|
|
|
|
struct dentry *t_options;
|
|
|
|
struct dentry *entry;
|
|
|
|
int i;
|
|
|
|
|
|
|
|
t_options = trace_options_init_dentry();
|
|
|
|
if (!t_options)
|
|
|
|
return;
|
|
|
|
|
|
|
|
for (i = 0; trace_options[i]; i++) {
|
|
|
|
entry = create_trace_option_core_file(trace_options[i], i);
|
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs %s entry\n",
|
|
|
|
trace_options[i]);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2008-09-23 18:34:32 +08:00
|
|
|
static __init int tracer_init_debugfs(void)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
|
|
|
struct dentry *d_tracer;
|
2008-12-02 11:20:19 +08:00
|
|
|
struct dentry *buffers;
|
2008-05-13 03:20:42 +08:00
|
|
|
struct dentry *entry;
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
int cpu;
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
d_tracer = tracing_init_dentry();
|
|
|
|
|
|
|
|
entry = debugfs_create_file("tracing_enabled", 0644, d_tracer,
|
|
|
|
&global_trace, &tracing_ctrl_fops);
|
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs 'tracing_enabled' entry\n");
|
|
|
|
|
2008-11-13 06:52:37 +08:00
|
|
|
entry = debugfs_create_file("trace_options", 0644, d_tracer,
|
2008-05-13 03:20:42 +08:00
|
|
|
NULL, &tracing_iter_fops);
|
|
|
|
if (!entry)
|
2008-11-13 06:52:37 +08:00
|
|
|
pr_warning("Could not create debugfs 'trace_options' entry\n");
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2009-02-27 11:19:12 +08:00
|
|
|
create_trace_options_dir();
|
|
|
|
|
2008-05-13 03:20:52 +08:00
|
|
|
entry = debugfs_create_file("tracing_cpumask", 0644, d_tracer,
|
|
|
|
NULL, &tracing_cpumask_fops);
|
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs 'tracing_cpumask' entry\n");
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
entry = debugfs_create_file("trace", 0444, d_tracer,
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
(void *) TRACE_PIPE_ALL_CPU, &tracing_fops);
|
2008-05-13 03:20:42 +08:00
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs 'trace' entry\n");
|
|
|
|
|
|
|
|
entry = debugfs_create_file("available_tracers", 0444, d_tracer,
|
|
|
|
&global_trace, &show_traces_fops);
|
|
|
|
if (!entry)
|
2008-08-16 03:08:22 +08:00
|
|
|
pr_warning("Could not create debugfs 'available_tracers' entry\n");
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
entry = debugfs_create_file("current_tracer", 0444, d_tracer,
|
|
|
|
&global_trace, &set_tracer_fops);
|
|
|
|
if (!entry)
|
2008-08-16 03:08:22 +08:00
|
|
|
pr_warning("Could not create debugfs 'current_tracer' entry\n");
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
entry = debugfs_create_file("tracing_max_latency", 0644, d_tracer,
|
|
|
|
&tracing_max_latency,
|
|
|
|
&tracing_max_lat_fops);
|
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs "
|
|
|
|
"'tracing_max_latency' entry\n");
|
|
|
|
|
|
|
|
entry = debugfs_create_file("tracing_thresh", 0644, d_tracer,
|
|
|
|
&tracing_thresh, &tracing_max_lat_fops);
|
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs "
|
2008-08-16 03:08:22 +08:00
|
|
|
"'tracing_thresh' entry\n");
|
2008-05-13 03:20:45 +08:00
|
|
|
entry = debugfs_create_file("README", 0644, d_tracer,
|
|
|
|
NULL, &tracing_readme_fops);
|
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs 'README' entry\n");
|
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
entry = debugfs_create_file("trace_pipe", 0444, d_tracer,
|
|
|
|
(void *) TRACE_PIPE_ALL_CPU, &tracing_pipe_fops);
|
2008-05-13 03:20:46 +08:00
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs "
|
2008-08-16 03:08:22 +08:00
|
|
|
"'trace_pipe' entry\n");
|
2008-05-13 03:20:42 +08:00
|
|
|
|
2008-11-13 06:52:36 +08:00
|
|
|
entry = debugfs_create_file("buffer_size_kb", 0644, d_tracer,
|
2008-05-13 03:20:59 +08:00
|
|
|
&global_trace, &tracing_entries_fops);
|
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs "
|
2008-11-13 06:52:36 +08:00
|
|
|
"'buffer_size_kb' entry\n");
|
2008-05-13 03:20:59 +08:00
|
|
|
|
2008-09-17 03:06:42 +08:00
|
|
|
entry = debugfs_create_file("trace_marker", 0220, d_tracer,
|
|
|
|
NULL, &tracing_mark_fops);
|
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs "
|
|
|
|
"'trace_marker' entry\n");
|
|
|
|
|
2008-12-02 11:20:19 +08:00
|
|
|
buffers = debugfs_create_dir("binary_buffers", d_tracer);
|
|
|
|
|
|
|
|
if (!buffers)
|
|
|
|
pr_warning("Could not create buffers directory\n");
|
|
|
|
else {
|
|
|
|
int cpu;
|
|
|
|
char buf[64];
|
|
|
|
|
|
|
|
for_each_tracing_cpu(cpu) {
|
|
|
|
sprintf(buf, "%d", cpu);
|
|
|
|
|
|
|
|
entry = debugfs_create_file(buf, 0444, buffers,
|
|
|
|
(void *)(long)cpu,
|
|
|
|
&tracing_buffers_fops);
|
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs buffers "
|
|
|
|
"'%s' entry\n", buf);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2008-05-13 03:20:42 +08:00
|
|
|
#ifdef CONFIG_DYNAMIC_FTRACE
|
|
|
|
entry = debugfs_create_file("dyn_ftrace_total_info", 0444, d_tracer,
|
|
|
|
&ftrace_update_tot_cnt,
|
2008-10-31 04:08:33 +08:00
|
|
|
&tracing_dyn_info_fops);
|
2008-05-13 03:20:42 +08:00
|
|
|
if (!entry)
|
|
|
|
pr_warning("Could not create debugfs "
|
|
|
|
"'dyn_ftrace_total_info' entry\n");
|
|
|
|
#endif
|
2008-05-13 03:20:49 +08:00
|
|
|
#ifdef CONFIG_SYSPROF_TRACER
|
|
|
|
init_tracer_sysprof_debugfs(d_tracer);
|
|
|
|
#endif
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
|
|
|
|
for_each_tracing_cpu(cpu)
|
|
|
|
tracing_init_debugfs_percpu(cpu);
|
|
|
|
|
2008-09-23 18:34:32 +08:00
|
|
|
return 0;
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
|
|
|
|
2008-12-04 06:45:11 +08:00
|
|
|
/*
 * Format a message and record it in the global trace buffer as a
 * TRACE_PRINT entry.
 *
 * @ip:    stored in the entry's ->ip field
 * @depth: stored in the entry's ->depth field
 * @fmt:   printf-style format string
 * @args:  arguments for @fmt
 *
 * The text is formatted into a single static buffer that is protected by
 * a raw spinlock taken with interrupts disabled, then copied into the
 * reserved ring-buffer event.
 *
 * Returns the length of the formatted text, capped at TRACE_BUF_SIZE - 1.
 * Returns 0 when tracing is disabled, a selftest is running, or this
 * CPU's trace data is marked disabled.  The length is still returned when
 * no ring-buffer event could be reserved.
 */
int trace_vprintk(unsigned long ip, int depth, const char *fmt, va_list args)
{
	static raw_spinlock_t trace_buf_lock = __RAW_SPIN_LOCK_UNLOCKED;
	static char trace_buf[TRACE_BUF_SIZE];

	struct trace_array *tr = &global_trace;
	struct ring_buffer_event *event;
	struct trace_array_cpu *data;
	struct print_entry *entry;
	unsigned long irq_flags;
	int len = 0;
	int cpu, size, pc;

	if (tracing_disabled || tracing_selftest_running)
		return 0;

	/* Sample the preempt count before we change it ourselves. */
	pc = preempt_count();
	preempt_disable_notrace();
	cpu = raw_smp_processor_id();
	data = tr->data[cpu];

	if (unlikely(atomic_read(&data->disabled)))
		goto out;

	pause_graph_tracing();
	raw_local_irq_save(irq_flags);
	__raw_spin_lock(&trace_buf_lock);

	len = vsnprintf(trace_buf, TRACE_BUF_SIZE, fmt, args);

	/* vsnprintf() reports the untruncated length; clamp to what fits. */
	len = min(len, TRACE_BUF_SIZE-1);
	trace_buf[len] = 0;

	size = sizeof(*entry) + len + 1;
	event = trace_buffer_lock_reserve(tr, TRACE_PRINT, size, irq_flags, pc);
	if (event) {
		entry = ring_buffer_event_data(event);
		entry->ip = ip;
		entry->depth = depth;

		memcpy(&entry->buf, trace_buf, len);
		entry->buf[len] = 0;
		ring_buffer_unlock_commit(tr->buffer, event);
	}

	__raw_spin_unlock(&trace_buf_lock);
	raw_local_irq_restore(irq_flags);
	unpause_graph_tracing();
 out:
	preempt_enable_notrace();

	return len;
}
EXPORT_SYMBOL_GPL(trace_vprintk);
|
|
|
|
|
|
|
|
int __ftrace_printk(unsigned long ip, const char *fmt, ...)
|
|
|
|
{
|
|
|
|
int ret;
|
|
|
|
va_list ap;
|
|
|
|
|
|
|
|
if (!(trace_flags & TRACE_ITER_PRINTK))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
va_start(ap, fmt);
|
2008-12-05 06:51:23 +08:00
|
|
|
ret = trace_vprintk(ip, task_curr_ret_stack(current), fmt, ap);
|
2008-09-17 02:58:24 +08:00
|
|
|
va_end(ap);
|
|
|
|
return ret;
|
|
|
|
}
|
2008-08-02 00:26:41 +08:00
|
|
|
EXPORT_SYMBOL_GPL(__ftrace_printk);
|
|
|
|
|
2009-01-23 22:06:23 +08:00
|
|
|
int __ftrace_vprintk(unsigned long ip, const char *fmt, va_list ap)
|
|
|
|
{
|
|
|
|
if (!(trace_flags & TRACE_ITER_PRINTK))
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
return trace_vprintk(ip, task_curr_ret_stack(current), fmt, ap);
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL_GPL(__ftrace_vprintk);
|
|
|
|
|
2008-07-31 10:36:46 +08:00
|
|
|
static int trace_panic_handler(struct notifier_block *this,
|
|
|
|
unsigned long event, void *unused)
|
|
|
|
{
|
2008-10-24 07:26:08 +08:00
|
|
|
if (ftrace_dump_on_oops)
|
|
|
|
ftrace_dump();
|
2008-07-31 10:36:46 +08:00
|
|
|
return NOTIFY_OK;
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct notifier_block trace_panic_notifier = {
|
|
|
|
.notifier_call = trace_panic_handler,
|
|
|
|
.next = NULL,
|
|
|
|
.priority = 150 /* priority: INT_MAX >= x >= 0 */
|
|
|
|
};
|
|
|
|
|
|
|
|
static int trace_die_handler(struct notifier_block *self,
|
|
|
|
unsigned long val,
|
|
|
|
void *data)
|
|
|
|
{
|
|
|
|
switch (val) {
|
|
|
|
case DIE_OOPS:
|
2008-10-24 07:26:08 +08:00
|
|
|
if (ftrace_dump_on_oops)
|
|
|
|
ftrace_dump();
|
2008-07-31 10:36:46 +08:00
|
|
|
break;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
return NOTIFY_OK;
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct notifier_block trace_die_notifier = {
|
|
|
|
.notifier_call = trace_die_handler,
|
|
|
|
.priority = 200
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
|
|
|
|
* printk is set to max of 1024, we really don't need it that big.
|
|
|
|
* Nothing should be printing 1000 characters anyway.
|
|
|
|
*/
|
|
|
|
#define TRACE_MAX_PRINT 1000
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Define here KERN_TRACE so that we have one place to modify
|
|
|
|
* it if we decide to change what log level the ftrace dump
|
|
|
|
* should be at.
|
|
|
|
*/
|
2009-01-15 01:24:42 +08:00
|
|
|
#define KERN_TRACE KERN_EMERG
|
2008-07-31 10:36:46 +08:00
|
|
|
|
|
|
|
static void
|
|
|
|
trace_printk_seq(struct trace_seq *s)
|
|
|
|
{
|
|
|
|
/* Probably should print a warning here. */
|
|
|
|
if (s->len >= 1000)
|
|
|
|
s->len = 1000;
|
|
|
|
|
|
|
|
/* should be zero ended, but we are paranoid. */
|
|
|
|
s->buffer[s->len] = 0;
|
|
|
|
|
|
|
|
printk(KERN_TRACE "%s", s->buffer);
|
|
|
|
|
2009-03-03 03:04:40 +08:00
|
|
|
trace_seq_init(s);
|
2008-07-31 10:36:46 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void ftrace_dump(void)
|
|
|
|
{
|
|
|
|
static DEFINE_SPINLOCK(ftrace_dump_lock);
|
|
|
|
/* use static because iter can be a bit big for the stack */
|
|
|
|
static struct trace_iterator iter;
|
|
|
|
static int dump_ran;
|
2008-10-01 12:29:53 +08:00
|
|
|
unsigned long flags;
|
|
|
|
int cnt = 0, cpu;
|
2008-07-31 10:36:46 +08:00
|
|
|
|
|
|
|
/* only one dump */
|
|
|
|
spin_lock_irqsave(&ftrace_dump_lock, flags);
|
|
|
|
if (dump_ran)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
dump_ran = 1;
|
|
|
|
|
|
|
|
/* No turning back! */
|
2009-01-15 03:50:19 +08:00
|
|
|
tracing_off();
|
2008-10-23 21:33:02 +08:00
|
|
|
ftrace_kill();
|
2008-07-31 10:36:46 +08:00
|
|
|
|
2008-10-01 12:29:53 +08:00
|
|
|
for_each_tracing_cpu(cpu) {
|
|
|
|
atomic_inc(&global_trace.data[cpu]->disabled);
|
|
|
|
}
|
|
|
|
|
2008-11-22 19:28:48 +08:00
|
|
|
/* don't look at user memory in panic mode */
|
|
|
|
trace_flags &= ~TRACE_ITER_SYM_USEROBJ;
|
|
|
|
|
2008-07-31 10:36:46 +08:00
|
|
|
printk(KERN_TRACE "Dumping ftrace buffer:\n");
|
|
|
|
|
|
|
|
iter.tr = &global_trace;
|
|
|
|
iter.trace = current_trace;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* We need to stop all tracing on all CPUS to read the
|
|
|
|
* the next buffer. This is a bit expensive, but is
|
|
|
|
* not done often. We fill all what we can read,
|
|
|
|
* and then release the locks again.
|
|
|
|
*/
|
|
|
|
|
|
|
|
while (!trace_empty(&iter)) {
|
|
|
|
|
|
|
|
if (!cnt)
|
|
|
|
printk(KERN_TRACE "---------------------------------\n");
|
|
|
|
|
|
|
|
cnt++;
|
|
|
|
|
|
|
|
/* reset all but tr, trace, and overruns */
|
|
|
|
memset(&iter.seq, 0,
|
|
|
|
sizeof(struct trace_iterator) -
|
|
|
|
offsetof(struct trace_iterator, seq));
|
|
|
|
iter.iter_flags |= TRACE_FILE_LAT_FMT;
|
|
|
|
iter.pos = -1;
|
|
|
|
|
|
|
|
if (find_next_entry_inc(&iter) != NULL) {
|
|
|
|
print_trace_line(&iter);
|
|
|
|
trace_consume(&iter);
|
|
|
|
}
|
|
|
|
|
|
|
|
trace_printk_seq(&iter.seq);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (!cnt)
|
|
|
|
printk(KERN_TRACE " (ftrace buffer empty)\n");
|
|
|
|
else
|
|
|
|
printk(KERN_TRACE "---------------------------------\n");
|
|
|
|
|
|
|
|
out:
|
|
|
|
spin_unlock_irqrestore(&ftrace_dump_lock, flags);
|
|
|
|
}
|
|
|
|
|
2008-09-30 11:02:41 +08:00
|
|
|
__init static int tracer_alloc_buffers(void)
|
2008-05-13 03:20:42 +08:00
|
|
|
{
|
2008-05-13 03:20:43 +08:00
|
|
|
struct trace_array_cpu *data;
|
|
|
|
int i;
|
2009-01-01 07:42:22 +08:00
|
|
|
int ret = -ENOMEM;
|
2008-05-13 03:20:43 +08:00
|
|
|
|
2009-01-01 07:42:22 +08:00
|
|
|
if (!alloc_cpumask_var(&tracing_buffer_mask, GFP_KERNEL))
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
if (!alloc_cpumask_var(&tracing_cpumask, GFP_KERNEL))
|
|
|
|
goto out_free_buffer_mask;
|
2008-05-13 03:20:43 +08:00
|
|
|
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
if (!alloc_cpumask_var(&tracing_reader_cpumask, GFP_KERNEL))
|
|
|
|
goto out_free_tracing_cpumask;
|
|
|
|
|
2009-01-01 07:42:22 +08:00
|
|
|
cpumask_copy(tracing_buffer_mask, cpu_possible_mask);
|
|
|
|
cpumask_copy(tracing_cpumask, cpu_all_mask);
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, on the tracing debugfs directory, three files are
available to the user to let him extracting the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
informations such as prempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are curretly mixed up
inside these files. Sometimes it messes up the informations,
sometimes it's useful, depending on what does the tracer
capture.
The tracing_cpumask file is useful to filter the output and
select only the traces captured a custom defined set of cpus.
But still it is not enough powerful to extract at the same time
one trace buffer per cpu.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
than with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace file are still available on
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1 But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or in trace_pipe1. Because in trace_pipe is already
a consumer in all cpu buffers in essence.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
cpumask_clear(tracing_reader_cpumask);
|
2009-01-01 07:42:22 +08:00
|
|
|
|
|
|
|
/* TODO: make the number of buffers hot pluggable with CPUS */
|
2008-09-30 11:02:41 +08:00
|
|
|
global_trace.buffer = ring_buffer_alloc(trace_buf_size,
|
|
|
|
TRACE_BUFFER_FLAGS);
|
|
|
|
if (!global_trace.buffer) {
|
|
|
|
printk(KERN_ERR "tracer: failed to allocate ring buffer!\n");
|
|
|
|
WARN_ON(1);
|
2009-01-01 07:42:22 +08:00
|
|
|
goto out_free_cpumask;
|
2008-05-13 03:20:43 +08:00
|
|
|
}
|
2008-09-30 11:02:41 +08:00
|
|
|
global_trace.entries = ring_buffer_size(global_trace.buffer);
|
2008-05-13 03:20:43 +08:00
|
|
|
|
2009-01-01 07:42:22 +08:00
|
|
|
|
2008-05-13 03:20:43 +08:00
|
|
|
#ifdef CONFIG_TRACER_MAX_TRACE
|
2008-09-30 11:02:41 +08:00
|
|
|
max_tr.buffer = ring_buffer_alloc(trace_buf_size,
|
|
|
|
TRACE_BUFFER_FLAGS);
|
|
|
|
if (!max_tr.buffer) {
|
|
|
|
printk(KERN_ERR "tracer: failed to allocate max ring buffer!\n");
|
|
|
|
WARN_ON(1);
|
|
|
|
ring_buffer_free(global_trace.buffer);
|
2009-01-01 07:42:22 +08:00
|
|
|
goto out_free_cpumask;
|
2008-05-13 03:20:43 +08:00
|
|
|
}
|
2008-09-30 11:02:41 +08:00
|
|
|
max_tr.entries = ring_buffer_size(max_tr.buffer);
|
|
|
|
WARN_ON(max_tr.entries != global_trace.entries);
|
2008-05-13 03:20:59 +08:00
|
|
|
#endif
|
2008-05-13 03:21:00 +08:00
|
|
|
|
2008-05-13 03:20:43 +08:00
|
|
|
/* Allocate the first page for all buffers */
|
2008-05-13 03:21:00 +08:00
|
|
|
for_each_tracing_cpu(i) {
|
2008-05-13 03:20:43 +08:00
|
|
|
data = global_trace.data[i] = &per_cpu(global_trace_cpu, i);
|
2008-05-13 03:20:42 +08:00
|
|
|
max_tr.data[i] = &per_cpu(max_data, i);
|
2008-05-13 03:20:43 +08:00
|
|
|
}
|
2008-05-13 03:20:42 +08:00
|
|
|
|
|
|
|
trace_init_cmdlines();
|
|
|
|
|
2008-09-22 02:16:30 +08:00
|
|
|
register_tracer(&nop_trace);
|
2009-02-03 10:38:33 +08:00
|
|
|
current_trace = &nop_trace;
|
2008-09-23 18:34:32 +08:00
|
|
|
#ifdef CONFIG_BOOT_TRACER
|
|
|
|
register_tracer(&boot_tracer);
|
|
|
|
#endif
|
2008-05-13 03:20:44 +08:00
|
|
|
/* All seems OK, enable tracing */
|
|
|
|
tracing_disabled = 0;
|
2008-09-30 11:02:41 +08:00
|
|
|
|
2008-07-31 10:36:46 +08:00
|
|
|
atomic_notifier_chain_register(&panic_notifier_list,
|
|
|
|
&trace_panic_notifier);
|
|
|
|
|
|
|
|
register_die_notifier(&trace_die_notifier);
|
2009-01-01 07:42:22 +08:00
|
|
|
ret = 0;
|
2008-07-31 10:36:46 +08:00
|
|
|
|
2009-01-01 07:42:22 +08:00
|
|
|
out_free_cpumask:
|
tracing/core: introduce per cpu tracing files
Impact: split up tracing output per cpu
Currently, in the tracing debugfs directory, three files are
available to let the user extract the trace output:
- trace is an iterator through the ring-buffer. It's a reader
but not a consumer. It doesn't block when no more traces are
available.
- trace pretty similar to the former, except that it adds more
information such as preempt count, irq flag, ...
- trace_pipe is a reader and a consumer, it will also block
waiting for traces if necessary (heh, yes it's a pipe).
The traces coming from different cpus are currently mixed up
inside these files. Sometimes this muddles the information,
sometimes it's useful, depending on what the tracer
captures.
The tracing_cpumask file is useful to filter the output and
select only the traces captured on a custom-defined set of cpus.
But it is still not powerful enough to extract one trace buffer
per cpu at the same time.
So this patch creates a new directory: /debug/tracing/per_cpu/.
Inside this directory, you will now find one trace_pipe file and
one trace file per cpu.
Which means if you have two cpus, you will have:
trace0
trace1
trace_pipe0
trace_pipe1
And of course, reading these files will have the same effect
as with the usual tracing files, except that you will only see
the traces from the given cpu.
The original all-in-one cpu trace files are still available in
their original place.
Until now, only one consumer was allowed on trace_pipe to avoid
racy consuming on the ring-buffer. Now the approach changed a
bit, you can have only one consumer per cpu.
Which means you are allowed to read concurrently trace_pipe0 and
trace_pipe1. But you can't have two readers on trace_pipe0 or
trace_pipe1.
Following the same logic, if there is one reader on the common
trace_pipe, you can not have at the same time another reader on
trace_pipe0 or on trace_pipe1, because trace_pipe is in essence
already a consumer of all cpu buffers.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2009-02-25 10:22:28 +08:00
|
|
|
free_cpumask_var(tracing_reader_cpumask);
|
|
|
|
out_free_tracing_cpumask:
|
2009-01-01 07:42:22 +08:00
|
|
|
free_cpumask_var(tracing_cpumask);
|
|
|
|
out_free_buffer_mask:
|
|
|
|
free_cpumask_var(tracing_buffer_mask);
|
|
|
|
out:
|
|
|
|
return ret;
|
2008-05-13 03:20:42 +08:00
|
|
|
}
|
2009-02-03 10:38:32 +08:00
|
|
|
|
|
|
|
__init static int clear_boot_tracer(void)
|
|
|
|
{
|
|
|
|
/*
|
|
|
|
* The default tracer at boot buffer is an init section.
|
|
|
|
* This function is called in lateinit. If we did not
|
|
|
|
* find the boot tracer, then clear it out, to prevent
|
|
|
|
* later registration from accessing the buffer that is
|
|
|
|
* about to be freed.
|
|
|
|
*/
|
|
|
|
if (!default_bootup_tracer)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
printk(KERN_INFO "ftrace bootup tracer '%s' not registered.\n",
|
|
|
|
default_bootup_tracer);
|
|
|
|
default_bootup_tracer = NULL;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2008-09-23 18:34:32 +08:00
|
|
|
/*
 * Initcall registration for the tracer: tracer_alloc_buffers() is hooked
 * at the early level, tracer_init_debugfs() at the fs level, and
 * clear_boot_tracer() at the late level.
 */
early_initcall(tracer_alloc_buffers);
|
|
|
|
fs_initcall(tracer_init_debugfs);
|
2009-02-03 10:38:32 +08:00
|
|
|
late_initcall(clear_boot_tracer);
|