ftrace: Implement fs notification for tracing_max_latency
This patch implements the feature that the tracing_max_latency file, e.g. /sys/kernel/debug/tracing/tracing_max_latency will receive notifications through the fsnotify framework when a new latency is available. One particularly interesting use of this facility is when enabling threshold tracing, through /sys/kernel/debug/tracing/tracing_thresh, together with the preempt/irqsoff tracers. This makes it possible to implement a user space program that can, with equal probability, obtain traces of latencies that occur immediately after each other in spite of the fact that the preempt/irqsoff tracers operate in overwrite mode. This facility works with the hwlat, preempt/irqsoff, and wakeup tracers. The tracers may call the latency_fsnotify() from places such as __schedule() or do_idle(); this makes it impossible to call queue_work() directly without risking a deadlock. The same would happen with a softirq, kernel thread or tasklet. For this reason we use the irq_work mechanism to call queue_work(). This patch creates a new workqueue. The reason for doing this is that I wanted to use the WQ_UNBOUND and WQ_HIGHPRI flags. My thinking was that WQ_UNBOUND might help with the latency in some important cases. If we use: queue_work(system_highpri_wq, &tr->fsnotify_work); then the work will (almost) always execute on the same CPU but if we are unlucky that CPU could be too busy while there could be another CPU in the system that would be able to process the work soon enough. queue_work_on() could be used to queue the work on another CPU but it seems difficult to select the right CPU. Link: http://lkml.kernel.org/r/20191008220824.7911-2-viktor.rosendahl@gmail.com Reviewed-by: Joel Fernandes (Google) <joel@joelfernandes.org> Signed-off-by: Viktor Rosendahl (BMW) <viktor.rosendahl@gmail.com> [ Added max() to have one compare for max latency ] Signed-off-by: Steven Rostedt (VMware) <rostedt@goodmis.org>
This commit is contained in:
parent
da537f0aef
commit
91edde2e6a
|
@ -45,6 +45,9 @@
|
||||||
#include <linux/trace.h>
|
#include <linux/trace.h>
|
||||||
#include <linux/sched/clock.h>
|
#include <linux/sched/clock.h>
|
||||||
#include <linux/sched/rt.h>
|
#include <linux/sched/rt.h>
|
||||||
|
#include <linux/fsnotify.h>
|
||||||
|
#include <linux/irq_work.h>
|
||||||
|
#include <linux/workqueue.h>
|
||||||
|
|
||||||
#include "trace.h"
|
#include "trace.h"
|
||||||
#include "trace_output.h"
|
#include "trace_output.h"
|
||||||
|
@ -1497,6 +1500,74 @@ static ssize_t trace_seq_to_buffer(struct trace_seq *s, void *buf, size_t cnt)
|
||||||
}
|
}
|
||||||
|
|
||||||
unsigned long __read_mostly tracing_thresh;
|
unsigned long __read_mostly tracing_thresh;
|
||||||
|
static const struct file_operations tracing_max_lat_fops;
|
||||||
|
|
||||||
|
#if (defined(CONFIG_TRACER_MAX_TRACE) || defined(CONFIG_HWLAT_TRACER)) && \
|
||||||
|
defined(CONFIG_FSNOTIFY)
|
||||||
|
|
||||||
|
static struct workqueue_struct *fsnotify_wq;
|
||||||
|
|
||||||
|
static void latency_fsnotify_workfn(struct work_struct *work)
|
||||||
|
{
|
||||||
|
struct trace_array *tr = container_of(work, struct trace_array,
|
||||||
|
fsnotify_work);
|
||||||
|
fsnotify(tr->d_max_latency->d_inode, FS_MODIFY,
|
||||||
|
tr->d_max_latency->d_inode, FSNOTIFY_EVENT_INODE, NULL, 0);
|
||||||
|
}
|
||||||
|
|
||||||
|
static void latency_fsnotify_workfn_irq(struct irq_work *iwork)
|
||||||
|
{
|
||||||
|
struct trace_array *tr = container_of(iwork, struct trace_array,
|
||||||
|
fsnotify_irqwork);
|
||||||
|
queue_work(fsnotify_wq, &tr->fsnotify_work);
|
||||||
|
}
|
||||||
|
|
||||||
|
static void trace_create_maxlat_file(struct trace_array *tr,
|
||||||
|
struct dentry *d_tracer)
|
||||||
|
{
|
||||||
|
INIT_WORK(&tr->fsnotify_work, latency_fsnotify_workfn);
|
||||||
|
init_irq_work(&tr->fsnotify_irqwork, latency_fsnotify_workfn_irq);
|
||||||
|
tr->d_max_latency = trace_create_file("tracing_max_latency", 0644,
|
||||||
|
d_tracer, &tr->max_latency,
|
||||||
|
&tracing_max_lat_fops);
|
||||||
|
}
|
||||||
|
|
||||||
|
__init static int latency_fsnotify_init(void)
|
||||||
|
{
|
||||||
|
fsnotify_wq = alloc_workqueue("tr_max_lat_wq",
|
||||||
|
WQ_UNBOUND | WQ_HIGHPRI, 0);
|
||||||
|
if (!fsnotify_wq) {
|
||||||
|
pr_err("Unable to allocate tr_max_lat_wq\n");
|
||||||
|
return -ENOMEM;
|
||||||
|
}
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
late_initcall_sync(latency_fsnotify_init);
|
||||||
|
|
||||||
|
void latency_fsnotify(struct trace_array *tr)
|
||||||
|
{
|
||||||
|
if (!fsnotify_wq)
|
||||||
|
return;
|
||||||
|
/*
|
||||||
|
* We cannot call queue_work(&tr->fsnotify_work) from here because it's
|
||||||
|
* possible that we are called from __schedule() or do_idle(), which
|
||||||
|
* could cause a deadlock.
|
||||||
|
*/
|
||||||
|
irq_work_queue(&tr->fsnotify_irqwork);
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* (defined(CONFIG_TRACER_MAX_TRACE) || defined(CONFIG_HWLAT_TRACER)) && \
|
||||||
|
* defined(CONFIG_FSNOTIFY)
|
||||||
|
*/
|
||||||
|
#else
|
||||||
|
|
||||||
|
#define trace_create_maxlat_file(tr, d_tracer) \
|
||||||
|
trace_create_file("tracing_max_latency", 0644, d_tracer, \
|
||||||
|
&tr->max_latency, &tracing_max_lat_fops)
|
||||||
|
|
||||||
|
#endif
|
||||||
|
|
||||||
#ifdef CONFIG_TRACER_MAX_TRACE
|
#ifdef CONFIG_TRACER_MAX_TRACE
|
||||||
/*
|
/*
|
||||||
|
@ -1536,6 +1607,7 @@ __update_max_tr(struct trace_array *tr, struct task_struct *tsk, int cpu)
|
||||||
|
|
||||||
/* record this tasks comm */
|
/* record this tasks comm */
|
||||||
tracing_record_cmdline(tsk);
|
tracing_record_cmdline(tsk);
|
||||||
|
latency_fsnotify(tr);
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
@ -8594,8 +8666,7 @@ init_tracer_tracefs(struct trace_array *tr, struct dentry *d_tracer)
|
||||||
create_trace_options_dir(tr);
|
create_trace_options_dir(tr);
|
||||||
|
|
||||||
#if defined(CONFIG_TRACER_MAX_TRACE) || defined(CONFIG_HWLAT_TRACER)
|
#if defined(CONFIG_TRACER_MAX_TRACE) || defined(CONFIG_HWLAT_TRACER)
|
||||||
trace_create_file("tracing_max_latency", 0644, d_tracer,
|
trace_create_maxlat_file(tr, d_tracer);
|
||||||
&tr->max_latency, &tracing_max_lat_fops);
|
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
if (ftrace_create_function_files(tr, d_tracer))
|
if (ftrace_create_function_files(tr, d_tracer))
|
||||||
|
|
|
@ -16,6 +16,8 @@
|
||||||
#include <linux/trace_events.h>
|
#include <linux/trace_events.h>
|
||||||
#include <linux/compiler.h>
|
#include <linux/compiler.h>
|
||||||
#include <linux/glob.h>
|
#include <linux/glob.h>
|
||||||
|
#include <linux/irq_work.h>
|
||||||
|
#include <linux/workqueue.h>
|
||||||
|
|
||||||
#ifdef CONFIG_FTRACE_SYSCALLS
|
#ifdef CONFIG_FTRACE_SYSCALLS
|
||||||
#include <asm/unistd.h> /* For NR_SYSCALLS */
|
#include <asm/unistd.h> /* For NR_SYSCALLS */
|
||||||
|
@ -264,6 +266,11 @@ struct trace_array {
|
||||||
#endif
|
#endif
|
||||||
#if defined(CONFIG_TRACER_MAX_TRACE) || defined(CONFIG_HWLAT_TRACER)
|
#if defined(CONFIG_TRACER_MAX_TRACE) || defined(CONFIG_HWLAT_TRACER)
|
||||||
unsigned long max_latency;
|
unsigned long max_latency;
|
||||||
|
#ifdef CONFIG_FSNOTIFY
|
||||||
|
struct dentry *d_max_latency;
|
||||||
|
struct work_struct fsnotify_work;
|
||||||
|
struct irq_work fsnotify_irqwork;
|
||||||
|
#endif
|
||||||
#endif
|
#endif
|
||||||
struct trace_pid_list __rcu *filtered_pids;
|
struct trace_pid_list __rcu *filtered_pids;
|
||||||
/*
|
/*
|
||||||
|
@ -786,6 +793,17 @@ void update_max_tr_single(struct trace_array *tr,
|
||||||
struct task_struct *tsk, int cpu);
|
struct task_struct *tsk, int cpu);
|
||||||
#endif /* CONFIG_TRACER_MAX_TRACE */
|
#endif /* CONFIG_TRACER_MAX_TRACE */
|
||||||
|
|
||||||
|
#if (defined(CONFIG_TRACER_MAX_TRACE) || defined(CONFIG_HWLAT_TRACER)) && \
|
||||||
|
defined(CONFIG_FSNOTIFY)
|
||||||
|
|
||||||
|
void latency_fsnotify(struct trace_array *tr);
|
||||||
|
|
||||||
|
#else
|
||||||
|
|
||||||
|
static void latency_fsnotify(struct trace_array *tr) { }
|
||||||
|
|
||||||
|
#endif
|
||||||
|
|
||||||
#ifdef CONFIG_STACKTRACE
|
#ifdef CONFIG_STACKTRACE
|
||||||
void __trace_stack(struct trace_array *tr, unsigned long flags, int skip,
|
void __trace_stack(struct trace_array *tr, unsigned long flags, int skip,
|
||||||
int pc);
|
int pc);
|
||||||
|
|
|
@ -237,6 +237,7 @@ static int get_sample(void)
|
||||||
/* If we exceed the threshold value, we have found a hardware latency */
|
/* If we exceed the threshold value, we have found a hardware latency */
|
||||||
if (sample > thresh || outer_sample > thresh) {
|
if (sample > thresh || outer_sample > thresh) {
|
||||||
struct hwlat_sample s;
|
struct hwlat_sample s;
|
||||||
|
u64 latency;
|
||||||
|
|
||||||
ret = 1;
|
ret = 1;
|
||||||
|
|
||||||
|
@ -253,11 +254,13 @@ static int get_sample(void)
|
||||||
s.nmi_count = nmi_count;
|
s.nmi_count = nmi_count;
|
||||||
trace_hwlat_sample(&s);
|
trace_hwlat_sample(&s);
|
||||||
|
|
||||||
|
latency = max(sample, outer_sample);
|
||||||
|
|
||||||
/* Keep a running maximum ever recorded hardware latency */
|
/* Keep a running maximum ever recorded hardware latency */
|
||||||
if (sample > tr->max_latency)
|
if (latency > tr->max_latency) {
|
||||||
tr->max_latency = sample;
|
tr->max_latency = latency;
|
||||||
if (outer_sample > tr->max_latency)
|
latency_fsnotify(tr);
|
||||||
tr->max_latency = outer_sample;
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
out:
|
out:
|
||||||
|
|
Loading…
Reference in New Issue