Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tj/percpu
[safe/jmp/linux-2.6] / kernel / trace / trace_sched_switch.c
index 2715267..5fca0f5 100644 (file)
 #include <linux/debugfs.h>
 #include <linux/kallsyms.h>
 #include <linux/uaccess.h>
-#include <linux/marker.h>
 #include <linux/ftrace.h>
+#include <trace/events/sched.h>
 
 #include "trace.h"
 
 static struct trace_array      *ctx_trace;
 static int __read_mostly       tracer_enabled;
+static int                     sched_ref;
+static DEFINE_MUTEX(sched_register_mutex);
+static int                     sched_stopped;
 
-static void notrace
-ctx_switch_func(struct task_struct *prev, struct task_struct *next)
+
+void
+tracing_sched_switch_trace(struct trace_array *tr,
+                          struct task_struct *prev,
+                          struct task_struct *next,
+                          unsigned long flags, int pc)
+{
+       struct ftrace_event_call *call = &event_context_switch;
+       struct ring_buffer *buffer = tr->buffer;
+       struct ring_buffer_event *event;
+       struct ctx_switch_entry *entry;
+
+       event = trace_buffer_lock_reserve(buffer, TRACE_CTX,
+                                         sizeof(*entry), flags, pc);
+       if (!event)
+               return;
+       entry   = ring_buffer_event_data(event);
+       entry->prev_pid                 = prev->pid;
+       entry->prev_prio                = prev->prio;
+       entry->prev_state               = prev->state;
+       entry->next_pid                 = next->pid;
+       entry->next_prio                = next->prio;
+       entry->next_state               = next->state;
+       entry->next_cpu = task_cpu(next);
+
+       if (!filter_check_discard(call, entry, buffer, event))
+               trace_buffer_unlock_commit(buffer, event, flags, pc);
+}
+
+static void
+probe_sched_switch(struct rq *__rq, struct task_struct *prev,
+                       struct task_struct *next)
 {
-       struct trace_array *tr = ctx_trace;
        struct trace_array_cpu *data;
        unsigned long flags;
-       long disabled;
        int cpu;
+       int pc;
 
-       if (!tracer_enabled)
+       if (unlikely(!sched_ref))
                return;
 
+       tracing_record_cmdline(prev);
+       tracing_record_cmdline(next);
+
+       if (!tracer_enabled || sched_stopped)
+               return;
+
+       pc = preempt_count();
        local_irq_save(flags);
        cpu = raw_smp_processor_id();
-       data = tr->data[cpu];
-       disabled = atomic_inc_return(&data->disabled);
+       data = ctx_trace->data[cpu];
 
-       if (likely(disabled == 1))
-               tracing_sched_switch_trace(tr, data, prev, next, flags);
+       if (likely(!atomic_read(&data->disabled)))
+               tracing_sched_switch_trace(ctx_trace, prev, next, flags, pc);
 
-       atomic_dec(&data->disabled);
        local_irq_restore(flags);
 }
 
-void ftrace_ctx_switch(struct task_struct *prev, struct task_struct *next)
+void
+tracing_sched_wakeup_trace(struct trace_array *tr,
+                          struct task_struct *wakee,
+                          struct task_struct *curr,
+                          unsigned long flags, int pc)
 {
-       tracing_record_cmdline(prev);
+       struct ftrace_event_call *call = &event_wakeup;
+       struct ring_buffer_event *event;
+       struct ctx_switch_entry *entry;
+       struct ring_buffer *buffer = tr->buffer;
 
-       /*
-        * If tracer_switch_func only points to the local
-        * switch func, it still needs the ptr passed to it.
-        */
-       ctx_switch_func(prev, next);
+       event = trace_buffer_lock_reserve(buffer, TRACE_WAKE,
+                                         sizeof(*entry), flags, pc);
+       if (!event)
+               return;
+       entry   = ring_buffer_event_data(event);
+       entry->prev_pid                 = curr->pid;
+       entry->prev_prio                = curr->prio;
+       entry->prev_state               = curr->state;
+       entry->next_pid                 = wakee->pid;
+       entry->next_prio                = wakee->prio;
+       entry->next_state               = wakee->state;
+       entry->next_cpu                 = task_cpu(wakee);
 
-       /*
-        * Chain to the wakeup tracer (this is a NOP if disabled):
-        */
-       wakeup_sched_switch(prev, next);
+       if (!filter_check_discard(call, entry, buffer, event))
+               ring_buffer_unlock_commit(buffer, event);
+       ftrace_trace_stack(tr->buffer, flags, 6, pc);
+       ftrace_trace_userstack(tr->buffer, flags, pc);
 }
 
-static notrace void sched_switch_reset(struct trace_array *tr)
+static void
+probe_sched_wakeup(struct rq *__rq, struct task_struct *wakee, int success)
 {
-       int cpu;
+       struct trace_array_cpu *data;
+       unsigned long flags;
+       int cpu, pc;
+
+       if (unlikely(!sched_ref))
+               return;
+
+       tracing_record_cmdline(current);
+
+       if (!tracer_enabled || sched_stopped)
+               return;
+
+       pc = preempt_count();
+       local_irq_save(flags);
+       cpu = raw_smp_processor_id();
+       data = ctx_trace->data[cpu];
+
+       if (likely(!atomic_read(&data->disabled)))
+               tracing_sched_wakeup_trace(ctx_trace, wakee, current,
+                                          flags, pc);
+
+       local_irq_restore(flags);
+}
+
+static int tracing_sched_register(void)
+{
+       int ret;
+
+       ret = register_trace_sched_wakeup(probe_sched_wakeup);
+       if (ret) {
+               pr_info("wakeup trace: Couldn't activate tracepoint"
+                       " probe to kernel_sched_wakeup\n");
+               return ret;
+       }
+
+       ret = register_trace_sched_wakeup_new(probe_sched_wakeup);
+       if (ret) {
+               pr_info("wakeup trace: Couldn't activate tracepoint"
+                       " probe to kernel_sched_wakeup_new\n");
+               goto fail_deprobe;
+       }
+
+       ret = register_trace_sched_switch(probe_sched_switch);
+       if (ret) {
+               pr_info("sched trace: Couldn't activate tracepoint"
+                       " probe to kernel_sched_switch\n");
+               goto fail_deprobe_wake_new;
+       }
+
+       return ret;
+fail_deprobe_wake_new:
+       unregister_trace_sched_wakeup_new(probe_sched_wakeup);
+fail_deprobe:
+       unregister_trace_sched_wakeup(probe_sched_wakeup);
+       return ret;
+}
 
-       tr->time_start = now(tr->cpu);
+static void tracing_sched_unregister(void)
+{
+       unregister_trace_sched_switch(probe_sched_switch);
+       unregister_trace_sched_wakeup_new(probe_sched_wakeup);
+       unregister_trace_sched_wakeup(probe_sched_wakeup);
+}
 
-       for_each_online_cpu(cpu)
-               tracing_reset(tr->data[cpu]);
+static void tracing_start_sched_switch(void)
+{
+       mutex_lock(&sched_register_mutex);
+       if (!(sched_ref++))
+               tracing_sched_register();
+       mutex_unlock(&sched_register_mutex);
 }
 
-static notrace void start_sched_trace(struct trace_array *tr)
+static void tracing_stop_sched_switch(void)
 {
-       sched_switch_reset(tr);
-       tracer_enabled = 1;
+       mutex_lock(&sched_register_mutex);
+       if (!(--sched_ref))
+               tracing_sched_unregister();
+       mutex_unlock(&sched_register_mutex);
+}
+
+void tracing_start_cmdline_record(void)
+{
+       tracing_start_sched_switch();
+}
+
+void tracing_stop_cmdline_record(void)
+{
+       tracing_stop_sched_switch();
+}
+
+/**
+ * tracing_start_sched_switch_record - start tracing context switches
+ *
+ * Turns on context switch tracing for a tracer.
+ */
+void tracing_start_sched_switch_record(void)
+{
+       if (unlikely(!ctx_trace)) {
+               WARN_ON(1);
+               return;
+       }
+
+       tracing_start_sched_switch();
+
+       mutex_lock(&sched_register_mutex);
+       tracer_enabled++;
+       mutex_unlock(&sched_register_mutex);
 }
 
-static notrace void stop_sched_trace(struct trace_array *tr)
+/**
+ * tracing_stop_sched_switch_record - start tracing context switches
+ *
+ * Turns off context switch tracing for a tracer.
+ */
+void tracing_stop_sched_switch_record(void)
 {
-       tracer_enabled = 0;
+       mutex_lock(&sched_register_mutex);
+       tracer_enabled--;
+       WARN_ON(tracer_enabled < 0);
+       mutex_unlock(&sched_register_mutex);
+
+       tracing_stop_sched_switch();
 }
 
-static notrace void sched_switch_trace_init(struct trace_array *tr)
+/**
+ * tracing_sched_switch_assign_trace - assign a trace array for ctx switch
+ * @tr: trace array pointer to assign
+ *
+ * Some tracers might want to record the context switches in their
+ * trace. This function lets those tracers assign the trace array
+ * to use.
+ */
+void tracing_sched_switch_assign_trace(struct trace_array *tr)
 {
        ctx_trace = tr;
+}
 
-       if (tr->ctrl)
-               start_sched_trace(tr);
+static void stop_sched_trace(struct trace_array *tr)
+{
+       tracing_stop_sched_switch_record();
 }
 
-static notrace void sched_switch_trace_reset(struct trace_array *tr)
+static int sched_switch_trace_init(struct trace_array *tr)
 {
-       if (tr->ctrl)
-               stop_sched_trace(tr);
+       ctx_trace = tr;
+       tracing_reset_online_cpus(tr);
+       tracing_start_sched_switch_record();
+       return 0;
 }
 
-static void sched_switch_trace_ctrl_update(struct trace_array *tr)
+static void sched_switch_trace_reset(struct trace_array *tr)
 {
-       /* When starting a new trace, reset the buffers */
-       if (tr->ctrl)
-               start_sched_trace(tr);
-       else
+       if (sched_ref)
                stop_sched_trace(tr);
 }
 
+static void sched_switch_trace_start(struct trace_array *tr)
+{
+       sched_stopped = 0;
+}
+
+static void sched_switch_trace_stop(struct trace_array *tr)
+{
+       sched_stopped = 1;
+}
+
 static struct tracer sched_switch_trace __read_mostly =
 {
        .name           = "sched_switch",
        .init           = sched_switch_trace_init,
        .reset          = sched_switch_trace_reset,
-       .ctrl_update    = sched_switch_trace_ctrl_update,
+       .start          = sched_switch_trace_start,
+       .stop           = sched_switch_trace_stop,
+       .wait_pipe      = poll_wait_pipe,
+#ifdef CONFIG_FTRACE_SELFTEST
+       .selftest    = trace_selftest_startup_sched_switch,
+#endif
 };
 
 __init static int init_sched_switch_trace(void)
@@ -114,3 +295,4 @@ __init static int init_sched_switch_trace(void)
        return register_tracer(&sched_switch_trace);
 }
 device_initcall(init_sched_switch_trace);
+