d0316554d3
* 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tj/percpu: (34 commits) m68k: rename global variable vmalloc_end to m68k_vmalloc_end percpu: add missing per_cpu_ptr_to_phys() definition for UP percpu: Fix kdump failure if booted with percpu_alloc=page percpu: make misc percpu symbols unique percpu: make percpu symbols in ia64 unique percpu: make percpu symbols in powerpc unique percpu: make percpu symbols in x86 unique percpu: make percpu symbols in xen unique percpu: make percpu symbols in cpufreq unique percpu: make percpu symbols in oprofile unique percpu: make percpu symbols in tracer unique percpu: make percpu symbols under kernel/ and mm/ unique percpu: remove some sparse warnings percpu: make alloc_percpu() handle array types vmalloc: fix use of non-existent percpu variable in put_cpu_var() this_cpu: Use this_cpu_xx in trace_functions_graph.c this_cpu: Use this_cpu_xx for ftrace this_cpu: Use this_cpu_xx in nmi handling this_cpu: Use this_cpu operations in RCU this_cpu: Use this_cpu ops for VM statistics ... Fix up trivial (famous last words) global per-cpu naming conflicts in arch/x86/kvm/svm.c mm/slab.c
313 lines
7.2 KiB
C
313 lines
7.2 KiB
C
/*
|
|
* h/w branch tracer for x86 based on BTS
|
|
*
|
|
* Copyright (C) 2008-2009 Intel Corporation.
|
|
* Markus Metzger <markus.t.metzger@gmail.com>, 2008-2009
|
|
*/
|
|
#include <linux/kallsyms.h>
|
|
#include <linux/debugfs.h>
|
|
#include <linux/ftrace.h>
|
|
#include <linux/module.h>
|
|
#include <linux/cpu.h>
|
|
#include <linux/smp.h>
|
|
#include <linux/fs.h>
|
|
|
|
#include <asm/ds.h>
|
|
|
|
#include "trace_output.h"
|
|
#include "trace.h"
|
|
|
|
|
|
#define BTS_BUFFER_SIZE (1 << 13)
|
|
|
|
static DEFINE_PER_CPU(struct bts_tracer *, hwb_tracer);
|
|
static DEFINE_PER_CPU(unsigned char[BTS_BUFFER_SIZE], hwb_buffer);
|
|
|
|
#define this_tracer per_cpu(hwb_tracer, smp_processor_id())
|
|
|
|
static int trace_hw_branches_enabled __read_mostly;
|
|
static int trace_hw_branches_suspended __read_mostly;
|
|
static struct trace_array *hw_branch_trace __read_mostly;
|
|
|
|
|
|
static void bts_trace_init_cpu(int cpu)
|
|
{
|
|
per_cpu(hwb_tracer, cpu) =
|
|
ds_request_bts_cpu(cpu, per_cpu(hwb_buffer, cpu),
|
|
BTS_BUFFER_SIZE, NULL, (size_t)-1,
|
|
BTS_KERNEL);
|
|
|
|
if (IS_ERR(per_cpu(hwb_tracer, cpu)))
|
|
per_cpu(hwb_tracer, cpu) = NULL;
|
|
}
|
|
|
|
static int bts_trace_init(struct trace_array *tr)
|
|
{
|
|
int cpu;
|
|
|
|
hw_branch_trace = tr;
|
|
trace_hw_branches_enabled = 0;
|
|
|
|
get_online_cpus();
|
|
for_each_online_cpu(cpu) {
|
|
bts_trace_init_cpu(cpu);
|
|
|
|
if (likely(per_cpu(hwb_tracer, cpu)))
|
|
trace_hw_branches_enabled = 1;
|
|
}
|
|
trace_hw_branches_suspended = 0;
|
|
put_online_cpus();
|
|
|
|
/* If we could not enable tracing on a single cpu, we fail. */
|
|
return trace_hw_branches_enabled ? 0 : -EOPNOTSUPP;
|
|
}
|
|
|
|
static void bts_trace_reset(struct trace_array *tr)
|
|
{
|
|
int cpu;
|
|
|
|
get_online_cpus();
|
|
for_each_online_cpu(cpu) {
|
|
if (likely(per_cpu(hwb_tracer, cpu))) {
|
|
ds_release_bts(per_cpu(hwb_tracer, cpu));
|
|
per_cpu(hwb_tracer, cpu) = NULL;
|
|
}
|
|
}
|
|
trace_hw_branches_enabled = 0;
|
|
trace_hw_branches_suspended = 0;
|
|
put_online_cpus();
|
|
}
|
|
|
|
static void bts_trace_start(struct trace_array *tr)
|
|
{
|
|
int cpu;
|
|
|
|
get_online_cpus();
|
|
for_each_online_cpu(cpu)
|
|
if (likely(per_cpu(hwb_tracer, cpu)))
|
|
ds_resume_bts(per_cpu(hwb_tracer, cpu));
|
|
trace_hw_branches_suspended = 0;
|
|
put_online_cpus();
|
|
}
|
|
|
|
static void bts_trace_stop(struct trace_array *tr)
|
|
{
|
|
int cpu;
|
|
|
|
get_online_cpus();
|
|
for_each_online_cpu(cpu)
|
|
if (likely(per_cpu(hwb_tracer, cpu)))
|
|
ds_suspend_bts(per_cpu(hwb_tracer, cpu));
|
|
trace_hw_branches_suspended = 1;
|
|
put_online_cpus();
|
|
}
|
|
|
|
static int __cpuinit bts_hotcpu_handler(struct notifier_block *nfb,
|
|
unsigned long action, void *hcpu)
|
|
{
|
|
int cpu = (long)hcpu;
|
|
|
|
switch (action) {
|
|
case CPU_ONLINE:
|
|
case CPU_DOWN_FAILED:
|
|
/* The notification is sent with interrupts enabled. */
|
|
if (trace_hw_branches_enabled) {
|
|
bts_trace_init_cpu(cpu);
|
|
|
|
if (trace_hw_branches_suspended &&
|
|
likely(per_cpu(hwb_tracer, cpu)))
|
|
ds_suspend_bts(per_cpu(hwb_tracer, cpu));
|
|
}
|
|
break;
|
|
|
|
case CPU_DOWN_PREPARE:
|
|
/* The notification is sent with interrupts enabled. */
|
|
if (likely(per_cpu(hwb_tracer, cpu))) {
|
|
ds_release_bts(per_cpu(hwb_tracer, cpu));
|
|
per_cpu(hwb_tracer, cpu) = NULL;
|
|
}
|
|
}
|
|
|
|
return NOTIFY_DONE;
|
|
}
|
|
|
|
static struct notifier_block bts_hotcpu_notifier __cpuinitdata = {
|
|
.notifier_call = bts_hotcpu_handler
|
|
};
|
|
|
|
static void bts_trace_print_header(struct seq_file *m)
|
|
{
|
|
seq_puts(m, "# CPU# TO <- FROM\n");
|
|
}
|
|
|
|
static enum print_line_t bts_trace_print_line(struct trace_iterator *iter)
|
|
{
|
|
unsigned long symflags = TRACE_ITER_SYM_OFFSET;
|
|
struct trace_entry *entry = iter->ent;
|
|
struct trace_seq *seq = &iter->seq;
|
|
struct hw_branch_entry *it;
|
|
|
|
trace_assign_type(it, entry);
|
|
|
|
if (entry->type == TRACE_HW_BRANCHES) {
|
|
if (trace_seq_printf(seq, "%4d ", iter->cpu) &&
|
|
seq_print_ip_sym(seq, it->to, symflags) &&
|
|
trace_seq_printf(seq, "\t <- ") &&
|
|
seq_print_ip_sym(seq, it->from, symflags) &&
|
|
trace_seq_printf(seq, "\n"))
|
|
return TRACE_TYPE_HANDLED;
|
|
return TRACE_TYPE_PARTIAL_LINE;
|
|
}
|
|
return TRACE_TYPE_UNHANDLED;
|
|
}
|
|
|
|
void trace_hw_branch(u64 from, u64 to)
|
|
{
|
|
struct ftrace_event_call *call = &event_hw_branch;
|
|
struct trace_array *tr = hw_branch_trace;
|
|
struct ring_buffer_event *event;
|
|
struct ring_buffer *buf;
|
|
struct hw_branch_entry *entry;
|
|
unsigned long irq1;
|
|
int cpu;
|
|
|
|
if (unlikely(!tr))
|
|
return;
|
|
|
|
if (unlikely(!trace_hw_branches_enabled))
|
|
return;
|
|
|
|
local_irq_save(irq1);
|
|
cpu = raw_smp_processor_id();
|
|
if (atomic_inc_return(&tr->data[cpu]->disabled) != 1)
|
|
goto out;
|
|
|
|
buf = tr->buffer;
|
|
event = trace_buffer_lock_reserve(buf, TRACE_HW_BRANCHES,
|
|
sizeof(*entry), 0, 0);
|
|
if (!event)
|
|
goto out;
|
|
entry = ring_buffer_event_data(event);
|
|
tracing_generic_entry_update(&entry->ent, 0, from);
|
|
entry->ent.type = TRACE_HW_BRANCHES;
|
|
entry->from = from;
|
|
entry->to = to;
|
|
if (!filter_check_discard(call, entry, buf, event))
|
|
trace_buffer_unlock_commit(buf, event, 0, 0);
|
|
|
|
out:
|
|
atomic_dec(&tr->data[cpu]->disabled);
|
|
local_irq_restore(irq1);
|
|
}
|
|
|
|
static void trace_bts_at(const struct bts_trace *trace, void *at)
|
|
{
|
|
struct bts_struct bts;
|
|
int err = 0;
|
|
|
|
WARN_ON_ONCE(!trace->read);
|
|
if (!trace->read)
|
|
return;
|
|
|
|
err = trace->read(this_tracer, at, &bts);
|
|
if (err < 0)
|
|
return;
|
|
|
|
switch (bts.qualifier) {
|
|
case BTS_BRANCH:
|
|
trace_hw_branch(bts.variant.lbr.from, bts.variant.lbr.to);
|
|
break;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Collect the trace on the current cpu and write it into the ftrace buffer.
|
|
*
|
|
* pre: tracing must be suspended on the current cpu
|
|
*/
|
|
static void trace_bts_cpu(void *arg)
|
|
{
|
|
struct trace_array *tr = (struct trace_array *)arg;
|
|
const struct bts_trace *trace;
|
|
unsigned char *at;
|
|
|
|
if (unlikely(!tr))
|
|
return;
|
|
|
|
if (unlikely(atomic_read(&tr->data[raw_smp_processor_id()]->disabled)))
|
|
return;
|
|
|
|
if (unlikely(!this_tracer))
|
|
return;
|
|
|
|
trace = ds_read_bts(this_tracer);
|
|
if (!trace)
|
|
return;
|
|
|
|
for (at = trace->ds.top; (void *)at < trace->ds.end;
|
|
at += trace->ds.size)
|
|
trace_bts_at(trace, at);
|
|
|
|
for (at = trace->ds.begin; (void *)at < trace->ds.top;
|
|
at += trace->ds.size)
|
|
trace_bts_at(trace, at);
|
|
}
|
|
|
|
static void trace_bts_prepare(struct trace_iterator *iter)
|
|
{
|
|
int cpu;
|
|
|
|
get_online_cpus();
|
|
for_each_online_cpu(cpu)
|
|
if (likely(per_cpu(hwb_tracer, cpu)))
|
|
ds_suspend_bts(per_cpu(hwb_tracer, cpu));
|
|
/*
|
|
* We need to collect the trace on the respective cpu since ftrace
|
|
* implicitly adds the record for the current cpu.
|
|
* Once that is more flexible, we could collect the data from any cpu.
|
|
*/
|
|
on_each_cpu(trace_bts_cpu, iter->tr, 1);
|
|
|
|
for_each_online_cpu(cpu)
|
|
if (likely(per_cpu(hwb_tracer, cpu)))
|
|
ds_resume_bts(per_cpu(hwb_tracer, cpu));
|
|
put_online_cpus();
|
|
}
|
|
|
|
static void trace_bts_close(struct trace_iterator *iter)
|
|
{
|
|
tracing_reset_online_cpus(iter->tr);
|
|
}
|
|
|
|
void trace_hw_branch_oops(void)
|
|
{
|
|
if (this_tracer) {
|
|
ds_suspend_bts_noirq(this_tracer);
|
|
trace_bts_cpu(hw_branch_trace);
|
|
ds_resume_bts_noirq(this_tracer);
|
|
}
|
|
}
|
|
|
|
struct tracer bts_tracer __read_mostly =
|
|
{
|
|
.name = "hw-branch-tracer",
|
|
.init = bts_trace_init,
|
|
.reset = bts_trace_reset,
|
|
.print_header = bts_trace_print_header,
|
|
.print_line = bts_trace_print_line,
|
|
.start = bts_trace_start,
|
|
.stop = bts_trace_stop,
|
|
.open = trace_bts_prepare,
|
|
.close = trace_bts_close,
|
|
#ifdef CONFIG_FTRACE_SELFTEST
|
|
.selftest = trace_selftest_startup_hw_branches,
|
|
#endif /* CONFIG_FTRACE_SELFTEST */
|
|
};
|
|
|
|
__init static int init_bts_trace(void)
|
|
{
|
|
register_hotcpu_notifier(&bts_hotcpu_notifier);
|
|
return register_tracer(&bts_tracer);
|
|
}
|
|
device_initcall(init_bts_trace);
|