mirror of
				https://github.com/torvalds/linux.git
				synced 2025-11-04 02:30:34 +02:00 
			
		
		
		
	In the branch annotation output it is difficult to spot the worst
offenders, because the entries are sorted only by percentage:
 correct incorrect  %        Function                  File              Line
 ------- ---------  -        --------                  ----              ----
       0      163 100 qdisc_restart                  sch_generic.c        179
       0      163 100 pfifo_fast_dequeue             sch_generic.c        447
       0        4 100 pskb_trim_rcsum                skbuff.h             1689
       0        4 100 llc_rcv                        llc_input.c          170
       0       18 100 psmouse_interrupt              psmouse-base.c       304
       0        3 100 atkbd_interrupt                atkbd.c              389
       0        5 100 usb_alloc_dev                  usb.c                437
       0       11 100 vsscanf                        vsprintf.c           1897
       0        2 100 IS_ERR                         err.h                34
       0       23 100 __rmqueue_fallback             page_alloc.c         865
       0        4 100 probe_wakeup_sched_switch      trace_sched_wakeup.c 142
       0        3 100 move_masked_irq                migration.c          11
Adding the incorrect and correct values as sort keys makes this file a
bit more informative:
 correct incorrect  %        Function                  File              Line
 ------- ---------  -        --------                  ----              ----
       0   366541 100 audit_syscall_entry            auditsc.c            1637
       0   366538 100 audit_syscall_exit             auditsc.c            1685
       0   115839 100 sched_info_switch              sched_stats.h        269
       0    74567 100 sched_info_queued              sched_stats.h        222
       0    66578 100 sched_info_dequeued            sched_stats.h        177
       0    15113 100 trace_workqueue_insertion      workqueue.h          38
       0    15107 100 trace_workqueue_execution      workqueue.h          45
       0     3622 100 syscall_trace_leave            ptrace.c             1772
       0     2750 100 sched_move_task                sched.c              10100
       0     2750 100 sched_move_task                sched.c              10110
       0     1815 100 pre_schedule_rt                sched_rt.c           1462
       0      837 100 audit_alloc                    auditsc.c            879
       0      814 100 tcp_mss_split_point            tcp_output.c         1302
Signed-off-by: Steven Rostedt <rostedt@goodmis.org>
		
	
			
		
			
				
	
	
		
			407 lines
		
	
	
	
		
			8.9 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			407 lines
		
	
	
	
		
			8.9 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 | 
						|
 * unlikely profiler
 | 
						|
 *
 | 
						|
 * Copyright (C) 2008 Steven Rostedt <srostedt@redhat.com>
 | 
						|
 */
 | 
						|
#include <linux/kallsyms.h>
 | 
						|
#include <linux/seq_file.h>
 | 
						|
#include <linux/spinlock.h>
 | 
						|
#include <linux/irqflags.h>
 | 
						|
#include <linux/debugfs.h>
 | 
						|
#include <linux/uaccess.h>
 | 
						|
#include <linux/module.h>
 | 
						|
#include <linux/ftrace.h>
 | 
						|
#include <linux/hash.h>
 | 
						|
#include <linux/fs.h>
 | 
						|
#include <asm/local.h>
 | 
						|
 | 
						|
#include "trace.h"
 | 
						|
#include "trace_stat.h"
 | 
						|
#include "trace_output.h"
 | 
						|
 | 
						|
#ifdef CONFIG_BRANCH_TRACER
 | 
						|
 | 
						|
/* Forward declaration; the tracer is defined after its callbacks below. */
static struct tracer branch_trace;
 | 
						|
/* Enable count: bumped by enable_branch_tracing(), zero means off. */
static int branch_tracing_enabled __read_mostly;
 | 
						|
/* Held while branch_tracer and branch_tracing_enabled are updated. */
static DEFINE_MUTEX(branch_tracing_mutex);
 | 
						|
 | 
						|
/* Trace array that probe_likely_condition() records into. */
static struct trace_array *branch_tracer;
 | 
						|
 | 
						|
static void
 | 
						|
probe_likely_condition(struct ftrace_branch_data *f, int val, int expect)
 | 
						|
{
 | 
						|
	struct ftrace_event_call *call = &event_branch;
 | 
						|
	struct trace_array *tr = branch_tracer;
 | 
						|
	struct ring_buffer_event *event;
 | 
						|
	struct trace_branch *entry;
 | 
						|
	struct ring_buffer *buffer;
 | 
						|
	unsigned long flags;
 | 
						|
	int cpu, pc;
 | 
						|
	const char *p;
 | 
						|
 | 
						|
	/*
 | 
						|
	 * I would love to save just the ftrace_likely_data pointer, but
 | 
						|
	 * this code can also be used by modules. Ugly things can happen
 | 
						|
	 * if the module is unloaded, and then we go and read the
 | 
						|
	 * pointer.  This is slower, but much safer.
 | 
						|
	 */
 | 
						|
 | 
						|
	if (unlikely(!tr))
 | 
						|
		return;
 | 
						|
 | 
						|
	local_irq_save(flags);
 | 
						|
	cpu = raw_smp_processor_id();
 | 
						|
	if (atomic_inc_return(&tr->data[cpu]->disabled) != 1)
 | 
						|
		goto out;
 | 
						|
 | 
						|
	pc = preempt_count();
 | 
						|
	buffer = tr->buffer;
 | 
						|
	event = trace_buffer_lock_reserve(buffer, TRACE_BRANCH,
 | 
						|
					  sizeof(*entry), flags, pc);
 | 
						|
	if (!event)
 | 
						|
		goto out;
 | 
						|
 | 
						|
	entry	= ring_buffer_event_data(event);
 | 
						|
 | 
						|
	/* Strip off the path, only save the file */
 | 
						|
	p = f->file + strlen(f->file);
 | 
						|
	while (p >= f->file && *p != '/')
 | 
						|
		p--;
 | 
						|
	p++;
 | 
						|
 | 
						|
	strncpy(entry->func, f->func, TRACE_FUNC_SIZE);
 | 
						|
	strncpy(entry->file, p, TRACE_FILE_SIZE);
 | 
						|
	entry->func[TRACE_FUNC_SIZE] = 0;
 | 
						|
	entry->file[TRACE_FILE_SIZE] = 0;
 | 
						|
	entry->line = f->line;
 | 
						|
	entry->correct = val == expect;
 | 
						|
 | 
						|
	if (!filter_check_discard(call, entry, buffer, event))
 | 
						|
		ring_buffer_unlock_commit(buffer, event);
 | 
						|
 | 
						|
 out:
 | 
						|
	atomic_dec(&tr->data[cpu]->disabled);
 | 
						|
	local_irq_restore(flags);
 | 
						|
}
 | 
						|
 | 
						|
static inline
 | 
						|
void trace_likely_condition(struct ftrace_branch_data *f, int val, int expect)
 | 
						|
{
 | 
						|
	if (!branch_tracing_enabled)
 | 
						|
		return;
 | 
						|
 | 
						|
	probe_likely_condition(f, val, expect);
 | 
						|
}
 | 
						|
 | 
						|
int enable_branch_tracing(struct trace_array *tr)
 | 
						|
{
 | 
						|
	mutex_lock(&branch_tracing_mutex);
 | 
						|
	branch_tracer = tr;
 | 
						|
	/*
 | 
						|
	 * Must be seen before enabling. The reader is a condition
 | 
						|
	 * where we do not need a matching rmb()
 | 
						|
	 */
 | 
						|
	smp_wmb();
 | 
						|
	branch_tracing_enabled++;
 | 
						|
	mutex_unlock(&branch_tracing_mutex);
 | 
						|
 | 
						|
	return 0;
 | 
						|
}
 | 
						|
 | 
						|
void disable_branch_tracing(void)
 | 
						|
{
 | 
						|
	mutex_lock(&branch_tracing_mutex);
 | 
						|
 | 
						|
	if (!branch_tracing_enabled)
 | 
						|
		goto out_unlock;
 | 
						|
 | 
						|
	branch_tracing_enabled--;
 | 
						|
 | 
						|
 out_unlock:
 | 
						|
	mutex_unlock(&branch_tracing_mutex);
 | 
						|
}
 | 
						|
 | 
						|
/* Start branch tracing into @tr; the enable call's status is not used. */
static void
start_branch_trace(struct trace_array *tr)
{
	enable_branch_tracing(tr);
}
 | 
						|
 | 
						|
/* Stop branch tracing; @tr is not consulted. */
static void
stop_branch_trace(struct trace_array *tr)
{
	disable_branch_tracing();
}
 | 
						|
 | 
						|
/* Tracer init callback: start tracing into @tr. Always returns 0. */
static int
branch_trace_init(struct trace_array *tr)
{
	start_branch_trace(tr);

	return 0;
}
 | 
						|
 | 
						|
/* Tracer reset callback: stop branch tracing. */
static void
branch_trace_reset(struct trace_array *tr)
{
	stop_branch_trace(tr);
}
 | 
						|
 | 
						|
static enum print_line_t trace_branch_print(struct trace_iterator *iter,
 | 
						|
					    int flags)
 | 
						|
{
 | 
						|
	struct trace_branch *field;
 | 
						|
 | 
						|
	trace_assign_type(field, iter->ent);
 | 
						|
 | 
						|
	if (trace_seq_printf(&iter->seq, "[%s] %s:%s:%d\n",
 | 
						|
			     field->correct ? "  ok  " : " MISS ",
 | 
						|
			     field->func,
 | 
						|
			     field->file,
 | 
						|
			     field->line))
 | 
						|
		return TRACE_TYPE_PARTIAL_LINE;
 | 
						|
 | 
						|
	return TRACE_TYPE_HANDLED;
 | 
						|
}
 | 
						|
 | 
						|
/* Write the two header lines that precede branch tracer output. */
static void branch_print_header(struct seq_file *s)
{
	static const char titles[] =
		"#           TASK-PID    CPU#    TIMESTAMP  CORRECT"
		"  FUNC:FILE:LINE\n";
	static const char markers[] =
		"#              | |       |          |         |   "
		"    |\n";

	seq_puts(s, titles);
	seq_puts(s, markers);
}
 | 
						|
 | 
						|
static struct trace_event trace_branch_event = {
 | 
						|
	.type		= TRACE_BRANCH,
 | 
						|
	.trace		= trace_branch_print,
 | 
						|
};
 | 
						|
 | 
						|
/* The "branch" tracer, registered by init_branch_tracer(). */
static struct tracer branch_trace __read_mostly = {
	.name		= "branch",
	.init		= branch_trace_init,
	.reset		= branch_trace_reset,
	.print_header	= branch_print_header,
#ifdef CONFIG_FTRACE_SELFTEST
	.selftest	= trace_selftest_startup_branch,
#endif /* CONFIG_FTRACE_SELFTEST */
};
 | 
						|
 | 
						|
__init static int init_branch_tracer(void)
 | 
						|
{
 | 
						|
	int ret;
 | 
						|
 | 
						|
	ret = register_ftrace_event(&trace_branch_event);
 | 
						|
	if (!ret) {
 | 
						|
		printk(KERN_WARNING "Warning: could not register "
 | 
						|
				    "branch events\n");
 | 
						|
		return 1;
 | 
						|
	}
 | 
						|
	return register_tracer(&branch_trace);
 | 
						|
}
 | 
						|
device_initcall(init_branch_tracer);
 | 
						|
 | 
						|
#else
 | 
						|
/* CONFIG_BRANCH_TRACER is off: there is no tracer to feed. */
static inline void
trace_likely_condition(struct ftrace_branch_data *f, int val, int expect)
{
}
 | 
						|
#endif /* CONFIG_BRANCH_TRACER */
 | 
						|
 | 
						|
void ftrace_likely_update(struct ftrace_branch_data *f, int val, int expect)
 | 
						|
{
 | 
						|
	/*
 | 
						|
	 * I would love to have a trace point here instead, but the
 | 
						|
	 * trace point code is so inundated with unlikely and likely
 | 
						|
	 * conditions that the recursive nightmare that exists is too
 | 
						|
	 * much to try to get working. At least for now.
 | 
						|
	 */
 | 
						|
	trace_likely_condition(f, val, expect);
 | 
						|
 | 
						|
	/* FIXME: Make this atomic! */
 | 
						|
	if (val == expect)
 | 
						|
		f->correct++;
 | 
						|
	else
 | 
						|
		f->incorrect++;
 | 
						|
}
 | 
						|
EXPORT_SYMBOL(ftrace_likely_update);
 | 
						|
 | 
						|
/*
 * Start and end of the annotated branch record table iterated by
 * annotated_branch_stat_start()/annotated_branch_stat_next().
 * NOTE(review): presumably provided by the linker script -- confirm.
 */
extern unsigned long __start_annotated_branch_profile[];
 | 
						|
extern unsigned long __stop_annotated_branch_profile[];
 | 
						|
 | 
						|
/* Print the column titles and the rule line under them. Returns 0. */
static int annotated_branch_stat_headers(struct seq_file *m)
{
	seq_printf(m, " correct incorrect  %% ");
	seq_printf(m,
		   "       Function                "
		   "  File              Line\n"
		   " ------- ---------  - "
		   "       --------                "
		   "  ----              ----\n");

	return 0;
}
 | 
						|
 | 
						|
static inline long get_incorrect_percent(struct ftrace_branch_data *p)
 | 
						|
{
 | 
						|
	long percent;
 | 
						|
 | 
						|
	if (p->correct) {
 | 
						|
		percent = p->incorrect * 100;
 | 
						|
		percent /= p->correct + p->incorrect;
 | 
						|
	} else
 | 
						|
		percent = p->incorrect ? 100 : -1;
 | 
						|
 | 
						|
	return percent;
 | 
						|
}
 | 
						|
 | 
						|
static int branch_stat_show(struct seq_file *m, void *v)
 | 
						|
{
 | 
						|
	struct ftrace_branch_data *p = v;
 | 
						|
	const char *f;
 | 
						|
	long percent;
 | 
						|
 | 
						|
	/* Only print the file, not the path */
 | 
						|
	f = p->file + strlen(p->file);
 | 
						|
	while (f >= p->file && *f != '/')
 | 
						|
		f--;
 | 
						|
	f++;
 | 
						|
 | 
						|
	/*
 | 
						|
	 * The miss is overlayed on correct, and hit on incorrect.
 | 
						|
	 */
 | 
						|
	percent = get_incorrect_percent(p);
 | 
						|
 | 
						|
	seq_printf(m, "%8lu %8lu ",  p->correct, p->incorrect);
 | 
						|
	if (percent < 0)
 | 
						|
		seq_printf(m, "  X ");
 | 
						|
	else
 | 
						|
		seq_printf(m, "%3ld ", percent);
 | 
						|
	seq_printf(m, "%-30.30s %-20.20s %d\n", p->func, f, p->line);
 | 
						|
	return 0;
 | 
						|
}
 | 
						|
 | 
						|
static void *annotated_branch_stat_start(struct tracer_stat *trace)
 | 
						|
{
 | 
						|
	return __start_annotated_branch_profile;
 | 
						|
}
 | 
						|
 | 
						|
static void *
 | 
						|
annotated_branch_stat_next(void *v, int idx)
 | 
						|
{
 | 
						|
	struct ftrace_branch_data *p = v;
 | 
						|
 | 
						|
	++p;
 | 
						|
 | 
						|
	if ((void *)p >= (void *)__stop_annotated_branch_profile)
 | 
						|
		return NULL;
 | 
						|
 | 
						|
	return p;
 | 
						|
}
 | 
						|
 | 
						|
static int annotated_branch_stat_cmp(void *p1, void *p2)
 | 
						|
{
 | 
						|
	struct ftrace_branch_data *a = p1;
 | 
						|
	struct ftrace_branch_data *b = p2;
 | 
						|
 | 
						|
	long percent_a, percent_b;
 | 
						|
 | 
						|
	percent_a = get_incorrect_percent(a);
 | 
						|
	percent_b = get_incorrect_percent(b);
 | 
						|
 | 
						|
	if (percent_a < percent_b)
 | 
						|
		return -1;
 | 
						|
	if (percent_a > percent_b)
 | 
						|
		return 1;
 | 
						|
 | 
						|
	if (a->incorrect < b->incorrect)
 | 
						|
		return -1;
 | 
						|
	if (a->incorrect > b->incorrect)
 | 
						|
		return 1;
 | 
						|
 | 
						|
	/*
 | 
						|
	 * Since the above shows worse (incorrect) cases
 | 
						|
	 * first, we continue that by showing best (correct)
 | 
						|
	 * cases last.
 | 
						|
	 */
 | 
						|
	if (a->correct > b->correct)
 | 
						|
		return -1;
 | 
						|
	if (a->correct < b->correct)
 | 
						|
		return 1;
 | 
						|
 | 
						|
	return 0;
 | 
						|
}
 | 
						|
 | 
						|
static struct tracer_stat annotated_branch_stats = {
 | 
						|
	.name = "branch_annotated",
 | 
						|
	.stat_start = annotated_branch_stat_start,
 | 
						|
	.stat_next = annotated_branch_stat_next,
 | 
						|
	.stat_cmp = annotated_branch_stat_cmp,
 | 
						|
	.stat_headers = annotated_branch_stat_headers,
 | 
						|
	.stat_show = branch_stat_show
 | 
						|
};
 | 
						|
 | 
						|
__init static int init_annotated_branch_stats(void)
 | 
						|
{
 | 
						|
	int ret;
 | 
						|
 | 
						|
	ret = register_stat_tracer(&annotated_branch_stats);
 | 
						|
	if (!ret) {
 | 
						|
		printk(KERN_WARNING "Warning: could not register "
 | 
						|
				    "annotated branches stats\n");
 | 
						|
		return 1;
 | 
						|
	}
 | 
						|
	return 0;
 | 
						|
}
 | 
						|
fs_initcall(init_annotated_branch_stats);
 | 
						|
 | 
						|
#ifdef CONFIG_PROFILE_ALL_BRANCHES
 | 
						|
 | 
						|
/*
 * Start and end of the all-branches record table iterated by
 * all_branch_stat_start()/all_branch_stat_next().
 * NOTE(review): presumably provided by the linker script -- confirm.
 */
extern unsigned long __start_branch_profile[];
 | 
						|
extern unsigned long __stop_branch_profile[];
 | 
						|
 | 
						|
/* Print the miss/hit column titles and the rule line. Returns 0. */
static int all_branch_stat_headers(struct seq_file *m)
{
	seq_printf(m, "   miss      hit    %% ");
	seq_printf(m,
		   "       Function                "
		   "  File              Line\n"
		   " ------- ---------  - "
		   "       --------                "
		   "  ----              ----\n");

	return 0;
}
 | 
						|
 | 
						|
static void *all_branch_stat_start(struct tracer_stat *trace)
 | 
						|
{
 | 
						|
	return __start_branch_profile;
 | 
						|
}
 | 
						|
 | 
						|
static void *
 | 
						|
all_branch_stat_next(void *v, int idx)
 | 
						|
{
 | 
						|
	struct ftrace_branch_data *p = v;
 | 
						|
 | 
						|
	++p;
 | 
						|
 | 
						|
	if ((void *)p >= (void *)__stop_branch_profile)
 | 
						|
		return NULL;
 | 
						|
 | 
						|
	return p;
 | 
						|
}
 | 
						|
 | 
						|
static struct tracer_stat all_branch_stats = {
 | 
						|
	.name = "branch_all",
 | 
						|
	.stat_start = all_branch_stat_start,
 | 
						|
	.stat_next = all_branch_stat_next,
 | 
						|
	.stat_headers = all_branch_stat_headers,
 | 
						|
	.stat_show = branch_stat_show
 | 
						|
};
 | 
						|
 | 
						|
__init static int all_annotated_branch_stats(void)
 | 
						|
{
 | 
						|
	int ret;
 | 
						|
 | 
						|
	ret = register_stat_tracer(&all_branch_stats);
 | 
						|
	if (!ret) {
 | 
						|
		printk(KERN_WARNING "Warning: could not register "
 | 
						|
				    "all branches stats\n");
 | 
						|
		return 1;
 | 
						|
	}
 | 
						|
	return 0;
 | 
						|
}
 | 
						|
fs_initcall(all_annotated_branch_stats);
 | 
						|
#endif /* CONFIG_PROFILE_ALL_BRANCHES */
 |