mirror of
				https://github.com/torvalds/linux.git
				synced 2025-11-04 02:30:34 +02:00 
			
		
		
		
	Impact: use percpu data instead of a global structure Use: static DEFINE_PER_CPU(struct workqueue_global_stats, all_workqueue_stat); instead of allocating a global structure. percpu data also works well on NUMA. Signed-off-by: Lai Jiangshan <laijs@cn.fujitsu.com> Signed-off-by: Steven Rostedt <srostedt@redhat.com> Signed-off-by: Ingo Molnar <mingo@elte.hu>
		
			
				
	
	
		
			281 lines
		
	
	
	
		
			7 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			281 lines
		
	
	
	
		
			7 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 | 
						|
 * Workqueue statistical tracer.
 | 
						|
 *
 | 
						|
 * Copyright (C) 2008 Frederic Weisbecker <fweisbec@gmail.com>
 | 
						|
 *
 | 
						|
 */
 | 
						|
 | 
						|
 | 
						|
#include <trace/workqueue.h>
 | 
						|
#include <linux/list.h>
 | 
						|
#include <linux/percpu.h>
 | 
						|
#include "trace_stat.h"
 | 
						|
#include "trace.h"
 | 
						|
 | 
						|
 | 
						|
/* A cpu workqueue thread */
 | 
						|
struct cpu_workqueue_stats {
 | 
						|
	struct list_head            list;
 | 
						|
/* Useful to know if we print the cpu headers */
 | 
						|
	bool		            first_entry;
 | 
						|
	int		            cpu;
 | 
						|
	pid_t 			    pid;
 | 
						|
/* Can be inserted from interrupt or user context, need to be atomic */
 | 
						|
	atomic_t 	            inserted;
 | 
						|
/*
 | 
						|
 *  Don't need to be atomic, works are serialized in a single workqueue thread
 | 
						|
 *  on a single CPU.
 | 
						|
 */
 | 
						|
	unsigned int 	 	    executed;
 | 
						|
};
 | 
						|
 | 
						|
/* List of workqueue threads on one cpu */
 | 
						|
struct workqueue_global_stats {
 | 
						|
	struct list_head	list;
 | 
						|
	spinlock_t		lock;
 | 
						|
};
 | 
						|
 | 
						|
/* Don't need a global lock because allocated before the workqueues, and
 | 
						|
 * never freed.
 | 
						|
 */
 | 
						|
static DEFINE_PER_CPU(struct workqueue_global_stats, all_workqueue_stat);
 | 
						|
#define workqueue_cpu_stat(cpu) (&per_cpu(all_workqueue_stat, cpu))
 | 
						|
 | 
						|
/* Insertion of a work */
 | 
						|
static void
 | 
						|
probe_workqueue_insertion(struct task_struct *wq_thread,
 | 
						|
			  struct work_struct *work)
 | 
						|
{
 | 
						|
	int cpu = cpumask_first(&wq_thread->cpus_allowed);
 | 
						|
	struct cpu_workqueue_stats *node, *next;
 | 
						|
	unsigned long flags;
 | 
						|
 | 
						|
	spin_lock_irqsave(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
	list_for_each_entry_safe(node, next, &workqueue_cpu_stat(cpu)->list,
 | 
						|
							list) {
 | 
						|
		if (node->pid == wq_thread->pid) {
 | 
						|
			atomic_inc(&node->inserted);
 | 
						|
			goto found;
 | 
						|
		}
 | 
						|
	}
 | 
						|
	pr_debug("trace_workqueue: entry not found\n");
 | 
						|
found:
 | 
						|
	spin_unlock_irqrestore(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
}
 | 
						|
 | 
						|
/* Execution of a work */
 | 
						|
static void
 | 
						|
probe_workqueue_execution(struct task_struct *wq_thread,
 | 
						|
			  struct work_struct *work)
 | 
						|
{
 | 
						|
	int cpu = cpumask_first(&wq_thread->cpus_allowed);
 | 
						|
	struct cpu_workqueue_stats *node, *next;
 | 
						|
	unsigned long flags;
 | 
						|
 | 
						|
	spin_lock_irqsave(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
	list_for_each_entry_safe(node, next, &workqueue_cpu_stat(cpu)->list,
 | 
						|
							list) {
 | 
						|
		if (node->pid == wq_thread->pid) {
 | 
						|
			node->executed++;
 | 
						|
			goto found;
 | 
						|
		}
 | 
						|
	}
 | 
						|
	pr_debug("trace_workqueue: entry not found\n");
 | 
						|
found:
 | 
						|
	spin_unlock_irqrestore(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
}
 | 
						|
 | 
						|
/* Creation of a cpu workqueue thread */
 | 
						|
static void probe_workqueue_creation(struct task_struct *wq_thread, int cpu)
 | 
						|
{
 | 
						|
	struct cpu_workqueue_stats *cws;
 | 
						|
	unsigned long flags;
 | 
						|
 | 
						|
	WARN_ON(cpu < 0 || cpu >= num_possible_cpus());
 | 
						|
 | 
						|
	/* Workqueues are sometimes created in atomic context */
 | 
						|
	cws = kzalloc(sizeof(struct cpu_workqueue_stats), GFP_ATOMIC);
 | 
						|
	if (!cws) {
 | 
						|
		pr_warning("trace_workqueue: not enough memory\n");
 | 
						|
		return;
 | 
						|
	}
 | 
						|
	tracing_record_cmdline(wq_thread);
 | 
						|
 | 
						|
	INIT_LIST_HEAD(&cws->list);
 | 
						|
	cws->cpu = cpu;
 | 
						|
 | 
						|
	cws->pid = wq_thread->pid;
 | 
						|
 | 
						|
	spin_lock_irqsave(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
	if (list_empty(&workqueue_cpu_stat(cpu)->list))
 | 
						|
		cws->first_entry = true;
 | 
						|
	list_add_tail(&cws->list, &workqueue_cpu_stat(cpu)->list);
 | 
						|
	spin_unlock_irqrestore(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
}
 | 
						|
 | 
						|
/* Destruction of a cpu workqueue thread */
 | 
						|
static void probe_workqueue_destruction(struct task_struct *wq_thread)
 | 
						|
{
 | 
						|
	/* Workqueue only execute on one cpu */
 | 
						|
	int cpu = cpumask_first(&wq_thread->cpus_allowed);
 | 
						|
	struct cpu_workqueue_stats *node, *next;
 | 
						|
	unsigned long flags;
 | 
						|
 | 
						|
	spin_lock_irqsave(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
	list_for_each_entry_safe(node, next, &workqueue_cpu_stat(cpu)->list,
 | 
						|
							list) {
 | 
						|
		if (node->pid == wq_thread->pid) {
 | 
						|
			list_del(&node->list);
 | 
						|
			kfree(node);
 | 
						|
			goto found;
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	pr_debug("trace_workqueue: don't find workqueue to destroy\n");
 | 
						|
found:
 | 
						|
	spin_unlock_irqrestore(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
 | 
						|
}
 | 
						|
 | 
						|
static struct cpu_workqueue_stats *workqueue_stat_start_cpu(int cpu)
 | 
						|
{
 | 
						|
	unsigned long flags;
 | 
						|
	struct cpu_workqueue_stats *ret = NULL;
 | 
						|
 | 
						|
 | 
						|
	spin_lock_irqsave(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
 | 
						|
	if (!list_empty(&workqueue_cpu_stat(cpu)->list))
 | 
						|
		ret = list_entry(workqueue_cpu_stat(cpu)->list.next,
 | 
						|
				 struct cpu_workqueue_stats, list);
 | 
						|
 | 
						|
	spin_unlock_irqrestore(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
 | 
						|
	return ret;
 | 
						|
}
 | 
						|
 | 
						|
static void *workqueue_stat_start(void)
 | 
						|
{
 | 
						|
	int cpu;
 | 
						|
	void *ret = NULL;
 | 
						|
 | 
						|
	for_each_possible_cpu(cpu) {
 | 
						|
		ret = workqueue_stat_start_cpu(cpu);
 | 
						|
		if (ret)
 | 
						|
			return ret;
 | 
						|
	}
 | 
						|
	return NULL;
 | 
						|
}
 | 
						|
 | 
						|
static void *workqueue_stat_next(void *prev, int idx)
 | 
						|
{
 | 
						|
	struct cpu_workqueue_stats *prev_cws = prev;
 | 
						|
	int cpu = prev_cws->cpu;
 | 
						|
	unsigned long flags;
 | 
						|
	void *ret = NULL;
 | 
						|
 | 
						|
	spin_lock_irqsave(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
	if (list_is_last(&prev_cws->list, &workqueue_cpu_stat(cpu)->list)) {
 | 
						|
		spin_unlock_irqrestore(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
		for (++cpu ; cpu < num_possible_cpus(); cpu++) {
 | 
						|
			ret = workqueue_stat_start_cpu(cpu);
 | 
						|
			if (ret)
 | 
						|
				return ret;
 | 
						|
		}
 | 
						|
		return NULL;
 | 
						|
	}
 | 
						|
	spin_unlock_irqrestore(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
 | 
						|
	return list_entry(prev_cws->list.next, struct cpu_workqueue_stats,
 | 
						|
			  list);
 | 
						|
}
 | 
						|
 | 
						|
static int workqueue_stat_show(struct seq_file *s, void *p)
 | 
						|
{
 | 
						|
	struct cpu_workqueue_stats *cws = p;
 | 
						|
	unsigned long flags;
 | 
						|
	int cpu = cws->cpu;
 | 
						|
 | 
						|
	seq_printf(s, "%3d %6d     %6u       %s\n", cws->cpu,
 | 
						|
		   atomic_read(&cws->inserted),
 | 
						|
		   cws->executed,
 | 
						|
		   trace_find_cmdline(cws->pid));
 | 
						|
 | 
						|
	spin_lock_irqsave(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
	if (&cws->list == workqueue_cpu_stat(cpu)->list.next)
 | 
						|
		seq_printf(s, "\n");
 | 
						|
	spin_unlock_irqrestore(&workqueue_cpu_stat(cpu)->lock, flags);
 | 
						|
 | 
						|
	return 0;
 | 
						|
}
 | 
						|
 | 
						|
static int workqueue_stat_headers(struct seq_file *s)
 | 
						|
{
 | 
						|
	seq_printf(s, "# CPU  INSERTED  EXECUTED   NAME\n");
 | 
						|
	seq_printf(s, "# |      |         |          |\n\n");
 | 
						|
	return 0;
 | 
						|
}
 | 
						|
 | 
						|
struct tracer_stat workqueue_stats __read_mostly = {
 | 
						|
	.name = "workqueues",
 | 
						|
	.stat_start = workqueue_stat_start,
 | 
						|
	.stat_next = workqueue_stat_next,
 | 
						|
	.stat_show = workqueue_stat_show,
 | 
						|
	.stat_headers = workqueue_stat_headers
 | 
						|
};
 | 
						|
 | 
						|
 | 
						|
int __init stat_workqueue_init(void)
 | 
						|
{
 | 
						|
	if (register_stat_tracer(&workqueue_stats)) {
 | 
						|
		pr_warning("Unable to register workqueue stat tracer\n");
 | 
						|
		return 1;
 | 
						|
	}
 | 
						|
 | 
						|
	return 0;
 | 
						|
}
 | 
						|
fs_initcall(stat_workqueue_init);
 | 
						|
 | 
						|
/*
 | 
						|
 * Workqueues are created very early, just after pre-smp initcalls.
 | 
						|
 * So we must register our tracepoints at this stage.
 | 
						|
 */
 | 
						|
int __init trace_workqueue_early_init(void)
 | 
						|
{
 | 
						|
	int ret, cpu;
 | 
						|
 | 
						|
	ret = register_trace_workqueue_insertion(probe_workqueue_insertion);
 | 
						|
	if (ret)
 | 
						|
		goto out;
 | 
						|
 | 
						|
	ret = register_trace_workqueue_execution(probe_workqueue_execution);
 | 
						|
	if (ret)
 | 
						|
		goto no_insertion;
 | 
						|
 | 
						|
	ret = register_trace_workqueue_creation(probe_workqueue_creation);
 | 
						|
	if (ret)
 | 
						|
		goto no_execution;
 | 
						|
 | 
						|
	ret = register_trace_workqueue_destruction(probe_workqueue_destruction);
 | 
						|
	if (ret)
 | 
						|
		goto no_creation;
 | 
						|
 | 
						|
	for_each_possible_cpu(cpu) {
 | 
						|
		spin_lock_init(&workqueue_cpu_stat(cpu)->lock);
 | 
						|
		INIT_LIST_HEAD(&workqueue_cpu_stat(cpu)->list);
 | 
						|
	}
 | 
						|
 | 
						|
	return 0;
 | 
						|
 | 
						|
no_creation:
 | 
						|
	unregister_trace_workqueue_creation(probe_workqueue_creation);
 | 
						|
no_execution:
 | 
						|
	unregister_trace_workqueue_execution(probe_workqueue_execution);
 | 
						|
no_insertion:
 | 
						|
	unregister_trace_workqueue_insertion(probe_workqueue_insertion);
 | 
						|
out:
 | 
						|
	pr_warning("trace_workqueue: unable to trace workqueues\n");
 | 
						|
 | 
						|
	return 1;
 | 
						|
}
 | 
						|
early_initcall(trace_workqueue_early_init);
 |