/*
 * trace stack traces
 *
 * Copyright (C) 2007 Steven Rostedt <srostedt@redhat.com>
 * Copyright (C) 2008 Ingo Molnar <mingo@redhat.com>
 * Copyright (C) 2004, 2005, Soeren Sandmann
 */
#include <linux/kallsyms.h>
I
Ingo Molnar 已提交
9 10
#include <linux/debugfs.h>
#include <linux/hrtimer.h>
I
Ingo Molnar 已提交
11 12
#include <linux/uaccess.h>
#include <linux/ftrace.h>
I
Ingo Molnar 已提交
13
#include <linux/module.h>
14
#include <linux/irq.h>
I
Ingo Molnar 已提交
15
#include <linux/fs.h>
I
Ingo Molnar 已提交
16 17 18

#include "trace.h"

19
static struct trace_array	*sysprof_trace;
I
Ingo Molnar 已提交
20 21
static int __read_mostly	tracer_enabled;

22
/*
I
Ingo Molnar 已提交
23
 * 1 msec sample interval by default:
24
 */
I
Ingo Molnar 已提交
25
static unsigned long sample_period = 1000000;
I
Ingo Molnar 已提交
26
static const unsigned int sample_max_depth = 512;
I
Ingo Molnar 已提交
27

I
Ingo Molnar 已提交
28
static DEFINE_MUTEX(sample_timer_lock);
I
Ingo Molnar 已提交
29 30 31 32 33
/*
 * Per CPU hrtimers that do the profiling:
 */
static DEFINE_PER_CPU(struct hrtimer, stack_trace_hrtimer);

34 35 36 37 38 39 40
/*
 * One user-space stack frame as read by copy_stack_frame(): the frame
 * pointer used for the next iteration of the walk, followed by a return
 * address. The struct is filled by a raw copy from user memory, so the
 * field order is the in-memory layout and must not be changed.
 */
struct stack_frame {
	const void __user	*next_fp;
	unsigned long		return_address;
};

/*
 * Read one stack frame from the user address @fp into @frame.
 *
 * The copy is done with page faults disabled, using the in-atomic
 * copy helper.
 *
 * Returns 1 if the whole frame was copied, 0 if @fp fails access_ok()
 * or the copy did not complete.
 */
static int copy_stack_frame(const void __user *fp, struct stack_frame *frame)
{
	int copied;

	if (!access_ok(VERIFY_READ, fp, sizeof(*frame)))
		return 0;

	pagefault_disable();
	copied = !__copy_from_user_inatomic(frame, fp, sizeof(*frame));
	pagefault_enable();

	return copied;
}

static void timer_notify(struct pt_regs *regs, int cpu)
{
	struct trace_array_cpu *data;
	struct stack_frame frame;
	struct trace_array *tr;
I
Ingo Molnar 已提交
60
	const void __user *fp;
61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83
	int is_user;
	int i;

	if (!regs)
		return;

	tr = sysprof_trace;
	data = tr->data[cpu];
	is_user = user_mode(regs);

	if (!current || current->pid == 0)
		return;

	if (is_user && current->state != TASK_RUNNING)
		return;

	if (!is_user) {
		/* kernel */
		ftrace(tr, data, current->pid, 1, 0);
		return;

	}

T
Thomas Gleixner 已提交
84
	__trace_special(tr, data, 0, current->pid, regs->ip);
85

I
Ingo Molnar 已提交
86
	fp = (void __user *)regs->bp;
87

I
Ingo Molnar 已提交
88
	for (i = 0; i < sample_max_depth; i++) {
I
Ingo Molnar 已提交
89 90 91
		frame.next_fp = 0;
		frame.return_address = 0;
		if (!copy_stack_frame(fp, &frame))
92
			break;
I
Ingo Molnar 已提交
93
		if ((unsigned long)fp < regs->sp)
94 95
			break;

T
Thomas Gleixner 已提交
96
		__trace_special(tr, data, 1, frame.return_address,
I
Ingo Molnar 已提交
97 98
			      (unsigned long)fp);
		fp = frame.next_fp;
99 100
	}

T
Thomas Gleixner 已提交
101
	__trace_special(tr, data, 2, current->pid, i);
102

I
Ingo Molnar 已提交
103 104 105
	/*
	 * Special trace entry if we overflow the max depth:
	 */
I
Ingo Molnar 已提交
106
	if (i == sample_max_depth)
T
Thomas Gleixner 已提交
107
		__trace_special(tr, data, -1, -1, -1);
108 109
}

I
Ingo Molnar 已提交
110 111 112
static enum hrtimer_restart stack_trace_timer_fn(struct hrtimer *hrtimer)
{
	/* trace here */
113
	timer_notify(get_irq_regs(), smp_processor_id());
I
Ingo Molnar 已提交
114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157

	hrtimer_forward_now(hrtimer, ns_to_ktime(sample_period));

	return HRTIMER_RESTART;
}

/*
 * Initialize the sampling hrtimer that belongs to @cpu and arm it to
 * fire sample_period nanoseconds from now.
 */
static void start_stack_timer(int cpu)
{
	struct hrtimer *timer = &per_cpu(stack_trace_hrtimer, cpu);

	hrtimer_init(timer, CLOCK_MONOTONIC, HRTIMER_MODE_REL);
	timer->cb_mode = HRTIMER_CB_IRQSAFE_NO_SOFTIRQ;
	timer->function = stack_trace_timer_fn;

	hrtimer_start(timer, ns_to_ktime(sample_period), HRTIMER_MODE_REL);
}

/*
 * Start the sampling timer of every online CPU.
 *
 * The calling task's allowed-CPU mask is narrowed to each CPU in turn
 * before that CPU's timer is started (presumably so the timer is armed
 * on the CPU it samples -- confirm against hrtimer semantics), and the
 * original mask is put back afterwards.
 */
static void start_stack_timers(void)
{
	cpumask_t orig_allowed = current->cpus_allowed;
	int cpu;

	for_each_online_cpu(cpu) {
		set_cpus_allowed_ptr(current, &cpumask_of_cpu(cpu));
		start_stack_timer(cpu);
	}

	set_cpus_allowed_ptr(current, &orig_allowed);
}

/* Cancel the sampling hrtimer that belongs to @cpu. */
static void stop_stack_timer(int cpu)
{
	hrtimer_cancel(&per_cpu(stack_trace_hrtimer, cpu));
}

static void stop_stack_timers(void)
{
	int cpu;

	for_each_online_cpu(cpu)
		stop_stack_timer(cpu);
}

T
Thomas Gleixner 已提交
158
static void stack_reset(struct trace_array *tr)
I
Ingo Molnar 已提交
159 160 161 162 163 164 165 166 167
{
	int cpu;

	tr->time_start = ftrace_now(tr->cpu);

	for_each_online_cpu(cpu)
		tracing_reset(tr->data[cpu]);
}

T
Thomas Gleixner 已提交
168
static void start_stack_trace(struct trace_array *tr)
I
Ingo Molnar 已提交
169
{
I
Ingo Molnar 已提交
170
	mutex_lock(&sample_timer_lock);
I
Ingo Molnar 已提交
171
	stack_reset(tr);
I
Ingo Molnar 已提交
172
	start_stack_timers();
I
Ingo Molnar 已提交
173
	tracer_enabled = 1;
I
Ingo Molnar 已提交
174
	mutex_unlock(&sample_timer_lock);
I
Ingo Molnar 已提交
175 176
}

T
Thomas Gleixner 已提交
177
static void stop_stack_trace(struct trace_array *tr)
I
Ingo Molnar 已提交
178
{
I
Ingo Molnar 已提交
179
	mutex_lock(&sample_timer_lock);
I
Ingo Molnar 已提交
180
	stop_stack_timers();
I
Ingo Molnar 已提交
181
	tracer_enabled = 0;
I
Ingo Molnar 已提交
182
	mutex_unlock(&sample_timer_lock);
I
Ingo Molnar 已提交
183 184
}

T
Thomas Gleixner 已提交
185
static void stack_trace_init(struct trace_array *tr)
I
Ingo Molnar 已提交
186
{
187
	sysprof_trace = tr;
I
Ingo Molnar 已提交
188 189 190 191 192

	if (tr->ctrl)
		start_stack_trace(tr);
}

T
Thomas Gleixner 已提交
193
static void stack_trace_reset(struct trace_array *tr)
I
Ingo Molnar 已提交
194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214
{
	if (tr->ctrl)
		stop_stack_trace(tr);
}

/*
 * Tracer ->ctrl_update hook: follow the new value of tr->ctrl by
 * starting or stopping the sampler.
 */
static void stack_trace_ctrl_update(struct trace_array *tr)
{
	if (!tr->ctrl) {
		stop_stack_trace(tr);
		return;
	}

	/* Starting a new trace also resets the buffers. */
	start_stack_trace(tr);
}

/* Tracer descriptor registered under the name "sysprof". */
static struct tracer stack_trace __read_mostly =
{
	.name		= "sysprof",
	.init		= stack_trace_init,
	.reset		= stack_trace_reset,
	.ctrl_update	= stack_trace_ctrl_update,
#ifdef CONFIG_FTRACE_SELFTEST
	.selftest	= trace_selftest_startup_sysprof,
#endif
};

__init static int init_stack_trace(void)
{
	return register_tracer(&stack_trace);
}
device_initcall(init_stack_trace);
I
Ingo Molnar 已提交
224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284

/*
 * Size in bytes of the on-stack text buffers the sample-period read and
 * write handlers use to hold a decimal number.
 */
#define MAX_LONG_DIGITS 22

/*
 * debugfs read handler: report the current sample period, converted
 * from nanoseconds to microseconds, as a decimal number followed by a
 * newline.
 */
static ssize_t
sysprof_sample_read(struct file *filp, char __user *ubuf,
		    size_t cnt, loff_t *ppos)
{
	char text[MAX_LONG_DIGITS];
	int len = sprintf(text, "%ld\n", nsecs_to_usecs(sample_period));

	return simple_read_from_buffer(ubuf, cnt, ppos, text, len);
}

/*
 * debugfs write handler: set the sample period from a decimal number of
 * microseconds.
 *
 * At most MAX_LONG_DIGITS-1 bytes of the input are consumed. The value
 * is clamped to a minimum of 100 usecs and to a maximum that still fits
 * in sample_period once converted to nanoseconds.
 *
 * The per-CPU timers are only restarted when the tracer is currently
 * enabled; otherwise the new period is just stored and takes effect the
 * next time start_stack_trace() arms the timers. Restarting them
 * unconditionally would begin sampling with no tracer active.
 *
 * Returns the number of bytes consumed, or -EFAULT if the user buffer
 * could not be read.
 */
static ssize_t
sysprof_sample_write(struct file *filp, const char __user *ubuf,
		     size_t cnt, loff_t *ppos)
{
	char buf[MAX_LONG_DIGITS];
	unsigned long val;

	if (cnt > MAX_LONG_DIGITS-1)
		cnt = MAX_LONG_DIGITS-1;

	if (copy_from_user(buf, ubuf, cnt))
		return -EFAULT;

	buf[cnt] = 0;

	val = simple_strtoul(buf, NULL, 10);
	/*
	 * Enforce a minimum sample period of 100 usecs:
	 */
	if (val < 100)
		val = 100;
	/*
	 * Keep the usecs -> nsecs conversion below from wrapping around,
	 * which could yield a period shorter than the minimum:
	 */
	if (val > ~0UL / 1000)
		val = ~0UL / 1000;

	mutex_lock(&sample_timer_lock);
	if (tracer_enabled) {
		stop_stack_timers();
		sample_period = val * 1000;
		start_stack_timers();
	} else {
		sample_period = val * 1000;
	}
	mutex_unlock(&sample_timer_lock);

	return cnt;
}

static struct file_operations sysprof_sample_fops = {
	.read		= sysprof_sample_read,
	.write		= sysprof_sample_write,
};

/*
 * Create the "sysprof_sample_period" debugfs file (mode 0644) inside the
 * directory @d_tracer. A warning is printed if the file cannot be
 * created; the failure is not reported to the caller.
 */
void init_tracer_sysprof_debugfs(struct dentry *d_tracer)
{
	struct dentry *entry;

	entry = debugfs_create_file("sysprof_sample_period", 0644,
			d_tracer, NULL, &sysprof_sample_fops);
	if (!entry)
		pr_warning("Could not create debugfs 'sysprof_sample_period' entry\n");
}