ftrace.c 10.6 KB
Newer Older
1 2 3 4
/*
 * Code for replacing ftrace calls with jumps.
 *
 * Copyright (C) 2007-2008 Steven Rostedt <srostedt@redhat.com>
 * Copyright (C) 2009, 2010 DSLab, Lanzhou University, China
 * Author: Wu Zhangjin <wuzhangjin@gmail.com>
 *
 * Thanks goes to Steven Rostedt for writing the original x86 version.
 */

#include <linux/uaccess.h>
#include <linux/init.h>
#include <linux/ftrace.h>
R
Ralf Baechle 已提交
14
#include <linux/syscalls.h>
15

16 17
#include <asm/asm.h>
#include <asm/asm-offsets.h>
18
#include <asm/cacheflush.h>
R
Ralf Baechle 已提交
19
#include <asm/syscall.h>
20
#include <asm/uasm.h>
R
Ralf Baechle 已提交
21
#include <asm/unistd.h>
22

23
#include <asm-generic/sections.h>
24

25 26 27 28 29 30
/*
 * Number of instructions skipped by the "b 1f" that replaces the first
 * instruction of a module call site (see INSN_B_1F below): 5 when
 * KBUILD_MCOUNT_RA_ADDRESS is used on a 32-bit kernel, 4 otherwise.
 */
#if defined(KBUILD_MCOUNT_RA_ADDRESS) && defined(CONFIG_32BIT)
#define MCOUNT_OFFSET_INSNS 5
#else
#define MCOUNT_OFFSET_INSNS 4
#endif

31 32
#ifdef CONFIG_DYNAMIC_FTRACE

33 34 35 36 37 38
/*
 * Arch override because MIPS doesn't need to run this from stop_machine().
 * @command is forwarded unchanged to ftrace_modify_all_code().
 */
void arch_ftrace_update_code(int command)
{
	ftrace_modify_all_code(command);
}

39 40
#endif

41 42 43 44
#ifdef CONFIG_DYNAMIC_FTRACE

/*
 * Instruction encodings used when patching call sites.
 *
 * JAL/ADDR_MASK describe the "jal" format: the opcode lives in bits 31..26
 * and the word-aligned target (address >> 2) in bits 25..0.
 * JUMP_RANGE_MASK keeps the low 28 bits of an address.
 */
#define JAL 0x0c000000		/* jump & link: ip --> ra, jump to target */
#define ADDR_MASK 0x03ffffff	/*  op_code|addr : 31...26|25 ....0 */
#define JUMP_RANGE_MASK ((1UL << 28) - 1)

#define INSN_NOP 0x00000000	/* nop */
/* Encode "jal addr": drop the two low address bits, keep 26 target bits */
#define INSN_JAL(addr)	\
	((unsigned int)(JAL | (((addr) >> 2) & ADDR_MASK)))

static unsigned int insn_jal_ftrace_caller __read_mostly;
52
static unsigned int insn_la_mcount[2] __read_mostly;
53 54 55 56 57 58 59
static unsigned int insn_j_ftrace_graph_caller __maybe_unused __read_mostly;

static inline void ftrace_dyn_arch_init_insns(void)
{
	u32 *buf;
	unsigned int v1;

60
	/* la v1, _mcount */
61
	v1 = 3;
62 63
	buf = (u32 *)&insn_la_mcount[0];
	UASM_i_LA(&buf, v1, MCOUNT_ADDR);
64 65 66

	/* jal (ftrace_caller + 8), jump over the first two instruction */
	buf = (u32 *)&insn_jal_ftrace_caller;
67
	uasm_i_jal(&buf, (FTRACE_ADDR + 8) & JUMP_RANGE_MASK);
68 69 70 71

#ifdef CONFIG_FUNCTION_GRAPH_TRACER
	/* j ftrace_graph_caller */
	buf = (u32 *)&insn_j_ftrace_graph_caller;
72
	uasm_i_j(&buf, (unsigned long)ftrace_graph_caller & JUMP_RANGE_MASK);
73 74
#endif
}
75 76 77

static int ftrace_modify_code(unsigned long ip, unsigned int new_code)
{
78
	int faulted;
79
	mm_segment_t old_fs;
80 81 82 83 84 85

	/* *(unsigned int *)ip = new_code; */
	safe_store_code(new_code, ip, faulted);

	if (unlikely(faulted))
		return -EFAULT;
86

87 88
	old_fs = get_fs();
	set_fs(get_ds());
89
	flush_icache_range(ip, ip + 8);
90
	set_fs(old_fs);
91 92 93 94

	return 0;
}

95 96 97 98 99
#ifndef CONFIG_64BIT
static int ftrace_modify_code_2(unsigned long ip, unsigned int new_code1,
				unsigned int new_code2)
{
	int faulted;
100
	mm_segment_t old_fs;
101 102 103 104

	safe_store_code(new_code1, ip, faulted);
	if (unlikely(faulted))
		return -EFAULT;
105 106 107

	ip += 4;
	safe_store_code(new_code2, ip, faulted);
108 109
	if (unlikely(faulted))
		return -EFAULT;
110 111 112 113

	ip -= 4;
	old_fs = get_fs();
	set_fs(get_ds());
114
	flush_icache_range(ip, ip + 8);
115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140
	set_fs(old_fs);

	return 0;
}

/*
 * Same as ftrace_modify_code_2() but the words are written in reverse
 * order: @new_code2 at @ip + 4 first, then @new_code1 at @ip.
 *
 * Returns 0 on success, or -EFAULT as soon as one of the stores faults.
 */
static int ftrace_modify_code_2r(unsigned long ip, unsigned int new_code1,
				 unsigned int new_code2)
{
	int faulted;
	mm_segment_t old_fs;

	ip += 4;
	safe_store_code(new_code2, ip, faulted);
	if (unlikely(faulted))
		return -EFAULT;

	ip -= 4;
	safe_store_code(new_code1, ip, faulted);
	if (unlikely(faulted))
		return -EFAULT;

	old_fs = get_fs();
	set_fs(get_ds());
	flush_icache_range(ip, ip + 8);
	set_fs(old_fs);

	return 0;
}
#endif

145 146 147 148 149 150 151
/*
 * The details about the calling site of mcount on MIPS
 *
 * 1. For kernel:
 *
 * move at, ra
 * jal _mcount		--> nop
 *  sub sp, sp, 8	--> nop  (CONFIG_32BIT)
 *
 * 2. For modules:
 *
 * 2.1 For KBUILD_MCOUNT_RA_ADDRESS and CONFIG_32BIT
 *
 * lui v1, hi_16bit_of_mcount	     --> b 1f (0x10000005)
 * addiu v1, v1, low_16bit_of_mcount --> nop  (CONFIG_32BIT)
 * move at, ra
 * move $12, ra_address
 * jalr v1
 *  sub sp, sp, 8
 *				    1: offset = 5 instructions
 * 2.2 For the Other situations
 *
 * lui v1, hi_16bit_of_mcount	     --> b 1f (0x10000004)
 * addiu v1, v1, low_16bit_of_mcount --> nop  (CONFIG_32BIT)
 * move at, ra
 * jalr v1
 *  nop | move $12, ra_address | sub sp, sp, 8
 *				    1: offset = 4 instructions
 */

#define INSN_B_1F (0x10000000 | MCOUNT_OFFSET_INSNS)

177 178 179 180 181 182
int ftrace_make_nop(struct module *mod,
		    struct dyn_ftrace *rec, unsigned long addr)
{
	unsigned int new;
	unsigned long ip = rec->ip;

183
	/*
184 185
	 * If ip is in kernel space, no long call, otherwise, long call is
	 * needed.
186
	 */
187
	new = core_kernel_text(ip) ? INSN_NOP : INSN_B_1F;
188
#ifdef CONFIG_64BIT
189
	return ftrace_modify_code(ip, new);
190 191 192 193 194 195 196 197 198 199
#else
	/*
	 * On 32 bit MIPS platforms, gcc adds a stack adjust
	 * instruction in the delay slot after the branch to
	 * mcount and expects mcount to restore the sp on return.
	 * This is based on a legacy API and does nothing but
	 * waste instructions so it's being removed at runtime.
	 */
	return ftrace_modify_code_2(ip, new, INSN_NOP);
#endif
200 201 202 203 204 205 206
}

int ftrace_make_call(struct dyn_ftrace *rec, unsigned long addr)
{
	unsigned int new;
	unsigned long ip = rec->ip;

207
	new = core_kernel_text(ip) ? insn_jal_ftrace_caller : insn_la_mcount[0];
208

209
#ifdef CONFIG_64BIT
210
	return ftrace_modify_code(ip, new);
211
#else
212
	return ftrace_modify_code_2r(ip, new, core_kernel_text(ip) ?
213 214
						INSN_NOP : insn_la_mcount[1]);
#endif
215 216 217 218 219 220 221 222
}

/* Address of the patchable instruction at the ftrace_call label */
#define FTRACE_CALL_IP ((unsigned long)(&ftrace_call))

/*
 * Point the instruction at ftrace_call to @func by writing "jal func" there.
 *
 * Returns 0 on success, -EFAULT if the store faulted.
 */
int ftrace_update_ftrace_func(ftrace_func_t func)
{
	unsigned int new;

	new = INSN_JAL((unsigned long)func);

	return ftrace_modify_code(FTRACE_CALL_IP, new);
}

228
/*
 * Boot-time setup for dynamic ftrace: encode the instruction templates and
 * patch the first instruction of _mcount to a nop.
 *
 * Always returns 0; the result of the _mcount patch is not checked.
 */
int __init ftrace_dyn_arch_init(void)
{
	/* Encode the instructions when booting */
	ftrace_dyn_arch_init_insns();

	/* Remove "b ftrace_stub" to ensure ftrace_caller() is executed */
	ftrace_modify_code(MCOUNT_ADDR, INSN_NOP);

	return 0;
}
238
#endif	/* CONFIG_DYNAMIC_FTRACE */
239 240 241

#ifdef CONFIG_FUNCTION_GRAPH_TRACER

242 243 244 245 246 247 248 249
#ifdef CONFIG_DYNAMIC_FTRACE

extern void ftrace_graph_call(void);
#define FTRACE_GRAPH_CALL_IP	((unsigned long)(&ftrace_graph_call))

int ftrace_enable_ftrace_graph_caller(void)
{
	return ftrace_modify_code(FTRACE_GRAPH_CALL_IP,
250
			insn_j_ftrace_graph_caller);
251 252 253 254
}

int ftrace_disable_ftrace_graph_caller(void)
{
255
	return ftrace_modify_code(FTRACE_GRAPH_CALL_IP, INSN_NOP);
256 257
}

258
#endif	/* CONFIG_DYNAMIC_FTRACE */
259

260
#ifndef KBUILD_MCOUNT_RA_ADDRESS
261

R
Ralf Baechle 已提交
262 263
/*
 * Bit patterns used to recognise stores relative to sp in a function
 * prologue.  The constants are unsigned so that the shift into bit 31 is
 * well defined (shifting the signed value 0xafbf left by 16 overflows int).
 */
#define S_RA_SP (0xafbfU << 16)	/* s{d,w} ra, offset(sp) */
#define S_R_SP	(0xafb0U << 16)	/* s{d,w} R, offset(sp) */
#define OFFSET_MASK	0xffff	/* stack offset range: 0 ~ PT_SIZE */

266 267
unsigned long ftrace_get_parent_ra_addr(unsigned long self_ra, unsigned long
		old_parent_ra, unsigned long parent_ra_addr, unsigned long fp)
268
{
269
	unsigned long sp, ip, tmp;
270
	unsigned int code;
271
	int faulted;
272

273
	/*
274
	 * For module, move the ip from the return address after the
275 276
	 * instruction "lui v1, hi_16bit_of_mcount"(offset is 24), but for
	 * kernel, move after the instruction "move ra, at"(offset is 16)
277
	 */
278
	ip = self_ra - (core_kernel_text(self_ra) ? 16 : 24);
279

280 281 282 283
	/*
	 * search the text until finding the non-store instruction or "s{d,w}
	 * ra, offset(sp)" instruction
	 */
284
	do {
285 286 287 288 289
		/* get the code at "ip": code = *(unsigned int *)ip; */
		safe_load_code(code, ip, faulted);

		if (unlikely(faulted))
			return 0;
290 291
		/*
		 * If we hit the non-store instruction before finding where the
292
		 * ra is stored, then this is a leaf function and it does not
293 294
		 * store the ra on the stack
		 */
295
		if ((code & S_R_SP) != S_R_SP)
296
			return parent_ra_addr;
297

298 299 300
		/* Move to the next instruction */
		ip -= 4;
	} while ((code & S_RA_SP) != S_RA_SP);
301 302

	sp = fp + (code & OFFSET_MASK);
303

304 305
	/* tmp = *(unsigned long *)sp; */
	safe_load_stack(tmp, sp, faulted);
306 307
	if (unlikely(faulted))
		return 0;
308

309
	if (tmp == old_parent_ra)
310 311 312 313
		return sp;
	return 0;
}

314
#endif	/* !KBUILD_MCOUNT_RA_ADDRESS */
315

316 317 318 319
/*
 * Hook the return address and push it in the stack of return addrs
 * in current thread info.
 */
320
void prepare_ftrace_return(unsigned long *parent_ra_addr, unsigned long self_ra,
321 322
			   unsigned long fp)
{
323
	unsigned long old_parent_ra;
324 325 326
	struct ftrace_graph_ent trace;
	unsigned long return_hooker = (unsigned long)
	    &return_to_handler;
327
	int faulted, insns;
328

329 330 331
	if (unlikely(ftrace_graph_is_dead()))
		return;

332 333 334
	if (unlikely(atomic_read(&current->tracing_graph_pause)))
		return;

335
	/*
336 337
	 * "parent_ra_addr" is the stack address saved the return address of
	 * the caller of _mcount.
338 339 340 341 342 343
	 *
	 * if the gcc < 4.5, a leaf function does not save the return address
	 * in the stack address, so, we "emulate" one in _mcount's stack space,
	 * and hijack it directly, but for a non-leaf function, it save the
	 * return address to the its own stack space, we can not hijack it
	 * directly, but need to find the real stack address,
344
	 * ftrace_get_parent_addr() does it!
345 346 347 348 349
	 *
	 * if gcc>= 4.5, with the new -mmcount-ra-address option, for a
	 * non-leaf function, the location of the return address will be saved
	 * to $12 for us, and for a leaf function, only put a zero into $12. we
	 * do it in ftrace_graph_caller of mcount.S.
350 351
	 */

352 353
	/* old_parent_ra = *parent_ra_addr; */
	safe_load_stack(old_parent_ra, parent_ra_addr, faulted);
354 355
	if (unlikely(faulted))
		goto out;
356
#ifndef KBUILD_MCOUNT_RA_ADDRESS
357 358
	parent_ra_addr = (unsigned long *)ftrace_get_parent_ra_addr(self_ra,
			old_parent_ra, (unsigned long)parent_ra_addr, fp);
359 360 361 362
	/*
	 * If fails when getting the stack address of the non-leaf function's
	 * ra, stop function graph tracer and return
	 */
363
	if (parent_ra_addr == 0)
364
		goto out;
365
#endif
366 367
	/* *parent_ra_addr = return_hooker; */
	safe_store_stack(return_hooker, parent_ra_addr, faulted);
368 369
	if (unlikely(faulted))
		goto out;
370

371 372
	if (ftrace_push_return_trace(old_parent_ra, self_ra, &trace.depth, fp,
				     NULL) == -EBUSY) {
373
		*parent_ra_addr = old_parent_ra;
374 375 376
		return;
	}

377 378 379 380 381 382
	/*
	 * Get the recorded ip of the current mcount calling site in the
	 * __mcount_loc section, which will be used to filter the function
	 * entries configured through the tracing/set_graph_function interface.
	 */

383
	insns = core_kernel_text(self_ra) ? 2 : MCOUNT_OFFSET_INSNS + 1;
384
	trace.func = self_ra - (MCOUNT_INSN_SIZE * insns);
385 386 387 388

	/* Only trace if the calling function expects to */
	if (!ftrace_graph_entry(&trace)) {
		current->curr_ret_stack--;
389
		*parent_ra_addr = old_parent_ra;
390
	}
391 392 393 394
	return;
out:
	ftrace_graph_stop();
	WARN_ON(1);
395
}
396
#endif	/* CONFIG_FUNCTION_GRAPH_TRACER */
R
Ralf Baechle 已提交
397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412

#ifdef CONFIG_FTRACE_SYSCALLS

#ifdef CONFIG_32BIT
/*
 * Return the sys_call_table entry for syscall number @nr, indexed relative
 * to __NR_O32_Linux.  @nr is not range-checked here.
 */
unsigned long __init arch_syscall_addr(int nr)
{
	return (unsigned long)sys_call_table[nr - __NR_O32_Linux];
}
#endif

#ifdef CONFIG_64BIT

/*
 * Return the handler address for syscall number @nr on a 64-bit kernel.
 *
 * @nr is matched against the N32 (CONFIG_MIPS32_N32), native 64-bit and
 * O32 (CONFIG_MIPS32_O32) number ranges in that order, and the matching
 * table is indexed relative to the base of its range.  A number outside all
 * enabled ranges yields the address of sys_ni_syscall.
 */
unsigned long __init arch_syscall_addr(int nr)
{
#ifdef CONFIG_MIPS32_N32
	if (nr >= __NR_N32_Linux && nr <= __NR_N32_Linux + __NR_N32_Linux_syscalls)
		return (unsigned long)sysn32_call_table[nr - __NR_N32_Linux];
#endif
	if (nr >= __NR_64_Linux  && nr <= __NR_64_Linux + __NR_64_Linux_syscalls)
		return (unsigned long)sys_call_table[nr - __NR_64_Linux];
#ifdef CONFIG_MIPS32_O32
	if (nr >= __NR_O32_Linux && nr <= __NR_O32_Linux + __NR_O32_Linux_syscalls)
		return (unsigned long)sys32_call_table[nr - __NR_O32_Linux];
#endif

	return (unsigned long) &sys_ni_syscall;
}
#endif

#endif /* CONFIG_FTRACE_SYSCALLS */