extable.c 4.8 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17
/* Rewritten by Rusty Russell, on the backs of many others...
   Copyright (C) 2001 Rusty Russell, 2002 Rusty Russell IBM.

    This program is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 2 of the License, or
    (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program; if not, write to the Free Software
    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
*/
18
#include <linux/ftrace.h>
19
#include <linux/memory.h>
20
#include <linux/extable.h>
L
Linus Torvalds 已提交
21
#include <linux/module.h>
22
#include <linux/mutex.h>
L
Linus Torvalds 已提交
23
#include <linux/init.h>
24
#include <linux/kprobes.h>
25
#include <linux/filter.h>
26

L
Linus Torvalds 已提交
27
#include <asm/sections.h>
28
#include <linux/uaccess.h>
29 30 31 32 33

/*
 * Mutex protecting text section modification (dynamic code patching).
 * Some users need to sleep (e.g. to allocate memory) while they hold this
 * lock.
 *
 * Note: Also protects SMP-alternatives modification on x86.
 *
 * NOT exported to modules - patching kernel text is a really delicate matter.
 */
DEFINE_MUTEX(text_mutex);
L
Linus Torvalds 已提交
39 40 41 42

/*
 * Start and one-past-the-end markers of the kernel's built-in exception
 * table. Both are defined outside this file (presumably by the linker
 * script - confirm against the arch's vmlinux.lds).
 */
extern struct exception_table_entry __start___ex_table[];
extern struct exception_table_entry __stop___ex_table[];

43
/* Cleared by build time tools if the table is already sorted. */
44
/* Defaults to 1, so sort_main_extable() sorts unless this has been zeroed. */
u32 __initdata __visible main_extable_sort_needed = 1;
45

L
Linus Torvalds 已提交
46 47 48
/*
 * Sort the kernel's built-in exception table.
 *
 * Nothing is done when main_extable_sort_needed is zero or when the
 * table holds no entries (__stop___ex_table <= __start___ex_table).
 */
void __init sort_main_extable(void)
{
	if (!main_extable_sort_needed)
		return;

	if (__stop___ex_table <= __start___ex_table)
		return;

	pr_notice("Sorting __ex_table...\n");
	sort_extable(__start___ex_table, __stop___ex_table);
}

/* Given an address, look for it in the exception tables. */
const struct exception_table_entry *search_exception_tables(unsigned long addr)
{
	const struct exception_table_entry *e;

60 61
	e = search_extable(__start___ex_table,
			   __stop___ex_table - __start___ex_table, addr);
L
Linus Torvalds 已提交
62 63 64 65 66
	if (!e)
		e = search_module_extables(addr);
	return e;
}

67
int init_kernel_text(unsigned long addr)
68 69
{
	if (addr >= (unsigned long)_sinittext &&
70
	    addr < (unsigned long)_einittext)
71 72 73 74
		return 1;
	return 0;
}

75
/*
 * Returns 1 when addr lies in [_stext, _etext). While system_state is
 * still below SYSTEM_RUNNING, init text addresses are accepted as well.
 * Returns 0 in every other case.
 */
int notrace core_kernel_text(unsigned long addr)
{
	unsigned long text_start = (unsigned long)_stext;
	unsigned long text_end = (unsigned long)_etext;

	if (text_start <= addr && addr < text_end)
		return 1;

	/* Init text is only consulted before SYSTEM_RUNNING is reached. */
	return system_state < SYSTEM_RUNNING && init_kernel_text(addr);
}

87 88 89 90 91 92 93 94 95 96
/**
 * core_kernel_data - tell if addr points to kernel data
 * @addr: address to test
 *
 * Returns true if @addr passed in is from the core kernel data
 * section.
 *
 * Note: On some archs it may return true for core RODATA, and false
 *  for others. But will always be true for core RW data.
 */
97 98
int core_kernel_data(unsigned long addr)
{
99
	if (addr >= (unsigned long)_sdata &&
100 101 102 103 104
	    addr < (unsigned long)_edata)
		return 1;
	return 0;
}

105
/*
 * Like kernel_text_address(), but additionally accepts init text
 * addresses. Returns 1 on a match, 0 otherwise.
 */
int __kernel_text_address(unsigned long addr)
{
	/*
	 * Saved stacktraces may still contain init symbols; accepting
	 * them here lets them show up in backtraces (such as lockdep
	 * traces).
	 *
	 * The init text test runs only after kernel_text_address(),
	 * which includes the module check, has failed, so there is no
	 * danger of address overlap.
	 */
	return kernel_text_address(addr) || init_kernel_text(addr);
}

int kernel_text_address(unsigned long addr)
{
124 125 126
	bool no_rcu;
	int ret = 1;

L
Linus Torvalds 已提交
127 128
	if (core_kernel_text(addr))
		return 1;
129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145

	/*
	 * If a stack dump happens while RCU is not watching, then
	 * RCU needs to be notified that it requires to start
	 * watching again. This can happen either by tracing that
	 * triggers a stack trace, or a WARN() that happens during
	 * coming back from idle, or cpu on or offlining.
	 *
	 * is_module_text_address() as well as the kprobe slots
	 * and is_bpf_text_address() require RCU to be watching.
	 */
	no_rcu = !rcu_is_watching();

	/* Treat this like an NMI as it can happen anywhere */
	if (no_rcu)
		rcu_nmi_enter();

146
	if (is_module_text_address(addr))
147
		goto out;
148
	if (is_ftrace_trampoline(addr))
149
		goto out;
150
	if (is_kprobe_optinsn_slot(addr) || is_kprobe_insn_slot(addr))
151
		goto out;
152
	if (is_bpf_text_address(addr))
153 154 155 156 157 158 159
		goto out;
	ret = 0;
out:
	if (no_rcu)
		rcu_nmi_exit();

	return ret;
L
Linus Torvalds 已提交
160
}
161 162 163 164 165 166 167 168 169 170 171 172 173 174

/*
 * On some architectures (PPC64, IA64) a function pointer is only a
 * token referring to data that in turn holds the real function
 * address. The pointer is therefore passed through
 * dereference_function_descriptor() before it is checked against
 * core kernel text and then module text.
 */
int func_ptr_is_kernel_text(void *ptr)
{
	unsigned long addr =
		(unsigned long)dereference_function_descriptor(ptr);

	if (!core_kernel_text(addr))
		return is_module_text_address(addr);

	return 1;
}