1 /* Rewritten by Rusty Russell, on the backs of many others...
2    Copyright (C) 2001 Rusty Russell, 2002 Rusty Russell IBM.
3 
4     This program is free software; you can redistribute it and/or modify
5     it under the terms of the GNU General Public License as published by
6     the Free Software Foundation; either version 2 of the License, or
7     (at your option) any later version.
8 
9     This program is distributed in the hope that it will be useful,
10     but WITHOUT ANY WARRANTY; without even the implied warranty of
11     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12     GNU General Public License for more details.
13 
14     You should have received a copy of the GNU General Public License
15     along with this program; if not, write to the Free Software
16     Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
17 */
18 #include <linux/ftrace.h>
19 #include <linux/memory.h>
20 #include <linux/extable.h>
21 #include <linux/module.h>
22 #include <linux/mutex.h>
23 #include <linux/init.h>
24 #include <linux/kprobes.h>
25 #include <linux/filter.h>
26 
27 #include <asm/sections.h>
28 #include <linux/uaccess.h>
29 
30 /*
31  * mutex protecting text section modification (dynamic code patching).
32  * some users need to sleep (allocating memory...) while they hold this lock.
33  *
34  * Note: Also protects SMP-alternatives modification on x86.
35  *
36  * NOT exported to modules - patching kernel text is a really delicate matter.
37  */
38 DEFINE_MUTEX(text_mutex);
39 
40 extern struct exception_table_entry __start___ex_table[];
41 extern struct exception_table_entry __stop___ex_table[];
42 
43 /* Cleared by build time tools if the table is already sorted. */
44 u32 __initdata __visible main_extable_sort_needed = 1;
45 
46 /* Sort the kernel's built-in exception table */
sort_main_extable(void)47 void __init sort_main_extable(void)
48 {
49 	if (main_extable_sort_needed && __stop___ex_table > __start___ex_table) {
50 		pr_notice("Sorting __ex_table...\n");
51 		sort_extable(__start___ex_table, __stop___ex_table);
52 	}
53 }
54 
55 /* Given an address, look for it in the exception tables. */
search_exception_tables(unsigned long addr)56 const struct exception_table_entry *search_exception_tables(unsigned long addr)
57 {
58 	const struct exception_table_entry *e;
59 
60 	e = search_extable(__start___ex_table,
61 			   __stop___ex_table - __start___ex_table, addr);
62 	if (!e)
63 		e = search_module_extables(addr);
64 	return e;
65 }
66 
init_kernel_text(unsigned long addr)67 int init_kernel_text(unsigned long addr)
68 {
69 	if (addr >= (unsigned long)_sinittext &&
70 	    addr < (unsigned long)_einittext)
71 		return 1;
72 	return 0;
73 }
74 
core_kernel_text(unsigned long addr)75 int notrace core_kernel_text(unsigned long addr)
76 {
77 	if (addr >= (unsigned long)_stext &&
78 	    addr < (unsigned long)_etext)
79 		return 1;
80 
81 	if (system_state < SYSTEM_RUNNING &&
82 	    init_kernel_text(addr))
83 		return 1;
84 	return 0;
85 }
86 
87 /**
88  * core_kernel_data - tell if addr points to kernel data
89  * @addr: address to test
90  *
91  * Returns true if @addr passed in is from the core kernel data
92  * section.
93  *
94  * Note: On some archs it may return true for core RODATA, and false
95  *  for others. But will always be true for core RW data.
96  */
core_kernel_data(unsigned long addr)97 int core_kernel_data(unsigned long addr)
98 {
99 	if (addr >= (unsigned long)_sdata &&
100 	    addr < (unsigned long)_edata)
101 		return 1;
102 	return 0;
103 }
104 
__kernel_text_address(unsigned long addr)105 int __kernel_text_address(unsigned long addr)
106 {
107 	if (kernel_text_address(addr))
108 		return 1;
109 	/*
110 	 * There might be init symbols in saved stacktraces.
111 	 * Give those symbols a chance to be printed in
112 	 * backtraces (such as lockdep traces).
113 	 *
114 	 * Since we are after the module-symbols check, there's
115 	 * no danger of address overlap:
116 	 */
117 	if (init_kernel_text(addr))
118 		return 1;
119 	return 0;
120 }
121 
kernel_text_address(unsigned long addr)122 int kernel_text_address(unsigned long addr)
123 {
124 	bool no_rcu;
125 	int ret = 1;
126 
127 	if (core_kernel_text(addr))
128 		return 1;
129 
130 	/*
131 	 * If a stack dump happens while RCU is not watching, then
132 	 * RCU needs to be notified that it requires to start
133 	 * watching again. This can happen either by tracing that
134 	 * triggers a stack trace, or a WARN() that happens during
135 	 * coming back from idle, or cpu on or offlining.
136 	 *
137 	 * is_module_text_address() as well as the kprobe slots
138 	 * and is_bpf_text_address() require RCU to be watching.
139 	 */
140 	no_rcu = !rcu_is_watching();
141 
142 	/* Treat this like an NMI as it can happen anywhere */
143 	if (no_rcu)
144 		rcu_nmi_enter();
145 
146 	if (is_module_text_address(addr))
147 		goto out;
148 	if (is_ftrace_trampoline(addr))
149 		goto out;
150 	if (is_kprobe_optinsn_slot(addr) || is_kprobe_insn_slot(addr))
151 		goto out;
152 	if (is_bpf_text_address(addr))
153 		goto out;
154 	ret = 0;
155 out:
156 	if (no_rcu)
157 		rcu_nmi_exit();
158 
159 	return ret;
160 }
161 
162 /*
163  * On some architectures (PPC64, IA64) function pointers
164  * are actually only tokens to some data that then holds the
165  * real function address. As a result, to find if a function
166  * pointer is part of the kernel text, we need to do some
167  * special dereferencing first.
168  */
func_ptr_is_kernel_text(void * ptr)169 int func_ptr_is_kernel_text(void *ptr)
170 {
171 	unsigned long addr;
172 	addr = (unsigned long) dereference_function_descriptor(ptr);
173 	if (core_kernel_text(addr))
174 		return 1;
175 	return is_module_text_address(addr);
176 }
177