blob: a17fdb63dc3e470955dcfd5e5861920b9db2749f [file] [log] [blame]
/* Rewritten by Rusty Russell, on the backs of many others...
   Copyright (C) 2001 Rusty Russell, 2002 Rusty Russell IBM.

    This program is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 2 of the License, or
    (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program; if not, write to the Free Software
    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
*/
Frederic Weisbecker8b96f012008-12-06 03:40:00 +010018#include <linux/ftrace.h>
Dmitri Vorobievf80d2d72009-03-22 19:11:10 +020019#include <linux/memory.h>
Paul Gortmaker8a293be2016-07-23 14:01:45 -040020#include <linux/extable.h>
Ingo Molnar505f2b92009-03-20 11:05:04 +010021#include <linux/module.h>
22#include <linux/mutex.h>
23#include <linux/init.h>
Masami Hiramatsu5b485622017-01-08 23:58:09 +090024#include <linux/kprobes.h>
Daniel Borkmann74451e662017-02-16 22:24:50 +010025#include <linux/filter.h>
Ingo Molnar505f2b92009-03-20 11:05:04 +010026
Linus Torvalds1da177e2005-04-16 15:20:36 -070027#include <asm/sections.h>
Linus Torvalds7c0f6ba2016-12-24 11:46:01 -080028#include <linux/uaccess.h>
Ingo Molnar505f2b92009-03-20 11:05:04 +010029
/*
 * Mutex protecting text section modification (dynamic code patching).
 * Some users need to sleep (allocating memory...) while they hold this lock.
 *
 * Note: Also protects SMP-alternatives modification on x86.
 *
 * NOT exported to modules - patching kernel text is a really delicate matter.
 */
DEFINE_MUTEX(text_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -070039
/*
 * Start and end (one past the last entry) of the kernel's built-in
 * exception table; presumably provided by the linker script - verify.
 */
extern struct exception_table_entry __start___ex_table[];
extern struct exception_table_entry __stop___ex_table[];
42
/*
 * Non-zero when the built-in exception table still has to be sorted at
 * boot.  Cleared by build time tools if the table is already sorted.
 */
u32 __initdata __visible main_extable_sort_needed = 1;
David Daneyd219e2e2012-04-19 14:59:56 -070045
Linus Torvalds1da177e2005-04-16 15:20:36 -070046/* Sort the kernel's built-in exception table */
47void __init sort_main_extable(void)
48{
Uwe Kleine-Könige656a632013-09-11 14:23:27 -070049 if (main_extable_sort_needed && __stop___ex_table > __start___ex_table) {
Borislav Petkovbec1b9e2013-04-15 12:51:49 +020050 pr_notice("Sorting __ex_table...\n");
David Daneyd219e2e2012-04-19 14:59:56 -070051 sort_extable(__start___ex_table, __stop___ex_table);
Borislav Petkovbec1b9e2013-04-15 12:51:49 +020052 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070053}
54
55/* Given an address, look for it in the exception tables. */
56const struct exception_table_entry *search_exception_tables(unsigned long addr)
57{
58 const struct exception_table_entry *e;
59
Thomas Meyera94c33d2017-07-10 15:51:58 -070060 e = search_extable(__start___ex_table,
61 __stop___ex_table - __start___ex_table, addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -070062 if (!e)
63 e = search_module_extables(addr);
64 return e;
65}
66
Ingo Molnar4a44bac2009-03-19 13:21:44 +010067static inline int init_kernel_text(unsigned long addr)
68{
69 if (addr >= (unsigned long)_sinittext &&
Helge Deller5ecbe3c2013-11-28 09:16:33 +010070 addr < (unsigned long)_einittext)
Ingo Molnar4a44bac2009-03-19 13:21:44 +010071 return 1;
72 return 0;
73}
74
Marcin Nowakowskic0d80dd2017-07-06 15:35:31 -070075int notrace core_kernel_text(unsigned long addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -070076{
77 if (addr >= (unsigned long)_stext &&
Helge Deller5ecbe3c2013-11-28 09:16:33 +010078 addr < (unsigned long)_etext)
Linus Torvalds1da177e2005-04-16 15:20:36 -070079 return 1;
80
Thomas Gleixner05947292017-05-16 20:42:44 +020081 if (system_state < SYSTEM_RUNNING &&
Ingo Molnar4a44bac2009-03-19 13:21:44 +010082 init_kernel_text(addr))
Linus Torvalds1da177e2005-04-16 15:20:36 -070083 return 1;
84 return 0;
85}
86
Steven Rostedta2d063a2011-05-19 21:34:58 -040087/**
88 * core_kernel_data - tell if addr points to kernel data
89 * @addr: address to test
90 *
91 * Returns true if @addr passed in is from the core kernel data
92 * section.
93 *
94 * Note: On some archs it may return true for core RODATA, and false
95 * for others. But will always be true for core RW data.
96 */
Steven Rostedtcdbe61b2011-05-05 21:14:55 -040097int core_kernel_data(unsigned long addr)
98{
Steven Rostedta2d063a2011-05-19 21:34:58 -040099 if (addr >= (unsigned long)_sdata &&
Steven Rostedtcdbe61b2011-05-05 21:14:55 -0400100 addr < (unsigned long)_edata)
101 return 1;
102 return 0;
103}
104
/*
 * Like kernel_text_address(), but additionally accepts addresses in the
 * init text regardless of system state.  Returns 1 on a match, else 0.
 */
int __kernel_text_address(unsigned long addr)
{
	/*
	 * There might be init symbols in saved stacktraces.
	 * Give those symbols a chance to be printed in
	 * backtraces (such as lockdep traces).
	 *
	 * Since the init text check comes after the module-symbols
	 * check done by kernel_text_address(), there's no danger of
	 * address overlap.
	 */
	return kernel_text_address(addr) || init_kernel_text(addr);
}
121
122int kernel_text_address(unsigned long addr)
123{
Steven Rostedt (VMware)e8cac8b2017-09-22 17:36:32 -0400124 bool no_rcu;
125 int ret = 1;
126
Linus Torvalds1da177e2005-04-16 15:20:36 -0700127 if (core_kernel_text(addr))
128 return 1;
Steven Rostedt (VMware)e8cac8b2017-09-22 17:36:32 -0400129
130 /*
131 * If a stack dump happens while RCU is not watching, then
132 * RCU needs to be notified that it requires to start
133 * watching again. This can happen either by tracing that
134 * triggers a stack trace, or a WARN() that happens during
135 * coming back from idle, or cpu on or offlining.
136 *
137 * is_module_text_address() as well as the kprobe slots
138 * and is_bpf_text_address() require RCU to be watching.
139 */
140 no_rcu = !rcu_is_watching();
141
142 /* Treat this like an NMI as it can happen anywhere */
143 if (no_rcu)
144 rcu_nmi_enter();
145
Steven Rostedt (Red Hat)aec0be22014-11-18 21:14:11 -0500146 if (is_module_text_address(addr))
Steven Rostedt (VMware)e8cac8b2017-09-22 17:36:32 -0400147 goto out;
Masami Hiramatsu5b485622017-01-08 23:58:09 +0900148 if (is_ftrace_trampoline(addr))
Steven Rostedt (VMware)e8cac8b2017-09-22 17:36:32 -0400149 goto out;
Masami Hiramatsu5b485622017-01-08 23:58:09 +0900150 if (is_kprobe_optinsn_slot(addr) || is_kprobe_insn_slot(addr))
Steven Rostedt (VMware)e8cac8b2017-09-22 17:36:32 -0400151 goto out;
Daniel Borkmann74451e662017-02-16 22:24:50 +0100152 if (is_bpf_text_address(addr))
Steven Rostedt (VMware)e8cac8b2017-09-22 17:36:32 -0400153 goto out;
154 ret = 0;
155out:
156 if (no_rcu)
157 rcu_nmi_exit();
158
159 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160}
Arjan van de Venab7476c2008-08-15 15:29:38 -0700161
/*
 * On some architectures (PPC64, IA64) function pointers
 * are actually only tokens to some data that then holds the
 * real function address. As a result, to find if a function
 * pointer is part of the kernel text, we need to do some
 * special dereferencing first.
 *
 * Returns non-zero if the dereferenced address is core kernel text or
 * module text, 0 otherwise.
 */
int func_ptr_is_kernel_text(void *ptr)
{
	unsigned long addr = (unsigned long)dereference_function_descriptor(ptr);

	if (!core_kernel_text(addr))
		return is_module_text_address(addr);

	return 1;
}