blob: 9aa1cc41ecf79c8c2cc5fb9dbd3fbd418025c0dd [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/* Rewritten by Rusty Russell, on the backs of many others...
2 Copyright (C) 2001 Rusty Russell, 2002 Rusty Russell IBM.
3
4 This program is free software; you can redistribute it and/or modify
5 it under the terms of the GNU General Public License as published by
6 the Free Software Foundation; either version 2 of the License, or
7 (at your option) any later version.
8
9 This program is distributed in the hope that it will be useful,
10 but WITHOUT ANY WARRANTY; without even the implied warranty of
11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 GNU General Public License for more details.
13
14 You should have received a copy of the GNU General Public License
15 along with this program; if not, write to the Free Software
16 Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17*/
Frederic Weisbecker8b96f012008-12-06 03:40:00 +010018#include <linux/ftrace.h>
Dmitri Vorobievf80d2d72009-03-22 19:11:10 +020019#include <linux/memory.h>
Paul Gortmaker8a293be2016-07-23 14:01:45 -040020#include <linux/extable.h>
Ingo Molnar505f2b92009-03-20 11:05:04 +010021#include <linux/module.h>
22#include <linux/mutex.h>
23#include <linux/init.h>
Masami Hiramatsu5b485622017-01-08 23:58:09 +090024#include <linux/kprobes.h>
Daniel Borkmann74451e662017-02-16 22:24:50 +010025#include <linux/filter.h>
Ingo Molnar505f2b92009-03-20 11:05:04 +010026
Linus Torvalds1da177e2005-04-16 15:20:36 -070027#include <asm/sections.h>
Linus Torvalds7c0f6ba2016-12-24 11:46:01 -080028#include <linux/uaccess.h>
Ingo Molnar505f2b92009-03-20 11:05:04 +010029
/*
 * Mutex protecting text section modification (dynamic code patching).
 * Some users need to sleep (e.g. while allocating memory) while they
 * hold this lock, which is why it is a mutex.
 *
 * NOT exported to modules - patching kernel text is a really delicate matter.
 */
DEFINE_MUTEX(text_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -070037
/*
 * Bounds of the kernel's built-in exception table. The code in this file
 * treats [__start___ex_table, __stop___ex_table) as the table contents.
 */
extern struct exception_table_entry __start___ex_table[];
extern struct exception_table_entry __stop___ex_table[];

/*
 * Cleared by build time tools if the table is already sorted.
 * While non-zero, sort_main_extable() sorts the built-in table.
 */
u32 __initdata __visible main_extable_sort_needed = 1;
David Daneyd219e2e2012-04-19 14:59:56 -070043
Linus Torvalds1da177e2005-04-16 15:20:36 -070044/* Sort the kernel's built-in exception table */
45void __init sort_main_extable(void)
46{
Uwe Kleine-Könige656a632013-09-11 14:23:27 -070047 if (main_extable_sort_needed && __stop___ex_table > __start___ex_table) {
Borislav Petkovbec1b9e2013-04-15 12:51:49 +020048 pr_notice("Sorting __ex_table...\n");
David Daneyd219e2e2012-04-19 14:59:56 -070049 sort_extable(__start___ex_table, __stop___ex_table);
Borislav Petkovbec1b9e2013-04-15 12:51:49 +020050 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070051}
52
53/* Given an address, look for it in the exception tables. */
54const struct exception_table_entry *search_exception_tables(unsigned long addr)
55{
56 const struct exception_table_entry *e;
57
Thomas Meyera94c33d2017-07-10 15:51:58 -070058 e = search_extable(__start___ex_table,
59 __stop___ex_table - __start___ex_table, addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -070060 if (!e)
61 e = search_module_extables(addr);
62 return e;
63}
64
Ingo Molnar4a44bac2009-03-19 13:21:44 +010065static inline int init_kernel_text(unsigned long addr)
66{
67 if (addr >= (unsigned long)_sinittext &&
Helge Deller5ecbe3c2013-11-28 09:16:33 +010068 addr < (unsigned long)_einittext)
Ingo Molnar4a44bac2009-03-19 13:21:44 +010069 return 1;
70 return 0;
71}
72
Marcin Nowakowskic0d80dd2017-07-06 15:35:31 -070073int notrace core_kernel_text(unsigned long addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -070074{
75 if (addr >= (unsigned long)_stext &&
Helge Deller5ecbe3c2013-11-28 09:16:33 +010076 addr < (unsigned long)_etext)
Linus Torvalds1da177e2005-04-16 15:20:36 -070077 return 1;
78
Thomas Gleixner05947292017-05-16 20:42:44 +020079 if (system_state < SYSTEM_RUNNING &&
Ingo Molnar4a44bac2009-03-19 13:21:44 +010080 init_kernel_text(addr))
Linus Torvalds1da177e2005-04-16 15:20:36 -070081 return 1;
82 return 0;
83}
84
Steven Rostedta2d063a2011-05-19 21:34:58 -040085/**
86 * core_kernel_data - tell if addr points to kernel data
87 * @addr: address to test
88 *
89 * Returns true if @addr passed in is from the core kernel data
90 * section.
91 *
92 * Note: On some archs it may return true for core RODATA, and false
93 * for others. But will always be true for core RW data.
94 */
Steven Rostedtcdbe61b2011-05-05 21:14:55 -040095int core_kernel_data(unsigned long addr)
96{
Steven Rostedta2d063a2011-05-19 21:34:58 -040097 if (addr >= (unsigned long)_sdata &&
Steven Rostedtcdbe61b2011-05-05 21:14:55 -040098 addr < (unsigned long)_edata)
99 return 1;
100 return 0;
101}
102
/*
 * Return 1 if kernel_text_address() accepts @addr, or if @addr lies in
 * the init text range (checked here without looking at system_state);
 * return 0 otherwise.
 */
int __kernel_text_address(unsigned long addr)
{
	/*
	 * Saved stacktraces may still contain init symbols. Accept them so
	 * that they can be printed in backtraces (such as lockdep traces).
	 *
	 * The init text check runs after kernel_text_address(), i.e. after
	 * the module-symbols check, so there's no danger of address overlap.
	 */
	return (kernel_text_address(addr) || init_kernel_text(addr)) ? 1 : 0;
}
119
/*
 * Return 1 if @addr is in core kernel text, module text, an ftrace
 * trampoline, a kprobe instruction slot or BPF text; return 0 otherwise.
 */
int kernel_text_address(unsigned long addr)
{
	bool rcu_was_idle;
	int found;

	/* Core kernel text is checked first, before any RCU handling. */
	if (core_kernel_text(addr))
		return 1;

	/*
	 * is_module_text_address() as well as the kprobe slots and
	 * is_bpf_text_address() require RCU to be watching.
	 *
	 * A stack dump can happen while RCU is not watching: tracing that
	 * triggers a stack trace, a WARN() while coming back from idle, or
	 * cpu on- or offlining. In that case RCU has to be told to start
	 * watching again. Treat it like an NMI, as it can happen anywhere.
	 */
	rcu_was_idle = !rcu_is_watching();
	if (rcu_was_idle)
		rcu_nmi_enter();

	/* Short-circuit evaluation keeps the lookups in their fixed order. */
	found = is_module_text_address(addr) ||
		is_ftrace_trampoline(addr) ||
		is_kprobe_optinsn_slot(addr) ||
		is_kprobe_insn_slot(addr) ||
		is_bpf_text_address(addr);

	if (rcu_was_idle)
		rcu_nmi_exit();

	return found;
}
Arjan van de Venab7476c2008-08-15 15:29:38 -0700159
/*
 * On some architectures (PPC64, IA64) a function pointer is only a
 * token referring to data that holds the real function address. To
 * decide whether such a pointer refers to kernel text, it must first be
 * dereferenced to the real address.
 *
 * Returns 1 for core kernel text, otherwise the result of
 * is_module_text_address() for the dereferenced address.
 */
int func_ptr_is_kernel_text(void *ptr)
{
	unsigned long target =
		(unsigned long) dereference_function_descriptor(ptr);

	if (!core_kernel_text(target))
		return is_module_text_address(target);

	return 1;
}