Greg Kroah-Hartman | b244131 | 2017-11-01 15:07:57 +0100 | [diff] [blame] | 1 | // SPDX-License-Identifier: GPL-2.0 |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 2 | /* |
Andy Lutomirski | 95c46b5 | 2014-10-29 14:33:46 -0700 | [diff] [blame] | 3 | * Copyright (c) 2012-2014 Andy Lutomirski <luto@amacapital.net> |
| 4 | * |
| 5 | * Based on the original implementation which is: |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 6 | * Copyright (C) 2001 Andrea Arcangeli <andrea@suse.de> SuSE |
| 7 | * Copyright 2003 Andi Kleen, SuSE Labs. |
| 8 | * |
Andy Lutomirski | 95c46b5 | 2014-10-29 14:33:46 -0700 | [diff] [blame] | 9 | * Parts of the original code have been moved to arch/x86/vdso/vma.c |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 10 | * |
Andy Lutomirski | 95c46b5 | 2014-10-29 14:33:46 -0700 | [diff] [blame] | 11 | * This file implements vsyscall emulation. vsyscalls are a legacy ABI: |
| 12 | * Userspace can request certain kernel services by calling fixed |
| 13 | * addresses. This concept is problematic: |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 14 | * |
Andy Lutomirski | 95c46b5 | 2014-10-29 14:33:46 -0700 | [diff] [blame] | 15 | * - It interferes with ASLR. |
| 16 | * - It's awkward to write code that lives in kernel addresses but is |
| 17 | * callable by userspace at fixed addresses. |
| 18 | * - The whole concept is impossible for 32-bit compat userspace. |
| 19 | * - UML cannot easily virtualize a vsyscall. |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 20 | * |
Andy Lutomirski | 95c46b5 | 2014-10-29 14:33:46 -0700 | [diff] [blame] | 21 | * As of mid-2014, I believe that there is no new userspace code that |
| 22 | * will use a vsyscall if the vDSO is present. I hope that there will |
| 23 | * soon be no new userspace code that will ever use a vsyscall. |
| 24 | * |
| 25 | * The code in this file emulates vsyscalls when notified of a page |
| 26 | * fault to a vsyscall address. |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 27 | */ |
| 28 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 29 | #include <linux/kernel.h> |
| 30 | #include <linux/timer.h> |
Ingo Molnar | 3f07c01 | 2017-02-08 18:51:30 +0100 | [diff] [blame] | 31 | #include <linux/sched/signal.h> |
Ingo Molnar | 589ee62 | 2017-02-04 00:16:44 +0100 | [diff] [blame] | 32 | #include <linux/mm_types.h> |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 33 | #include <linux/syscalls.h> |
| 34 | #include <linux/ratelimit.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 35 | |
| 36 | #include <asm/vsyscall.h> |
john stultz | 7460ed2 | 2007-02-16 01:28:21 -0800 | [diff] [blame] | 37 | #include <asm/unistd.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 38 | #include <asm/fixmap.h> |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 39 | #include <asm/traps.h> |
Andy Lutomirski | 49275fe | 2017-12-10 22:47:19 -0800 | [diff] [blame] | 40 | #include <asm/paravirt.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 41 | |
Andy Lutomirski | c149a66 | 2011-08-03 09:31:54 -0400 | [diff] [blame] | 42 | #define CREATE_TRACE_POINTS |
| 43 | #include "vsyscall_trace.h" |
| 44 | |
Kees Cook | 3dc33bd | 2015-08-12 17:55:19 -0700 | [diff] [blame] | 45 | static enum { EMULATE, NATIVE, NONE } vsyscall_mode = |
Borislav Petkov | 93f13a9 | 2015-09-21 09:48:29 +0200 | [diff] [blame] | 46 | #if defined(CONFIG_LEGACY_VSYSCALL_NATIVE) |
Kees Cook | 3dc33bd | 2015-08-12 17:55:19 -0700 | [diff] [blame] | 47 | NATIVE; |
Borislav Petkov | 93f13a9 | 2015-09-21 09:48:29 +0200 | [diff] [blame] | 48 | #elif defined(CONFIG_LEGACY_VSYSCALL_NONE) |
Kees Cook | 3dc33bd | 2015-08-12 17:55:19 -0700 | [diff] [blame] | 49 | NONE; |
| 50 | #else |
| 51 | EMULATE; |
| 52 | #endif |
Andy Lutomirski | 3ae3665 | 2011-08-10 11:15:32 -0400 | [diff] [blame] | 53 | |
| 54 | static int __init vsyscall_setup(char *str) |
| 55 | { |
| 56 | if (str) { |
| 57 | if (!strcmp("emulate", str)) |
| 58 | vsyscall_mode = EMULATE; |
| 59 | else if (!strcmp("native", str)) |
| 60 | vsyscall_mode = NATIVE; |
| 61 | else if (!strcmp("none", str)) |
| 62 | vsyscall_mode = NONE; |
| 63 | else |
| 64 | return -EINVAL; |
| 65 | |
| 66 | return 0; |
| 67 | } |
| 68 | |
| 69 | return -EINVAL; |
| 70 | } |
| 71 | early_param("vsyscall", vsyscall_setup); |
| 72 | |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 73 | static void warn_bad_vsyscall(const char *level, struct pt_regs *regs, |
| 74 | const char *message) |
| 75 | { |
Joe Perches | c767a54 | 2012-05-21 19:50:07 -0700 | [diff] [blame] | 76 | if (!show_unhandled_signals) |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 77 | return; |
| 78 | |
Andy Lutomirski | 53b884a | 2014-07-25 16:30:27 -0700 | [diff] [blame] | 79 | printk_ratelimited("%s%s[%d] %s ip:%lx cs:%lx sp:%lx ax:%lx si:%lx di:%lx\n", |
| 80 | level, current->comm, task_pid_nr(current), |
| 81 | message, regs->ip, regs->cs, |
| 82 | regs->sp, regs->ax, regs->si, regs->di); |
Andy Lutomirski | c971294 | 2011-07-13 09:24:09 -0400 | [diff] [blame] | 83 | } |
| 84 | |
| 85 | static int addr_to_vsyscall_nr(unsigned long addr) |
| 86 | { |
| 87 | int nr; |
| 88 | |
Andy Lutomirski | f40c330 | 2014-05-05 12:19:36 -0700 | [diff] [blame] | 89 | if ((addr & ~0xC00UL) != VSYSCALL_ADDR) |
Andy Lutomirski | c971294 | 2011-07-13 09:24:09 -0400 | [diff] [blame] | 90 | return -EINVAL; |
| 91 | |
| 92 | nr = (addr & 0xC00UL) >> 10; |
| 93 | if (nr >= 3) |
| 94 | return -EINVAL; |
| 95 | |
| 96 | return nr; |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 97 | } |
| 98 | |
Andy Lutomirski | 4fc3490 | 2011-11-07 16:33:40 -0800 | [diff] [blame] | 99 | static bool write_ok_or_segv(unsigned long ptr, size_t size) |
| 100 | { |
| 101 | /* |
| 102 | * XXX: if access_ok, get_user, and put_user handled |
Ingo Molnar | 2a53ccb | 2016-07-15 10:21:11 +0200 | [diff] [blame] | 103 | * sig_on_uaccess_err, this could go away. |
Andy Lutomirski | 4fc3490 | 2011-11-07 16:33:40 -0800 | [diff] [blame] | 104 | */ |
| 105 | |
| 106 | if (!access_ok(VERIFY_WRITE, (void __user *)ptr, size)) { |
| 107 | siginfo_t info; |
| 108 | struct thread_struct *thread = ¤t->thread; |
| 109 | |
| 110 | thread->error_code = 6; /* user fault, no page, write */ |
| 111 | thread->cr2 = ptr; |
Srikar Dronamraju | 51e7dc7 | 2012-03-12 14:55:55 +0530 | [diff] [blame] | 112 | thread->trap_nr = X86_TRAP_PF; |
Andy Lutomirski | 4fc3490 | 2011-11-07 16:33:40 -0800 | [diff] [blame] | 113 | |
| 114 | memset(&info, 0, sizeof(info)); |
| 115 | info.si_signo = SIGSEGV; |
| 116 | info.si_errno = 0; |
| 117 | info.si_code = SEGV_MAPERR; |
| 118 | info.si_addr = (void __user *)ptr; |
| 119 | |
| 120 | force_sig_info(SIGSEGV, &info, current); |
| 121 | return false; |
| 122 | } else { |
| 123 | return true; |
| 124 | } |
| 125 | } |
| 126 | |
Andy Lutomirski | 3ae3665 | 2011-08-10 11:15:32 -0400 | [diff] [blame] | 127 | bool emulate_vsyscall(struct pt_regs *regs, unsigned long address) |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 128 | { |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 129 | struct task_struct *tsk; |
| 130 | unsigned long caller; |
Andy Lutomirski | 87b526d | 2012-10-01 11:40:45 -0700 | [diff] [blame] | 131 | int vsyscall_nr, syscall_nr, tmp; |
Ingo Molnar | 2a53ccb | 2016-07-15 10:21:11 +0200 | [diff] [blame] | 132 | int prev_sig_on_uaccess_err; |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 133 | long ret; |
| 134 | |
Andy Lutomirski | 3ae3665 | 2011-08-10 11:15:32 -0400 | [diff] [blame] | 135 | /* |
| 136 | * No point in checking CS -- the only way to get here is a user mode |
| 137 | * trap to a high address, which means that we're in 64-bit user code. |
| 138 | */ |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 139 | |
Andy Lutomirski | 3ae3665 | 2011-08-10 11:15:32 -0400 | [diff] [blame] | 140 | WARN_ON_ONCE(address != regs->ip); |
Andy Lutomirski | c971294 | 2011-07-13 09:24:09 -0400 | [diff] [blame] | 141 | |
Andy Lutomirski | 4831b77 | 2017-12-10 22:47:20 -0800 | [diff] [blame] | 142 | /* This should be unreachable in NATIVE mode. */ |
| 143 | if (WARN_ON(vsyscall_mode == NATIVE)) |
| 144 | return false; |
| 145 | |
Andy Lutomirski | 3ae3665 | 2011-08-10 11:15:32 -0400 | [diff] [blame] | 146 | if (vsyscall_mode == NONE) { |
| 147 | warn_bad_vsyscall(KERN_INFO, regs, |
| 148 | "vsyscall attempted with vsyscall=none"); |
| 149 | return false; |
Andy Lutomirski | c971294 | 2011-07-13 09:24:09 -0400 | [diff] [blame] | 150 | } |
| 151 | |
Andy Lutomirski | 3ae3665 | 2011-08-10 11:15:32 -0400 | [diff] [blame] | 152 | vsyscall_nr = addr_to_vsyscall_nr(address); |
Andy Lutomirski | c149a66 | 2011-08-03 09:31:54 -0400 | [diff] [blame] | 153 | |
| 154 | trace_emulate_vsyscall(vsyscall_nr); |
| 155 | |
Andy Lutomirski | c971294 | 2011-07-13 09:24:09 -0400 | [diff] [blame] | 156 | if (vsyscall_nr < 0) { |
| 157 | warn_bad_vsyscall(KERN_WARNING, regs, |
Andy Lutomirski | 3ae3665 | 2011-08-10 11:15:32 -0400 | [diff] [blame] | 158 | "misaligned vsyscall (exploit attempt or buggy program) -- look up the vsyscall kernel parameter if you need a workaround"); |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 159 | goto sigsegv; |
| 160 | } |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 161 | |
| 162 | if (get_user(caller, (unsigned long __user *)regs->sp) != 0) { |
Andy Lutomirski | 3ae3665 | 2011-08-10 11:15:32 -0400 | [diff] [blame] | 163 | warn_bad_vsyscall(KERN_WARNING, regs, |
| 164 | "vsyscall with bad stack (exploit attempt?)"); |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 165 | goto sigsegv; |
| 166 | } |
| 167 | |
| 168 | tsk = current; |
Andy Lutomirski | 87b526d | 2012-10-01 11:40:45 -0700 | [diff] [blame] | 169 | |
| 170 | /* |
| 171 | * Check for access_ok violations and find the syscall nr. |
| 172 | * |
| 173 | * NULL is a valid user pointer (in the access_ok sense) on 32-bit and |
| 174 | * 64-bit, so we don't need to special-case it here. For all the |
| 175 | * vsyscalls, NULL means "don't write anything" not "write it at |
| 176 | * address 0". |
| 177 | */ |
| 178 | switch (vsyscall_nr) { |
| 179 | case 0: |
| 180 | if (!write_ok_or_segv(regs->di, sizeof(struct timeval)) || |
| 181 | !write_ok_or_segv(regs->si, sizeof(struct timezone))) { |
| 182 | ret = -EFAULT; |
| 183 | goto check_fault; |
| 184 | } |
| 185 | |
| 186 | syscall_nr = __NR_gettimeofday; |
| 187 | break; |
| 188 | |
| 189 | case 1: |
| 190 | if (!write_ok_or_segv(regs->di, sizeof(time_t))) { |
| 191 | ret = -EFAULT; |
| 192 | goto check_fault; |
| 193 | } |
| 194 | |
| 195 | syscall_nr = __NR_time; |
| 196 | break; |
| 197 | |
| 198 | case 2: |
| 199 | if (!write_ok_or_segv(regs->di, sizeof(unsigned)) || |
| 200 | !write_ok_or_segv(regs->si, sizeof(unsigned))) { |
| 201 | ret = -EFAULT; |
| 202 | goto check_fault; |
| 203 | } |
| 204 | |
| 205 | syscall_nr = __NR_getcpu; |
| 206 | break; |
| 207 | } |
| 208 | |
| 209 | /* |
| 210 | * Handle seccomp. regs->ip must be the original value. |
| 211 | * See seccomp_send_sigsys and Documentation/prctl/seccomp_filter.txt. |
| 212 | * |
| 213 | * We could optimize the seccomp disabled case, but performance |
| 214 | * here doesn't matter. |
| 215 | */ |
| 216 | regs->orig_ax = syscall_nr; |
| 217 | regs->ax = -ENOSYS; |
Andy Lutomirski | 2f275de | 2016-05-27 12:57:02 -0700 | [diff] [blame] | 218 | tmp = secure_computing(NULL); |
Andy Lutomirski | 87b526d | 2012-10-01 11:40:45 -0700 | [diff] [blame] | 219 | if ((!tmp && regs->orig_ax != syscall_nr) || regs->ip != address) { |
| 220 | warn_bad_vsyscall(KERN_DEBUG, regs, |
| 221 | "seccomp tried to change syscall nr or ip"); |
| 222 | do_exit(SIGSYS); |
| 223 | } |
Andy Lutomirski | 2689310 | 2014-11-04 15:36:50 -0800 | [diff] [blame] | 224 | regs->orig_ax = -1; |
Andy Lutomirski | 87b526d | 2012-10-01 11:40:45 -0700 | [diff] [blame] | 225 | if (tmp) |
| 226 | goto do_ret; /* skip requested */ |
| 227 | |
Andy Lutomirski | 4fc3490 | 2011-11-07 16:33:40 -0800 | [diff] [blame] | 228 | /* |
| 229 | * With a real vsyscall, page faults cause SIGSEGV. We want to |
| 230 | * preserve that behavior to make writing exploits harder. |
| 231 | */ |
Ingo Molnar | 2a53ccb | 2016-07-15 10:21:11 +0200 | [diff] [blame] | 232 | prev_sig_on_uaccess_err = current->thread.sig_on_uaccess_err; |
| 233 | current->thread.sig_on_uaccess_err = 1; |
Andy Lutomirski | 4fc3490 | 2011-11-07 16:33:40 -0800 | [diff] [blame] | 234 | |
Andy Lutomirski | 4fc3490 | 2011-11-07 16:33:40 -0800 | [diff] [blame] | 235 | ret = -EFAULT; |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 236 | switch (vsyscall_nr) { |
| 237 | case 0: |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 238 | ret = sys_gettimeofday( |
| 239 | (struct timeval __user *)regs->di, |
| 240 | (struct timezone __user *)regs->si); |
| 241 | break; |
| 242 | |
| 243 | case 1: |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 244 | ret = sys_time((time_t __user *)regs->di); |
| 245 | break; |
| 246 | |
| 247 | case 2: |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 248 | ret = sys_getcpu((unsigned __user *)regs->di, |
| 249 | (unsigned __user *)regs->si, |
Emil Goode | 46ed99d | 2012-04-01 20:48:04 +0200 | [diff] [blame] | 250 | NULL); |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 251 | break; |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 252 | } |
| 253 | |
Ingo Molnar | 2a53ccb | 2016-07-15 10:21:11 +0200 | [diff] [blame] | 254 | current->thread.sig_on_uaccess_err = prev_sig_on_uaccess_err; |
Andy Lutomirski | 4fc3490 | 2011-11-07 16:33:40 -0800 | [diff] [blame] | 255 | |
Andy Lutomirski | 87b526d | 2012-10-01 11:40:45 -0700 | [diff] [blame] | 256 | check_fault: |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 257 | if (ret == -EFAULT) { |
Andy Lutomirski | 4fc3490 | 2011-11-07 16:33:40 -0800 | [diff] [blame] | 258 | /* Bad news -- userspace fed a bad pointer to a vsyscall. */ |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 259 | warn_bad_vsyscall(KERN_INFO, regs, |
| 260 | "vsyscall fault (exploit attempt?)"); |
Andy Lutomirski | 4fc3490 | 2011-11-07 16:33:40 -0800 | [diff] [blame] | 261 | |
| 262 | /* |
| 263 | * If we failed to generate a signal for any reason, |
| 264 | * generate one here. (This should be impossible.) |
| 265 | */ |
| 266 | if (WARN_ON_ONCE(!sigismember(&tsk->pending.signal, SIGBUS) && |
| 267 | !sigismember(&tsk->pending.signal, SIGSEGV))) |
| 268 | goto sigsegv; |
| 269 | |
| 270 | return true; /* Don't emulate the ret. */ |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 271 | } |
| 272 | |
| 273 | regs->ax = ret; |
| 274 | |
Will Drewry | 5651721 | 2012-07-13 12:06:35 -0500 | [diff] [blame] | 275 | do_ret: |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 276 | /* Emulate a ret instruction. */ |
| 277 | regs->ip = caller; |
| 278 | regs->sp += 8; |
Andy Lutomirski | 3ae3665 | 2011-08-10 11:15:32 -0400 | [diff] [blame] | 279 | return true; |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 280 | |
| 281 | sigsegv: |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 282 | force_sig(SIGSEGV, current); |
Andy Lutomirski | 3ae3665 | 2011-08-10 11:15:32 -0400 | [diff] [blame] | 283 | return true; |
Andy Lutomirski | 5cec93c | 2011-06-05 13:50:24 -0400 | [diff] [blame] | 284 | } |
| 285 | |
| 286 | /* |
Andy Lutomirski | b935909 | 2014-09-23 10:50:51 -0700 | [diff] [blame] | 287 | * A pseudo VMA to allow ptrace access for the vsyscall page. This only |
| 288 | * covers the 64bit vsyscall page now. 32bit has a real VMA now and does |
| 289 | * not need special handling anymore: |
| 290 | */ |
| 291 | static const char *gate_vma_name(struct vm_area_struct *vma) |
| 292 | { |
| 293 | return "[vsyscall]"; |
| 294 | } |
Kirill A. Shutemov | 7cbea8d | 2015-09-09 15:39:26 -0700 | [diff] [blame] | 295 | static const struct vm_operations_struct gate_vma_ops = { |
Andy Lutomirski | b935909 | 2014-09-23 10:50:51 -0700 | [diff] [blame] | 296 | .name = gate_vma_name, |
| 297 | }; |
| 298 | static struct vm_area_struct gate_vma = { |
| 299 | .vm_start = VSYSCALL_ADDR, |
| 300 | .vm_end = VSYSCALL_ADDR + PAGE_SIZE, |
| 301 | .vm_page_prot = PAGE_READONLY_EXEC, |
| 302 | .vm_flags = VM_READ | VM_EXEC, |
| 303 | .vm_ops = &gate_vma_ops, |
| 304 | }; |
| 305 | |
| 306 | struct vm_area_struct *get_gate_vma(struct mm_struct *mm) |
| 307 | { |
Brian Gerst | c338867 | 2015-06-22 07:55:16 -0400 | [diff] [blame] | 308 | #ifdef CONFIG_COMPAT |
Andy Lutomirski | b935909 | 2014-09-23 10:50:51 -0700 | [diff] [blame] | 309 | if (!mm || mm->context.ia32_compat) |
| 310 | return NULL; |
| 311 | #endif |
Andy Lutomirski | 87983c6 | 2014-10-29 14:33:45 -0700 | [diff] [blame] | 312 | if (vsyscall_mode == NONE) |
| 313 | return NULL; |
Andy Lutomirski | b935909 | 2014-09-23 10:50:51 -0700 | [diff] [blame] | 314 | return &gate_vma; |
| 315 | } |
| 316 | |
| 317 | int in_gate_area(struct mm_struct *mm, unsigned long addr) |
| 318 | { |
| 319 | struct vm_area_struct *vma = get_gate_vma(mm); |
| 320 | |
| 321 | if (!vma) |
| 322 | return 0; |
| 323 | |
| 324 | return (addr >= vma->vm_start) && (addr < vma->vm_end); |
| 325 | } |
| 326 | |
| 327 | /* |
| 328 | * Use this when you have no reliable mm, typically from interrupt |
| 329 | * context. It is less reliable than using a task's mm and may give |
| 330 | * false positives. |
| 331 | */ |
| 332 | int in_gate_area_no_mm(unsigned long addr) |
| 333 | { |
Andy Lutomirski | 87983c6 | 2014-10-29 14:33:45 -0700 | [diff] [blame] | 334 | return vsyscall_mode != NONE && (addr & PAGE_MASK) == VSYSCALL_ADDR; |
Andy Lutomirski | b935909 | 2014-09-23 10:50:51 -0700 | [diff] [blame] | 335 | } |
| 336 | |
Andy Lutomirski | 49275fe | 2017-12-10 22:47:19 -0800 | [diff] [blame] | 337 | /* |
| 338 | * The VSYSCALL page is the only user-accessible page in the kernel address |
| 339 | * range. Normally, the kernel page tables can have _PAGE_USER clear, but |
| 340 | * the tables covering VSYSCALL_ADDR need _PAGE_USER set if vsyscalls |
| 341 | * are enabled. |
| 342 | * |
| 343 | * Some day we may create a "minimal" vsyscall mode in which we emulate |
| 344 | * vsyscalls but leave the page not present. If so, we skip calling |
| 345 | * this. |
| 346 | */ |
Andy Lutomirski | 85900ea | 2017-12-12 07:56:42 -0800 | [diff] [blame] | 347 | void __init set_vsyscall_pgtable_user_bits(pgd_t *root) |
Andy Lutomirski | 49275fe | 2017-12-10 22:47:19 -0800 | [diff] [blame] | 348 | { |
| 349 | pgd_t *pgd; |
| 350 | p4d_t *p4d; |
| 351 | pud_t *pud; |
| 352 | pmd_t *pmd; |
| 353 | |
Andy Lutomirski | 85900ea | 2017-12-12 07:56:42 -0800 | [diff] [blame] | 354 | pgd = pgd_offset_pgd(root, VSYSCALL_ADDR); |
Andy Lutomirski | 49275fe | 2017-12-10 22:47:19 -0800 | [diff] [blame] | 355 | set_pgd(pgd, __pgd(pgd_val(*pgd) | _PAGE_USER)); |
| 356 | p4d = p4d_offset(pgd, VSYSCALL_ADDR); |
| 357 | #if CONFIG_PGTABLE_LEVELS >= 5 |
| 358 | p4d->p4d |= _PAGE_USER; |
| 359 | #endif |
| 360 | pud = pud_offset(p4d, VSYSCALL_ADDR); |
| 361 | set_pud(pud, __pud(pud_val(*pud) | _PAGE_USER)); |
| 362 | pmd = pmd_offset(pud, VSYSCALL_ADDR); |
| 363 | set_pmd(pmd, __pmd(pmd_val(*pmd) | _PAGE_USER)); |
| 364 | } |
| 365 | |
Ingo Molnar | e402644 | 2008-01-30 13:32:39 +0100 | [diff] [blame] | 366 | void __init map_vsyscall(void) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 367 | { |
Andy Lutomirski | 3ae3665 | 2011-08-10 11:15:32 -0400 | [diff] [blame] | 368 | extern char __vsyscall_page; |
| 369 | unsigned long physaddr_vsyscall = __pa_symbol(&__vsyscall_page); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 370 | |
Andy Lutomirski | 49275fe | 2017-12-10 22:47:19 -0800 | [diff] [blame] | 371 | if (vsyscall_mode != NONE) { |
Andy Lutomirski | 87983c6 | 2014-10-29 14:33:45 -0700 | [diff] [blame] | 372 | __set_fixmap(VSYSCALL_PAGE, physaddr_vsyscall, |
| 373 | vsyscall_mode == NATIVE |
| 374 | ? PAGE_KERNEL_VSYSCALL |
| 375 | : PAGE_KERNEL_VVAR); |
Andy Lutomirski | 85900ea | 2017-12-12 07:56:42 -0800 | [diff] [blame] | 376 | set_vsyscall_pgtable_user_bits(swapper_pg_dir); |
Andy Lutomirski | 49275fe | 2017-12-10 22:47:19 -0800 | [diff] [blame] | 377 | } |
Andy Lutomirski | 87983c6 | 2014-10-29 14:33:45 -0700 | [diff] [blame] | 378 | |
Andy Lutomirski | f40c330 | 2014-05-05 12:19:36 -0700 | [diff] [blame] | 379 | BUILD_BUG_ON((unsigned long)__fix_to_virt(VSYSCALL_PAGE) != |
| 380 | (unsigned long)VSYSCALL_ADDR); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 381 | } |