blob: 04c4aa7a1df2c59716abaa12aefdf29fd7d4630c [file] [log] [blame]
Thomas Gleixner09c434b2019-05-19 13:08:20 +01001// SPDX-License-Identifier: GPL-2.0-only
Linus Torvalds1da177e2005-04-16 15:20:36 -07002/*
3 * linux/fs/binfmt_elf.c
4 *
5 * These are the functions used to load ELF format executables as used
6 * on SVr4 machines. Information on the format may be found in the book
7 * "UNIX SYSTEM V RELEASE 4 Programmers Guide: Ansi C and Programming Support
8 * Tools".
9 *
10 * Copyright 1993, 1994: Eric Youngdale (ericy@cais.com).
11 */
12
13#include <linux/module.h>
14#include <linux/kernel.h>
15#include <linux/fs.h>
Chris Kennellyce81bb22020-10-15 20:12:32 -070016#include <linux/log2.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/mm.h>
18#include <linux/mman.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070019#include <linux/errno.h>
20#include <linux/signal.h>
21#include <linux/binfmts.h>
22#include <linux/string.h>
23#include <linux/file.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070024#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025#include <linux/personality.h>
26#include <linux/elfcore.h>
27#include <linux/init.h>
28#include <linux/highuid.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070029#include <linux/compiler.h>
30#include <linux/highmem.h>
Anshuman Khandual03911132020-04-06 20:03:51 -070031#include <linux/hugetlb.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <linux/pagemap.h>
Denys Vlasenko2aa362c2012-10-04 17:15:36 -070033#include <linux/vmalloc.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070034#include <linux/security.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035#include <linux/random.h>
Jesper Juhlf4e5cc22006-06-23 02:05:35 -070036#include <linux/elf.h>
Kees Cookd1fd8362015-04-14 15:48:07 -070037#include <linux/elf-randomize.h>
Alexey Dobriyan7e80d0d2007-05-08 00:28:59 -070038#include <linux/utsname.h>
Daisuke HATAYAMA088e7af2010-03-05 13:44:06 -080039#include <linux/coredump.h>
Frederic Weisbecker6fac4822012-11-13 14:20:55 +010040#include <linux/sched.h>
Ingo Molnarf7ccbae2017-02-08 18:51:30 +010041#include <linux/sched/coredump.h>
Ingo Molnar68db0cf2017-02-08 18:51:37 +010042#include <linux/sched/task_stack.h>
Ingo Molnar32ef5512017-02-05 11:48:36 +010043#include <linux/sched/cputime.h>
Dave Martin00e19ce2020-03-16 16:50:44 +000044#include <linux/sizes.h>
45#include <linux/types.h>
Ingo Molnar5b825c32017-02-02 17:54:15 +010046#include <linux/cred.h>
Ross Zwisler50378352015-10-05 16:33:36 -060047#include <linux/dax.h>
Linus Torvalds7c0f6ba2016-12-24 11:46:01 -080048#include <linux/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070049#include <asm/param.h>
50#include <asm/page.h>
51
Dave Martin00e19ce2020-03-16 16:50:44 +000052#ifndef ELF_COMPAT
53#define ELF_COMPAT 0
54#endif
55
Denys Vlasenko2aa362c2012-10-04 17:15:36 -070056#ifndef user_long_t
57#define user_long_t long
58#endif
Denys Vlasenko49ae4d42012-10-04 17:15:35 -070059#ifndef user_siginfo_t
60#define user_siginfo_t siginfo_t
61#endif
62
Nicolas Pitre47552002017-08-16 16:05:13 -040063/* That's for binfmt_elf_fdpic to deal with */
64#ifndef elf_check_fdpic
65#define elf_check_fdpic(ex) false
66#endif
67
Al Viro71613c32012-10-20 22:00:48 -040068static int load_elf_binary(struct linux_binprm *bprm);
Linus Torvalds1da177e2005-04-16 15:20:36 -070069
Josh Triplett69369a72014-04-03 14:48:27 -070070#ifdef CONFIG_USELIB
71static int load_elf_library(struct file *);
72#else
73#define load_elf_library NULL
74#endif
75
Linus Torvalds1da177e2005-04-16 15:20:36 -070076/*
77 * If we don't support core dumping, then supply a NULL so we
78 * don't even try.
79 */
Christoph Hellwig698ba7b2009-12-15 16:47:37 -080080#ifdef CONFIG_ELF_CORE
Masami Hiramatsuf6151df2009-12-17 15:27:16 -080081static int elf_core_dump(struct coredump_params *cprm);
Linus Torvalds1da177e2005-04-16 15:20:36 -070082#else
83#define elf_core_dump NULL
84#endif
85
86#if ELF_EXEC_PAGESIZE > PAGE_SIZE
Jesper Juhlf4e5cc22006-06-23 02:05:35 -070087#define ELF_MIN_ALIGN ELF_EXEC_PAGESIZE
Linus Torvalds1da177e2005-04-16 15:20:36 -070088#else
Jesper Juhlf4e5cc22006-06-23 02:05:35 -070089#define ELF_MIN_ALIGN PAGE_SIZE
Linus Torvalds1da177e2005-04-16 15:20:36 -070090#endif
91
92#ifndef ELF_CORE_EFLAGS
93#define ELF_CORE_EFLAGS 0
94#endif
95
96#define ELF_PAGESTART(_v) ((_v) & ~(unsigned long)(ELF_MIN_ALIGN-1))
97#define ELF_PAGEOFFSET(_v) ((_v) & (ELF_MIN_ALIGN-1))
98#define ELF_PAGEALIGN(_v) (((_v) + ELF_MIN_ALIGN - 1) & ~(ELF_MIN_ALIGN - 1))
99
100static struct linux_binfmt elf_format = {
Mikael Petterssonf670d0e2011-01-12 17:00:02 -0800101 .module = THIS_MODULE,
102 .load_binary = load_elf_binary,
103 .load_shlib = load_elf_library,
104 .core_dump = elf_core_dump,
105 .min_coredump = ELF_EXEC_PAGESIZE,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106};
107
Alexey Dobriyan18676ff2020-01-30 22:17:01 -0800108#define BAD_ADDR(x) (unlikely((unsigned long)(x) >= TASK_SIZE))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800110static int set_brk(unsigned long start, unsigned long end, int prot)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111{
112 start = ELF_PAGEALIGN(start);
113 end = ELF_PAGEALIGN(end);
114 if (end > start) {
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800115 /*
116 * Map the last of the bss segment.
117 * If the header is requesting these pages to be
118 * executable, honour that (ppc32 needs this).
119 */
120 int error = vm_brk_flags(start, end - start,
121 prot & PROT_EXEC ? VM_EXEC : 0);
Linus Torvalds5d22fc22016-05-27 15:57:31 -0700122 if (error)
123 return error;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124 }
125 current->mm->start_brk = current->mm->brk = end;
126 return 0;
127}
128
Linus Torvalds1da177e2005-04-16 15:20:36 -0700129/* We need to explicitly zero any fractional pages
130 after the data section (i.e. bss). This would
131 contain the junk from the file that should not
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700132 be in memory
133 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134static int padzero(unsigned long elf_bss)
135{
136 unsigned long nbyte;
137
138 nbyte = ELF_PAGEOFFSET(elf_bss);
139 if (nbyte) {
140 nbyte = ELF_MIN_ALIGN - nbyte;
141 if (clear_user((void __user *) elf_bss, nbyte))
142 return -EFAULT;
143 }
144 return 0;
145}
146
/*
 * Helpers that hide the stack growth direction from create_elf_tables():
 *
 *   STACK_ADD(sp, items)   - address 'items' elf_addr_t slots further
 *                            along the growth direction from sp
 *   STACK_ROUND(sp, items) - 16-byte aligned address 'items' slots
 *                            further along the growth direction
 *   STACK_ALLOC(sp, len)   - reserve len bytes, updating sp in place, and
 *                            evaluate to the start of the reserved area
 *
 * Every macro argument is parenthesized so that compound expressions
 * expand with the intended precedence.
 */
#ifdef CONFIG_STACK_GROWSUP
#define STACK_ADD(sp, items) ((elf_addr_t __user *)(sp) + (items))
#define STACK_ROUND(sp, items) \
	((15 + (unsigned long) ((sp) + (items))) &~ 15UL)
#define STACK_ALLOC(sp, len) ({ \
	elf_addr_t __user *old_sp = (elf_addr_t __user *)(sp); (sp) += (len); \
	old_sp; })
#else
#define STACK_ADD(sp, items) ((elf_addr_t __user *)(sp) - (items))
#define STACK_ROUND(sp, items) \
	(((unsigned long) ((sp) - (items))) &~ 15UL)
#define STACK_ALLOC(sp, len) ({ (sp) -= (len); (sp); })
#endif
161
Nathan Lynch483fad12008-07-22 04:48:46 +1000162#ifndef ELF_BASE_PLATFORM
163/*
164 * AT_BASE_PLATFORM indicates the "real" hardware/microarchitecture.
165 * If the arch defines ELF_BASE_PLATFORM (in asm/elf.h), the value
166 * will be copied to the user stack in the same manner as AT_PLATFORM.
167 */
168#define ELF_BASE_PLATFORM NULL
169#endif
170
Linus Torvalds1da177e2005-04-16 15:20:36 -0700171static int
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800172create_elf_tables(struct linux_binprm *bprm, const struct elfhdr *exec,
173 unsigned long load_addr, unsigned long interp_load_addr,
174 unsigned long e_entry)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700175{
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800176 struct mm_struct *mm = current->mm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177 unsigned long p = bprm->p;
178 int argc = bprm->argc;
179 int envc = bprm->envc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180 elf_addr_t __user *sp;
181 elf_addr_t __user *u_platform;
Nathan Lynch483fad12008-07-22 04:48:46 +1000182 elf_addr_t __user *u_base_platform;
Kees Cookf06295b2009-01-07 18:08:52 -0800183 elf_addr_t __user *u_rand_bytes;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184 const char *k_platform = ELF_PLATFORM;
Nathan Lynch483fad12008-07-22 04:48:46 +1000185 const char *k_base_platform = ELF_BASE_PLATFORM;
Kees Cookf06295b2009-01-07 18:08:52 -0800186 unsigned char k_rand_bytes[16];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700187 int items;
188 elf_addr_t *elf_info;
Alexey Dobriyan1f83d802020-01-30 22:16:50 -0800189 int ei_index;
David Howells86a264a2008-11-14 10:39:18 +1100190 const struct cred *cred = current_cred();
Ollie Wildb6a2fea2007-07-19 01:48:16 -0700191 struct vm_area_struct *vma;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192
193 /*
Franck Bui-Huud68c9d62007-10-16 23:30:24 -0700194 * In some cases (e.g. Hyper-Threading), we want to avoid L1
195 * evictions by the processes running on the same package. One
196 * thing we can do is to shuffle the initial stack for them.
197 */
198
199 p = arch_align_stack(p);
200
201 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700202 * If this architecture has a platform capability string, copy it
203 * to userspace. In some cases (Sparc), this info is impossible
204 * for userspace to get any other way, in others (i386) it is
205 * merely difficult.
206 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700207 u_platform = NULL;
208 if (k_platform) {
209 size_t len = strlen(k_platform) + 1;
210
Linus Torvalds1da177e2005-04-16 15:20:36 -0700211 u_platform = (elf_addr_t __user *)STACK_ALLOC(p, len);
Al Viro646e84d2020-02-19 09:23:34 -0500212 if (copy_to_user(u_platform, k_platform, len))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213 return -EFAULT;
214 }
215
Nathan Lynch483fad12008-07-22 04:48:46 +1000216 /*
217 * If this architecture has a "base" platform capability
218 * string, copy it to userspace.
219 */
220 u_base_platform = NULL;
221 if (k_base_platform) {
222 size_t len = strlen(k_base_platform) + 1;
223
224 u_base_platform = (elf_addr_t __user *)STACK_ALLOC(p, len);
Al Viro646e84d2020-02-19 09:23:34 -0500225 if (copy_to_user(u_base_platform, k_base_platform, len))
Nathan Lynch483fad12008-07-22 04:48:46 +1000226 return -EFAULT;
227 }
228
Kees Cookf06295b2009-01-07 18:08:52 -0800229 /*
230 * Generate 16 random bytes for userspace PRNG seeding.
231 */
232 get_random_bytes(k_rand_bytes, sizeof(k_rand_bytes));
233 u_rand_bytes = (elf_addr_t __user *)
234 STACK_ALLOC(p, sizeof(k_rand_bytes));
Al Viro646e84d2020-02-19 09:23:34 -0500235 if (copy_to_user(u_rand_bytes, k_rand_bytes, sizeof(k_rand_bytes)))
Kees Cookf06295b2009-01-07 18:08:52 -0800236 return -EFAULT;
237
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238 /* Create the ELF interpreter info */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800239 elf_info = (elf_addr_t *)mm->saved_auxv;
Olaf Hering4f9a58d2007-10-16 23:30:12 -0700240 /* update AT_VECTOR_SIZE_BASE if the number of NEW_AUX_ENT() changes */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241#define NEW_AUX_ENT(id, val) \
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700242 do { \
Alexey Dobriyan1f83d802020-01-30 22:16:50 -0800243 *elf_info++ = id; \
244 *elf_info++ = val; \
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700245 } while (0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246
247#ifdef ARCH_DLINFO
248 /*
249 * ARCH_DLINFO must come first so PPC can do its special alignment of
250 * AUXV.
Olaf Hering4f9a58d2007-10-16 23:30:12 -0700251 * update AT_VECTOR_SIZE_ARCH if the number of NEW_AUX_ENT() in
252 * ARCH_DLINFO changes
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253 */
254 ARCH_DLINFO;
255#endif
256 NEW_AUX_ENT(AT_HWCAP, ELF_HWCAP);
257 NEW_AUX_ENT(AT_PAGESZ, ELF_EXEC_PAGESIZE);
258 NEW_AUX_ENT(AT_CLKTCK, CLOCKS_PER_SEC);
259 NEW_AUX_ENT(AT_PHDR, load_addr + exec->e_phoff);
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700260 NEW_AUX_ENT(AT_PHENT, sizeof(struct elf_phdr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261 NEW_AUX_ENT(AT_PHNUM, exec->e_phnum);
262 NEW_AUX_ENT(AT_BASE, interp_load_addr);
263 NEW_AUX_ENT(AT_FLAGS, 0);
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800264 NEW_AUX_ENT(AT_ENTRY, e_entry);
Eric W. Biedermanebc887b2012-02-07 18:36:10 -0800265 NEW_AUX_ENT(AT_UID, from_kuid_munged(cred->user_ns, cred->uid));
266 NEW_AUX_ENT(AT_EUID, from_kuid_munged(cred->user_ns, cred->euid));
267 NEW_AUX_ENT(AT_GID, from_kgid_munged(cred->user_ns, cred->gid));
268 NEW_AUX_ENT(AT_EGID, from_kgid_munged(cred->user_ns, cred->egid));
Kees Cookc425e182017-07-18 15:25:22 -0700269 NEW_AUX_ENT(AT_SECURE, bprm->secureexec);
Kees Cookf06295b2009-01-07 18:08:52 -0800270 NEW_AUX_ENT(AT_RANDOM, (elf_addr_t)(unsigned long)u_rand_bytes);
Michael Neuling21713642013-04-17 17:33:11 +0000271#ifdef ELF_HWCAP2
272 NEW_AUX_ENT(AT_HWCAP2, ELF_HWCAP2);
273#endif
John Reiser65191082008-07-21 14:21:32 -0700274 NEW_AUX_ENT(AT_EXECFN, bprm->exec);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275 if (k_platform) {
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700276 NEW_AUX_ENT(AT_PLATFORM,
Jesper Juhl785d5572006-06-23 02:05:35 -0700277 (elf_addr_t)(unsigned long)u_platform);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700278 }
Nathan Lynch483fad12008-07-22 04:48:46 +1000279 if (k_base_platform) {
280 NEW_AUX_ENT(AT_BASE_PLATFORM,
281 (elf_addr_t)(unsigned long)u_base_platform);
282 }
Eric W. Biedermanb8a61c92020-05-14 15:17:40 -0500283 if (bprm->have_execfd) {
284 NEW_AUX_ENT(AT_EXECFD, bprm->execfd);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700285 }
286#undef NEW_AUX_ENT
287 /* AT_NULL is zero; clear the rest too */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800288 memset(elf_info, 0, (char *)mm->saved_auxv +
289 sizeof(mm->saved_auxv) - (char *)elf_info);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290
291 /* And advance past the AT_NULL entry. */
Alexey Dobriyan1f83d802020-01-30 22:16:50 -0800292 elf_info += 2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800294 ei_index = elf_info - (elf_addr_t *)mm->saved_auxv;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295 sp = STACK_ADD(p, ei_index);
296
Andi Kleend20894a2008-02-08 04:21:54 -0800297 items = (argc + 1) + (envc + 1) + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298 bprm->p = STACK_ROUND(sp, items);
299
300 /* Point sp at the lowest address on the stack */
301#ifdef CONFIG_STACK_GROWSUP
302 sp = (elf_addr_t __user *)bprm->p - items - ei_index;
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700303 bprm->exec = (unsigned long)sp; /* XXX: PARISC HACK */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700304#else
305 sp = (elf_addr_t __user *)bprm->p;
306#endif
307
Ollie Wildb6a2fea2007-07-19 01:48:16 -0700308
309 /*
310 * Grow the stack manually; some architectures have a limit on how
311 * far ahead a user-space access may be in order to grow the stack.
312 */
Jann Hornb2767d92020-10-17 16:14:15 -0700313 if (mmap_read_lock_killable(mm))
314 return -EINTR;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800315 vma = find_extend_vma(mm, bprm->p);
Jann Hornb2767d92020-10-17 16:14:15 -0700316 mmap_read_unlock(mm);
Ollie Wildb6a2fea2007-07-19 01:48:16 -0700317 if (!vma)
318 return -EFAULT;
319
Linus Torvalds1da177e2005-04-16 15:20:36 -0700320 /* Now, let's put argc (and argv, envp if appropriate) on the stack */
Al Viro646e84d2020-02-19 09:23:34 -0500321 if (put_user(argc, sp++))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700322 return -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323
Kees Cook67c67772017-07-10 15:52:54 -0700324 /* Populate list of argv pointers back to argv strings. */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800325 p = mm->arg_end = mm->arg_start;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700326 while (argc-- > 0) {
327 size_t len;
Al Viro646e84d2020-02-19 09:23:34 -0500328 if (put_user((elf_addr_t)p, sp++))
Heiko Carstens841d5fb2006-12-06 20:36:35 -0800329 return -EFAULT;
Ollie Wildb6a2fea2007-07-19 01:48:16 -0700330 len = strnlen_user((void __user *)p, MAX_ARG_STRLEN);
331 if (!len || len > MAX_ARG_STRLEN)
WANG Cong23c49712008-05-08 21:52:33 +0800332 return -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700333 p += len;
334 }
Al Viro646e84d2020-02-19 09:23:34 -0500335 if (put_user(0, sp++))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336 return -EFAULT;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800337 mm->arg_end = p;
Kees Cook67c67772017-07-10 15:52:54 -0700338
339 /* Populate list of envp pointers back to envp strings. */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800340 mm->env_end = mm->env_start = p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341 while (envc-- > 0) {
342 size_t len;
Al Viro646e84d2020-02-19 09:23:34 -0500343 if (put_user((elf_addr_t)p, sp++))
Heiko Carstens841d5fb2006-12-06 20:36:35 -0800344 return -EFAULT;
Ollie Wildb6a2fea2007-07-19 01:48:16 -0700345 len = strnlen_user((void __user *)p, MAX_ARG_STRLEN);
346 if (!len || len > MAX_ARG_STRLEN)
WANG Cong23c49712008-05-08 21:52:33 +0800347 return -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700348 p += len;
349 }
Al Viro646e84d2020-02-19 09:23:34 -0500350 if (put_user(0, sp++))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351 return -EFAULT;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800352 mm->env_end = p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700353
354 /* Put the elf_info on the stack in the right place. */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800355 if (copy_to_user(sp, mm->saved_auxv, ei_index * sizeof(elf_addr_t)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356 return -EFAULT;
357 return 0;
358}
359
Linus Torvalds1da177e2005-04-16 15:20:36 -0700360static unsigned long elf_map(struct file *filep, unsigned long addr,
Alexey Dobriyan49ac9812019-03-07 16:29:03 -0800361 const struct elf_phdr *eppnt, int prot, int type,
Jiri Kosinacc503c12008-01-30 13:31:07 +0100362 unsigned long total_size)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363{
364 unsigned long map_addr;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100365 unsigned long size = eppnt->p_filesz + ELF_PAGEOFFSET(eppnt->p_vaddr);
366 unsigned long off = eppnt->p_offset - ELF_PAGEOFFSET(eppnt->p_vaddr);
367 addr = ELF_PAGESTART(addr);
368 size = ELF_PAGEALIGN(size);
Jan Kratochvil60bfba72007-07-15 23:40:06 -0700369
Andrew Mortond4e3cc32007-07-21 04:37:32 -0700370 /* mmap() will return -EINVAL if given a zero size, but a
371 * segment with zero filesize is perfectly valid */
Jiri Kosinacc503c12008-01-30 13:31:07 +0100372 if (!size)
373 return addr;
374
Jiri Kosinacc503c12008-01-30 13:31:07 +0100375 /*
376 * total_size is the size of the ELF (interpreter) image.
377 * The _first_ mmap needs to know the full size, otherwise
378 * randomization might put this image into an overlapping
379 * position with the ELF binary image. (since size < total_size)
380 * So we first map the 'big' image - and unmap the remainder at
381 * the end. (which unmap is needed for ELF images with holes.)
382 */
383 if (total_size) {
384 total_size = ELF_PAGEALIGN(total_size);
Al Viro5a5e4c22012-05-30 01:49:38 -0400385 map_addr = vm_mmap(filep, addr, total_size, prot, type, off);
Jiri Kosinacc503c12008-01-30 13:31:07 +0100386 if (!BAD_ADDR(map_addr))
Al Viro5a5e4c22012-05-30 01:49:38 -0400387 vm_munmap(map_addr+size, total_size-size);
Jiri Kosinacc503c12008-01-30 13:31:07 +0100388 } else
Al Viro5a5e4c22012-05-30 01:49:38 -0400389 map_addr = vm_mmap(filep, addr, size, prot, type, off);
Jiri Kosinacc503c12008-01-30 13:31:07 +0100390
Tetsuo Handad23a61e2018-04-20 14:56:13 -0700391 if ((type & MAP_FIXED_NOREPLACE) &&
392 PTR_ERR((void *)map_addr) == -EEXIST)
393 pr_info("%d (%s): Uhuuh, elf segment at %px requested but the memory is mapped already\n",
394 task_pid_nr(current), current->comm, (void *)addr);
Michal Hocko4ed28632018-04-10 16:36:01 -0700395
Linus Torvalds1da177e2005-04-16 15:20:36 -0700396 return(map_addr);
397}
398
Alexey Dobriyan49ac9812019-03-07 16:29:03 -0800399static unsigned long total_mapping_size(const struct elf_phdr *cmds, int nr)
Jiri Kosinacc503c12008-01-30 13:31:07 +0100400{
401 int i, first_idx = -1, last_idx = -1;
402
403 for (i = 0; i < nr; i++) {
404 if (cmds[i].p_type == PT_LOAD) {
405 last_idx = i;
406 if (first_idx == -1)
407 first_idx = i;
408 }
409 }
410 if (first_idx == -1)
411 return 0;
412
413 return cmds[last_idx].p_vaddr + cmds[last_idx].p_memsz -
414 ELF_PAGESTART(cmds[first_idx].p_vaddr);
415}
416
Alexey Dobriyan658c0332019-12-04 16:52:25 -0800417static int elf_read(struct file *file, void *buf, size_t len, loff_t pos)
418{
419 ssize_t rv;
420
421 rv = kernel_read(file, buf, len, &pos);
422 if (unlikely(rv != len)) {
423 return (rv < 0) ? rv : -EIO;
424 }
425 return 0;
426}
427
Chris Kennellyce81bb22020-10-15 20:12:32 -0700428static unsigned long maximum_alignment(struct elf_phdr *cmds, int nr)
429{
430 unsigned long alignment = 0;
431 int i;
432
433 for (i = 0; i < nr; i++) {
434 if (cmds[i].p_type == PT_LOAD) {
435 unsigned long p_align = cmds[i].p_align;
436
437 /* skip non-power of two alignments as invalid */
438 if (!is_power_of_2(p_align))
439 continue;
440 alignment = max(alignment, p_align);
441 }
442 }
443
444 /* ensure we align to at least one page */
445 return ELF_PAGEALIGN(alignment);
446}
447
Paul Burton6a8d3892014-09-11 08:30:14 +0100448/**
449 * load_elf_phdrs() - load ELF program headers
450 * @elf_ex: ELF header of the binary whose program headers should be loaded
451 * @elf_file: the opened ELF binary file
452 *
453 * Loads ELF program headers from the binary file elf_file, which has the ELF
454 * header pointed to by elf_ex, into a newly allocated array. The caller is
455 * responsible for freeing the allocated data. Returns an ERR_PTR upon failure.
456 */
Alexey Dobriyan49ac9812019-03-07 16:29:03 -0800457static struct elf_phdr *load_elf_phdrs(const struct elfhdr *elf_ex,
Paul Burton6a8d3892014-09-11 08:30:14 +0100458 struct file *elf_file)
459{
460 struct elf_phdr *elf_phdata = NULL;
Alexey Dobriyanfaf1c312019-03-07 16:28:56 -0800461 int retval, err = -1;
Alexey Dobriyanfaf1c312019-03-07 16:28:56 -0800462 unsigned int size;
Paul Burton6a8d3892014-09-11 08:30:14 +0100463
464 /*
465 * If the size of this structure has changed, then punt, since
466 * we will be doing the wrong thing.
467 */
468 if (elf_ex->e_phentsize != sizeof(struct elf_phdr))
469 goto out;
470
471 /* Sanity check the number of program headers... */
Paul Burton6a8d3892014-09-11 08:30:14 +0100472 /* ...and their total size. */
473 size = sizeof(struct elf_phdr) * elf_ex->e_phnum;
Alexey Dobriyanfaf1c312019-03-07 16:28:56 -0800474 if (size == 0 || size > 65536 || size > ELF_MIN_ALIGN)
Paul Burton6a8d3892014-09-11 08:30:14 +0100475 goto out;
476
477 elf_phdata = kmalloc(size, GFP_KERNEL);
478 if (!elf_phdata)
479 goto out;
480
481 /* Read in the program headers */
Alexey Dobriyan658c0332019-12-04 16:52:25 -0800482 retval = elf_read(elf_file, elf_phdata, size, elf_ex->e_phoff);
483 if (retval < 0) {
484 err = retval;
Paul Burton6a8d3892014-09-11 08:30:14 +0100485 goto out;
486 }
487
488 /* Success! */
489 err = 0;
490out:
491 if (err) {
492 kfree(elf_phdata);
493 elf_phdata = NULL;
494 }
495 return elf_phdata;
496}
Jiri Kosinacc503c12008-01-30 13:31:07 +0100497
Paul Burton774c1052014-09-11 08:30:16 +0100498#ifndef CONFIG_ARCH_BINFMT_ELF_STATE
499
500/**
501 * struct arch_elf_state - arch-specific ELF loading state
502 *
503 * This structure is used to preserve architecture specific data during
504 * the loading of an ELF file, throughout the checking of architecture
505 * specific ELF headers & through to the point where the ELF load is
506 * known to be proceeding (ie. SET_PERSONALITY).
507 *
508 * This implementation is a dummy for architectures which require no
509 * specific state.
510 */
511struct arch_elf_state {
512};
513
514#define INIT_ARCH_ELF_STATE {}
515
516/**
517 * arch_elf_pt_proc() - check a PT_LOPROC..PT_HIPROC ELF program header
518 * @ehdr: The main ELF header
519 * @phdr: The program header to check
520 * @elf: The open ELF file
521 * @is_interp: True if the phdr is from the interpreter of the ELF being
522 * loaded, else false.
523 * @state: Architecture-specific state preserved throughout the process
524 * of loading the ELF.
525 *
526 * Inspects the program header phdr to validate its correctness and/or
527 * suitability for the system. Called once per ELF program header in the
528 * range PT_LOPROC to PT_HIPROC, for both the ELF being loaded and its
529 * interpreter.
530 *
531 * Return: Zero to proceed with the ELF load, non-zero to fail the ELF load
532 * with that return code.
533 */
534static inline int arch_elf_pt_proc(struct elfhdr *ehdr,
535 struct elf_phdr *phdr,
536 struct file *elf, bool is_interp,
537 struct arch_elf_state *state)
538{
539 /* Dummy implementation, always proceed */
540 return 0;
541}
542
543/**
Maciej W. Rozycki54d157142015-10-26 15:47:57 +0000544 * arch_check_elf() - check an ELF executable
Paul Burton774c1052014-09-11 08:30:16 +0100545 * @ehdr: The main ELF header
546 * @has_interp: True if the ELF has an interpreter, else false.
Maciej W. Rozyckieb4bc072015-11-13 00:47:48 +0000547 * @interp_ehdr: The interpreter's ELF header
Paul Burton774c1052014-09-11 08:30:16 +0100548 * @state: Architecture-specific state preserved throughout the process
549 * of loading the ELF.
550 *
551 * Provides a final opportunity for architecture code to reject the loading
552 * of the ELF & cause an exec syscall to return an error. This is called after
553 * all program headers to be checked by arch_elf_pt_proc have been.
554 *
555 * Return: Zero to proceed with the ELF load, non-zero to fail the ELF load
556 * with that return code.
557 */
558static inline int arch_check_elf(struct elfhdr *ehdr, bool has_interp,
Maciej W. Rozyckieb4bc072015-11-13 00:47:48 +0000559 struct elfhdr *interp_ehdr,
Paul Burton774c1052014-09-11 08:30:16 +0100560 struct arch_elf_state *state)
561{
562 /* Dummy implementation, always proceed */
563 return 0;
564}
565
566#endif /* !CONFIG_ARCH_BINFMT_ELF_STATE */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700567
Dave Martinfe0f6762020-03-16 16:50:46 +0000568static inline int make_prot(u32 p_flags, struct arch_elf_state *arch_state,
569 bool has_interp, bool is_interp)
Alexey Dobriyand8e7cb32019-05-14 15:43:51 -0700570{
571 int prot = 0;
572
573 if (p_flags & PF_R)
574 prot |= PROT_READ;
575 if (p_flags & PF_W)
576 prot |= PROT_WRITE;
577 if (p_flags & PF_X)
578 prot |= PROT_EXEC;
Dave Martinfe0f6762020-03-16 16:50:46 +0000579
580 return arch_elf_adjust_prot(prot, arch_state, has_interp, is_interp);
Alexey Dobriyand8e7cb32019-05-14 15:43:51 -0700581}
582
Linus Torvalds1da177e2005-04-16 15:20:36 -0700583/* This is much more generalized than the library routine read function,
584 so we keep this separate. Technically the library read function
585 is only provided so that we can read a.out libraries that have
586 an ELF header */
587
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700588static unsigned long load_elf_interp(struct elfhdr *interp_elf_ex,
Alexey Dobriyan81696d52019-12-04 16:52:22 -0800589 struct file *interpreter,
Dave Martinfe0f6762020-03-16 16:50:46 +0000590 unsigned long no_base, struct elf_phdr *interp_elf_phdata,
591 struct arch_elf_state *arch_state)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700592{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593 struct elf_phdr *eppnt;
594 unsigned long load_addr = 0;
595 int load_addr_set = 0;
596 unsigned long last_bss = 0, elf_bss = 0;
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800597 int bss_prot = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700598 unsigned long error = ~0UL;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100599 unsigned long total_size;
Paul Burton6a8d3892014-09-11 08:30:14 +0100600 int i;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700601
602 /* First of all, some simple consistency checks */
603 if (interp_elf_ex->e_type != ET_EXEC &&
604 interp_elf_ex->e_type != ET_DYN)
605 goto out;
Nicolas Pitre47552002017-08-16 16:05:13 -0400606 if (!elf_check_arch(interp_elf_ex) ||
607 elf_check_fdpic(interp_elf_ex))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700608 goto out;
Al Viro72c2d532013-09-22 16:27:52 -0400609 if (!interpreter->f_op->mmap)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700610 goto out;
611
Paul Burtona9d9ef12014-09-11 08:30:15 +0100612 total_size = total_mapping_size(interp_elf_phdata,
613 interp_elf_ex->e_phnum);
Jiri Kosinacc503c12008-01-30 13:31:07 +0100614 if (!total_size) {
615 error = -EINVAL;
Paul Burtona9d9ef12014-09-11 08:30:15 +0100616 goto out;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100617 }
618
Paul Burtona9d9ef12014-09-11 08:30:15 +0100619 eppnt = interp_elf_phdata;
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700620 for (i = 0; i < interp_elf_ex->e_phnum; i++, eppnt++) {
621 if (eppnt->p_type == PT_LOAD) {
622 int elf_type = MAP_PRIVATE | MAP_DENYWRITE;
Dave Martinfe0f6762020-03-16 16:50:46 +0000623 int elf_prot = make_prot(eppnt->p_flags, arch_state,
624 true, true);
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700625 unsigned long vaddr = 0;
626 unsigned long k, map_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700627
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700628 vaddr = eppnt->p_vaddr;
629 if (interp_elf_ex->e_type == ET_EXEC || load_addr_set)
Chen Jingwen15fd3952021-09-28 20:56:57 +0800630 elf_type |= MAP_FIXED;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100631 else if (no_base && interp_elf_ex->e_type == ET_DYN)
632 load_addr = -vaddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700633
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700634 map_addr = elf_map(interpreter, load_addr + vaddr,
Andrew Mortonbb1ad822008-01-30 13:31:07 +0100635 eppnt, elf_prot, elf_type, total_size);
Jiri Kosinacc503c12008-01-30 13:31:07 +0100636 total_size = 0;
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700637 error = map_addr;
638 if (BAD_ADDR(map_addr))
Paul Burtona9d9ef12014-09-11 08:30:15 +0100639 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700640
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700641 if (!load_addr_set &&
642 interp_elf_ex->e_type == ET_DYN) {
643 load_addr = map_addr - ELF_PAGESTART(vaddr);
644 load_addr_set = 1;
645 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700646
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700647 /*
648 * Check to see if the section's size will overflow the
649 * allowed task size. Note that p_filesz must always be
650 * <= p_memsize so it's only necessary to check p_memsz.
651 */
652 k = load_addr + eppnt->p_vaddr;
Chuck Ebbertce510592006-07-03 00:24:14 -0700653 if (BAD_ADDR(k) ||
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700654 eppnt->p_filesz > eppnt->p_memsz ||
655 eppnt->p_memsz > TASK_SIZE ||
656 TASK_SIZE - eppnt->p_memsz < k) {
657 error = -ENOMEM;
Paul Burtona9d9ef12014-09-11 08:30:15 +0100658 goto out;
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700659 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700660
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700661 /*
662 * Find the end of the file mapping for this phdr, and
663 * keep track of the largest address we see for this.
664 */
665 k = load_addr + eppnt->p_vaddr + eppnt->p_filesz;
666 if (k > elf_bss)
667 elf_bss = k;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700668
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700669 /*
670 * Do the same thing for the memory mapping - between
671 * elf_bss and last_bss is the bss section.
672 */
Kees Cook0036d1f2016-08-02 14:04:51 -0700673 k = load_addr + eppnt->p_vaddr + eppnt->p_memsz;
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800674 if (k > last_bss) {
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700675 last_bss = k;
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800676 bss_prot = elf_prot;
677 }
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700678 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700679 }
680
Kees Cook0036d1f2016-08-02 14:04:51 -0700681 /*
682 * Now fill out the bss section: first pad the last page from
683 * the file up to the page boundary, and zero it from elf_bss
684 * up to the end of the page.
685 */
686 if (padzero(elf_bss)) {
687 error = -EFAULT;
688 goto out;
689 }
690 /*
691 * Next, align both the file and mem bss up to the page size,
692 * since this is where elf_bss was just zeroed up to, and where
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800693 * last_bss will end after the vm_brk_flags() below.
Kees Cook0036d1f2016-08-02 14:04:51 -0700694 */
695 elf_bss = ELF_PAGEALIGN(elf_bss);
696 last_bss = ELF_PAGEALIGN(last_bss);
697 /* Finally, if there is still more bss to allocate, do it. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700698 if (last_bss > elf_bss) {
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800699 error = vm_brk_flags(elf_bss, last_bss - elf_bss,
700 bss_prot & PROT_EXEC ? VM_EXEC : 0);
Linus Torvalds5d22fc22016-05-27 15:57:31 -0700701 if (error)
Paul Burtona9d9ef12014-09-11 08:30:15 +0100702 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700703 }
704
Jiri Kosinacc503c12008-01-30 13:31:07 +0100705 error = load_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700706out:
707 return error;
708}
709
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710/*
711 * These are the functions used to load ELF style executables and shared
712 * libraries. There is no binary dependent code anywhere else.
713 */
714
Dave Martin00e19ce2020-03-16 16:50:44 +0000715static int parse_elf_property(const char *data, size_t *off, size_t datasz,
716 struct arch_elf_state *arch,
717 bool have_prev_type, u32 *prev_type)
718{
719 size_t o, step;
720 const struct gnu_property *pr;
721 int ret;
722
723 if (*off == datasz)
724 return -ENOENT;
725
726 if (WARN_ON_ONCE(*off > datasz || *off % ELF_GNU_PROPERTY_ALIGN))
727 return -EIO;
728 o = *off;
729 datasz -= *off;
730
731 if (datasz < sizeof(*pr))
732 return -ENOEXEC;
733 pr = (const struct gnu_property *)(data + o);
734 o += sizeof(*pr);
735 datasz -= sizeof(*pr);
736
737 if (pr->pr_datasz > datasz)
738 return -ENOEXEC;
739
740 WARN_ON_ONCE(o % ELF_GNU_PROPERTY_ALIGN);
741 step = round_up(pr->pr_datasz, ELF_GNU_PROPERTY_ALIGN);
742 if (step > datasz)
743 return -ENOEXEC;
744
745 /* Properties are supposed to be unique and sorted on pr_type: */
746 if (have_prev_type && pr->pr_type <= *prev_type)
747 return -ENOEXEC;
748 *prev_type = pr->pr_type;
749
750 ret = arch_parse_elf_property(pr->pr_type, data + o,
751 pr->pr_datasz, ELF_COMPAT, arch);
752 if (ret)
753 return ret;
754
755 *off = o + step;
756 return 0;
757}
758
759#define NOTE_DATA_SZ SZ_1K
760#define GNU_PROPERTY_TYPE_0_NAME "GNU"
761#define NOTE_NAME_SZ (sizeof(GNU_PROPERTY_TYPE_0_NAME))
762
763static int parse_elf_properties(struct file *f, const struct elf_phdr *phdr,
764 struct arch_elf_state *arch)
765{
766 union {
767 struct elf_note nhdr;
768 char data[NOTE_DATA_SZ];
769 } note;
770 loff_t pos;
771 ssize_t n;
772 size_t off, datasz;
773 int ret;
774 bool have_prev_type;
775 u32 prev_type;
776
777 if (!IS_ENABLED(CONFIG_ARCH_USE_GNU_PROPERTY) || !phdr)
778 return 0;
779
780 /* load_elf_binary() shouldn't call us unless this is true... */
781 if (WARN_ON_ONCE(phdr->p_type != PT_GNU_PROPERTY))
782 return -ENOEXEC;
783
784 /* If the properties are crazy large, that's too bad (for now): */
785 if (phdr->p_filesz > sizeof(note))
786 return -ENOEXEC;
787
788 pos = phdr->p_offset;
789 n = kernel_read(f, &note, phdr->p_filesz, &pos);
790
791 BUILD_BUG_ON(sizeof(note) < sizeof(note.nhdr) + NOTE_NAME_SZ);
792 if (n < 0 || n < sizeof(note.nhdr) + NOTE_NAME_SZ)
793 return -EIO;
794
795 if (note.nhdr.n_type != NT_GNU_PROPERTY_TYPE_0 ||
796 note.nhdr.n_namesz != NOTE_NAME_SZ ||
797 strncmp(note.data + sizeof(note.nhdr),
798 GNU_PROPERTY_TYPE_0_NAME, n - sizeof(note.nhdr)))
799 return -ENOEXEC;
800
801 off = round_up(sizeof(note.nhdr) + NOTE_NAME_SZ,
802 ELF_GNU_PROPERTY_ALIGN);
803 if (off > n)
804 return -ENOEXEC;
805
806 if (note.nhdr.n_descsz > n - off)
807 return -ENOEXEC;
808 datasz = off + note.nhdr.n_descsz;
809
810 have_prev_type = false;
811 do {
812 ret = parse_elf_property(note.data, &off, datasz, arch,
813 have_prev_type, &prev_type);
814 have_prev_type = true;
815 } while (!ret);
816
817 return ret == -ENOENT ? 0 : ret;
818}
819
Al Viro71613c32012-10-20 22:00:48 -0400820static int load_elf_binary(struct linux_binprm *bprm)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700821{
822 struct file *interpreter = NULL; /* to shut gcc up */
823 unsigned long load_addr = 0, load_bias = 0;
824 int load_addr_set = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700825 unsigned long error;
Paul Burtona9d9ef12014-09-11 08:30:15 +0100826 struct elf_phdr *elf_ppnt, *elf_phdata, *interp_elf_phdata = NULL;
Dave Martin00e19ce2020-03-16 16:50:44 +0000827 struct elf_phdr *elf_property_phdata = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700828 unsigned long elf_bss, elf_brk;
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800829 int bss_prot = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700830 int retval, i;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100831 unsigned long elf_entry;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800832 unsigned long e_entry;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100833 unsigned long interp_load_addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700834 unsigned long start_code, end_code, start_data, end_data;
David Daney1a530a62011-03-22 16:34:48 -0700835 unsigned long reloc_func_desc __maybe_unused = 0;
David Rientjes8de61e62006-12-06 20:40:16 -0800836 int executable_stack = EXSTACK_DEFAULT;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800837 struct elfhdr *elf_ex = (struct elfhdr *)bprm->buf;
Alexey Dobriyan0693ffe2020-04-06 20:11:29 -0700838 struct elfhdr *interp_elf_ex = NULL;
Paul Burton774c1052014-09-11 08:30:16 +0100839 struct arch_elf_state arch_state = INIT_ARCH_ELF_STATE;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800840 struct mm_struct *mm;
Alexey Dobriyan249b08e2019-05-14 15:43:54 -0700841 struct pt_regs *regs;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700842
Linus Torvalds1da177e2005-04-16 15:20:36 -0700843 retval = -ENOEXEC;
844 /* First of all, some simple consistency checks */
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800845 if (memcmp(elf_ex->e_ident, ELFMAG, SELFMAG) != 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700846 goto out;
847
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800848 if (elf_ex->e_type != ET_EXEC && elf_ex->e_type != ET_DYN)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700849 goto out;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800850 if (!elf_check_arch(elf_ex))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700851 goto out;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800852 if (elf_check_fdpic(elf_ex))
Nicolas Pitre47552002017-08-16 16:05:13 -0400853 goto out;
Al Viro72c2d532013-09-22 16:27:52 -0400854 if (!bprm->file->f_op->mmap)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700855 goto out;
856
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800857 elf_phdata = load_elf_phdrs(elf_ex, bprm->file);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700858 if (!elf_phdata)
859 goto out;
860
Linus Torvalds1da177e2005-04-16 15:20:36 -0700861 elf_ppnt = elf_phdata;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800862 for (i = 0; i < elf_ex->e_phnum; i++, elf_ppnt++) {
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700863 char *elf_interpreter;
Alexey Dobriyan5cf4a362019-05-14 15:43:36 -0700864
Dave Martin00e19ce2020-03-16 16:50:44 +0000865 if (elf_ppnt->p_type == PT_GNU_PROPERTY) {
866 elf_property_phdata = elf_ppnt;
867 continue;
868 }
869
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700870 if (elf_ppnt->p_type != PT_INTERP)
871 continue;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700872
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700873 /*
874 * This is the program interpreter used for shared libraries -
875 * for now assume that this is an a.out format binary.
876 */
877 retval = -ENOEXEC;
878 if (elf_ppnt->p_filesz > PATH_MAX || elf_ppnt->p_filesz < 2)
879 goto out_free_ph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700880
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700881 retval = -ENOMEM;
882 elf_interpreter = kmalloc(elf_ppnt->p_filesz, GFP_KERNEL);
883 if (!elf_interpreter)
884 goto out_free_ph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700885
Alexey Dobriyan658c0332019-12-04 16:52:25 -0800886 retval = elf_read(bprm->file, elf_interpreter, elf_ppnt->p_filesz,
887 elf_ppnt->p_offset);
888 if (retval < 0)
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700889 goto out_free_interp;
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700890 /* make sure path is NULL terminated */
891 retval = -ENOEXEC;
892 if (elf_interpreter[elf_ppnt->p_filesz - 1] != '\0')
893 goto out_free_interp;
Alexey Dobriyan1fb84492007-01-26 00:57:16 -0800894
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700895 interpreter = open_exec(elf_interpreter);
896 kfree(elf_interpreter);
897 retval = PTR_ERR(interpreter);
898 if (IS_ERR(interpreter))
899 goto out_free_ph;
Alexey Dobriyan1fb84492007-01-26 00:57:16 -0800900
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700901 /*
902 * If the binary is not readable then enforce mm->dumpable = 0
903 * regardless of the interpreter's permissions.
904 */
905 would_dump(bprm, interpreter);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700906
Alexey Dobriyan0693ffe2020-04-06 20:11:29 -0700907 interp_elf_ex = kmalloc(sizeof(*interp_elf_ex), GFP_KERNEL);
908 if (!interp_elf_ex) {
909 retval = -ENOMEM;
910 goto out_free_ph;
911 }
912
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700913 /* Get the exec headers */
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700914 retval = elf_read(interpreter, interp_elf_ex,
915 sizeof(*interp_elf_ex), 0);
Alexey Dobriyan658c0332019-12-04 16:52:25 -0800916 if (retval < 0)
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700917 goto out_free_dentry;
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700918
919 break;
Alexey Dobriyancc338012019-05-14 15:43:39 -0700920
921out_free_interp:
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700922 kfree(elf_interpreter);
923 goto out_free_ph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700924 }
925
926 elf_ppnt = elf_phdata;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800927 for (i = 0; i < elf_ex->e_phnum; i++, elf_ppnt++)
Paul Burton774c1052014-09-11 08:30:16 +0100928 switch (elf_ppnt->p_type) {
929 case PT_GNU_STACK:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700930 if (elf_ppnt->p_flags & PF_X)
931 executable_stack = EXSTACK_ENABLE_X;
932 else
933 executable_stack = EXSTACK_DISABLE_X;
934 break;
Paul Burton774c1052014-09-11 08:30:16 +0100935
936 case PT_LOPROC ... PT_HIPROC:
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800937 retval = arch_elf_pt_proc(elf_ex, elf_ppnt,
Paul Burton774c1052014-09-11 08:30:16 +0100938 bprm->file, false,
939 &arch_state);
940 if (retval)
941 goto out_free_dentry;
942 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700943 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700944
945 /* Some simple consistency checks for the interpreter */
Alexey Dobriyancc338012019-05-14 15:43:39 -0700946 if (interpreter) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700947 retval = -ELIBBAD;
Andi Kleend20894a2008-02-08 04:21:54 -0800948 /* Not an ELF interpreter */
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700949 if (memcmp(interp_elf_ex->e_ident, ELFMAG, SELFMAG) != 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700950 goto out_free_dentry;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700951 /* Verify the interpreter has a valid arch */
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700952 if (!elf_check_arch(interp_elf_ex) ||
953 elf_check_fdpic(interp_elf_ex))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700954 goto out_free_dentry;
Paul Burtona9d9ef12014-09-11 08:30:15 +0100955
956 /* Load the interpreter program headers */
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700957 interp_elf_phdata = load_elf_phdrs(interp_elf_ex,
Paul Burtona9d9ef12014-09-11 08:30:15 +0100958 interpreter);
959 if (!interp_elf_phdata)
960 goto out_free_dentry;
Paul Burton774c1052014-09-11 08:30:16 +0100961
962 /* Pass PT_LOPROC..PT_HIPROC headers to arch code */
Dave Martin00e19ce2020-03-16 16:50:44 +0000963 elf_property_phdata = NULL;
Paul Burton774c1052014-09-11 08:30:16 +0100964 elf_ppnt = interp_elf_phdata;
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700965 for (i = 0; i < interp_elf_ex->e_phnum; i++, elf_ppnt++)
Paul Burton774c1052014-09-11 08:30:16 +0100966 switch (elf_ppnt->p_type) {
Dave Martin00e19ce2020-03-16 16:50:44 +0000967 case PT_GNU_PROPERTY:
968 elf_property_phdata = elf_ppnt;
969 break;
970
Paul Burton774c1052014-09-11 08:30:16 +0100971 case PT_LOPROC ... PT_HIPROC:
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700972 retval = arch_elf_pt_proc(interp_elf_ex,
Paul Burton774c1052014-09-11 08:30:16 +0100973 elf_ppnt, interpreter,
974 true, &arch_state);
975 if (retval)
976 goto out_free_dentry;
977 break;
978 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700979 }
980
Dave Martin00e19ce2020-03-16 16:50:44 +0000981 retval = parse_elf_properties(interpreter ?: bprm->file,
982 elf_property_phdata, &arch_state);
983 if (retval)
984 goto out_free_dentry;
985
Paul Burton774c1052014-09-11 08:30:16 +0100986 /*
987 * Allow arch code to reject the ELF at this point, whilst it's
988 * still possible to return an error to the code that invoked
989 * the exec syscall.
990 */
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800991 retval = arch_check_elf(elf_ex,
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700992 !!interpreter, interp_elf_ex,
Maciej W. Rozyckieb4bc072015-11-13 00:47:48 +0000993 &arch_state);
Paul Burton774c1052014-09-11 08:30:16 +0100994 if (retval)
995 goto out_free_dentry;
996
Linus Torvalds1da177e2005-04-16 15:20:36 -0700997 /* Flush all traces of the currently running executable */
Eric W. Biederman23887772020-05-03 07:54:10 -0500998 retval = begin_new_exec(bprm);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700999 if (retval)
1000 goto out_free_dentry;
1001
Linus Torvalds1da177e2005-04-16 15:20:36 -07001002 /* Do this immediately, since STACK_TOP as used in setup_arg_pages
1003 may depend on the personality. */
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001004 SET_PERSONALITY2(*elf_ex, &arch_state);
1005 if (elf_read_implies_exec(*elf_ex, executable_stack))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001006 current->personality |= READ_IMPLIES_EXEC;
1007
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001008 if (!(current->personality & ADDR_NO_RANDOMIZE) && randomize_va_space)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001009 current->flags |= PF_RANDOMIZE;
Linus Torvalds221af7f2010-01-28 22:14:42 -08001010
1011 setup_new_exec(bprm);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001012
1013 /* Do this so that we can load the interpreter, if need be. We will
1014 change some of these later */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001015 retval = setup_arg_pages(bprm, randomize_stack_top(STACK_TOP),
1016 executable_stack);
Al Viro19d860a2014-05-04 20:11:36 -04001017 if (retval < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001018 goto out_free_dentry;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001019
Alexey Dobriyan852643162019-05-14 15:43:48 -07001020 elf_bss = 0;
1021 elf_brk = 0;
1022
1023 start_code = ~0UL;
1024 end_code = 0;
1025 start_data = 0;
1026 end_data = 0;
1027
André Goddard Rosaaf901ca2009-11-14 13:09:05 -02001028 /* Now we do a little grungy work by mmapping the ELF image into
Jiri Kosinacc503c12008-01-30 13:31:07 +01001029 the correct location in memory. */
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001030 for(i = 0, elf_ppnt = elf_phdata;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001031 i < elf_ex->e_phnum; i++, elf_ppnt++) {
Linus Torvaldsb2129212019-10-06 13:53:27 -07001032 int elf_prot, elf_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001033 unsigned long k, vaddr;
Michael Davidsona87938b2015-04-14 15:47:38 -07001034 unsigned long total_size = 0;
Chris Kennellyce81bb22020-10-15 20:12:32 -07001035 unsigned long alignment;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001036
1037 if (elf_ppnt->p_type != PT_LOAD)
1038 continue;
1039
1040 if (unlikely (elf_brk > elf_bss)) {
1041 unsigned long nbyte;
1042
1043 /* There was a PT_LOAD segment with p_memsz > p_filesz
1044 before this one. Map anonymous pages, if needed,
1045 and clear the area. */
Mikael Petterssonf670d0e2011-01-12 17:00:02 -08001046 retval = set_brk(elf_bss + load_bias,
Denys Vlasenko16e72e92017-02-22 15:45:16 -08001047 elf_brk + load_bias,
1048 bss_prot);
Al Viro19d860a2014-05-04 20:11:36 -04001049 if (retval)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001050 goto out_free_dentry;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001051 nbyte = ELF_PAGEOFFSET(elf_bss);
1052 if (nbyte) {
1053 nbyte = ELF_MIN_ALIGN - nbyte;
1054 if (nbyte > elf_brk - elf_bss)
1055 nbyte = elf_brk - elf_bss;
1056 if (clear_user((void __user *)elf_bss +
1057 load_bias, nbyte)) {
1058 /*
1059 * This bss-zeroing can fail if the ELF
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001060 * file specifies odd protections. So
Linus Torvalds1da177e2005-04-16 15:20:36 -07001061 * we don't check the return value
1062 */
1063 }
1064 }
1065 }
1066
Dave Martinfe0f6762020-03-16 16:50:46 +00001067 elf_prot = make_prot(elf_ppnt->p_flags, &arch_state,
1068 !!interpreter, false);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001069
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001070 elf_flags = MAP_PRIVATE | MAP_DENYWRITE | MAP_EXECUTABLE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001071
1072 vaddr = elf_ppnt->p_vaddr;
Kees Cookeab09532017-07-10 15:52:37 -07001073 /*
1074 * If we are loading ET_EXEC or we have already performed
1075 * the ET_DYN load_addr calculations, proceed normally.
1076 */
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001077 if (elf_ex->e_type == ET_EXEC || load_addr_set) {
Linus Torvaldsb2129212019-10-06 13:53:27 -07001078 elf_flags |= MAP_FIXED;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001079 } else if (elf_ex->e_type == ET_DYN) {
Kees Cookeab09532017-07-10 15:52:37 -07001080 /*
1081 * This logic is run once for the first LOAD Program
1082 * Header for ET_DYN binaries to calculate the
1083 * randomization (load_bias) for all the LOAD
1084 * Program Headers, and to calculate the entire
1085 * size of the ELF mapping (total_size). (Note that
1086 * load_addr_set is set to true later once the
1087 * initial mapping is performed.)
1088 *
1089 * There are effectively two types of ET_DYN
1090 * binaries: programs (i.e. PIE: ET_DYN with INTERP)
1091 * and loaders (ET_DYN without INTERP, since they
1092 * _are_ the ELF interpreter). The loaders must
1093 * be loaded away from programs since the program
1094 * may otherwise collide with the loader (especially
1095 * for ET_EXEC which does not have a randomized
1096 * position). For example to handle invocations of
1097 * "./ld.so someprog" to test out a new version of
1098 * the loader, the subsequent program that the
1099 * loader loads must avoid the loader itself, so
1100 * they cannot share the same load range. Sufficient
1101 * room for the brk must be allocated with the
1102 * loader as well, since brk must be available with
1103 * the loader.
1104 *
1105 * Therefore, programs are loaded offset from
1106 * ELF_ET_DYN_BASE and loaders are loaded into the
1107 * independently randomized mmap region (0 load_bias
1108 * without MAP_FIXED).
1109 */
Alexey Dobriyancc338012019-05-14 15:43:39 -07001110 if (interpreter) {
Kees Cookeab09532017-07-10 15:52:37 -07001111 load_bias = ELF_ET_DYN_BASE;
1112 if (current->flags & PF_RANDOMIZE)
1113 load_bias += arch_mmap_rnd();
Chris Kennellyce81bb22020-10-15 20:12:32 -07001114 alignment = maximum_alignment(elf_phdata, elf_ex->e_phnum);
1115 if (alignment)
1116 load_bias &= ~(alignment - 1);
Linus Torvaldsb2129212019-10-06 13:53:27 -07001117 elf_flags |= MAP_FIXED;
Kees Cookeab09532017-07-10 15:52:37 -07001118 } else
1119 load_bias = 0;
1120
1121 /*
1122 * Since load_bias is used for all subsequent loading
1123 * calculations, we must lower it by the first vaddr
1124 * so that the remaining calculations based on the
1125 * ELF vaddrs will be correctly offset. The result
1126 * is then page aligned.
1127 */
1128 load_bias = ELF_PAGESTART(load_bias - vaddr);
1129
Michael Davidsona87938b2015-04-14 15:47:38 -07001130 total_size = total_mapping_size(elf_phdata,
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001131 elf_ex->e_phnum);
Michael Davidsona87938b2015-04-14 15:47:38 -07001132 if (!total_size) {
Andrew Morton2b1d3ae2015-05-28 15:44:24 -07001133 retval = -EINVAL;
Michael Davidsona87938b2015-04-14 15:47:38 -07001134 goto out_free_dentry;
1135 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001136 }
1137
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001138 error = elf_map(bprm->file, load_bias + vaddr, elf_ppnt,
Michael Davidsona87938b2015-04-14 15:47:38 -07001139 elf_prot, elf_flags, total_size);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001140 if (BAD_ADDR(error)) {
Alexey Kuznetsovb140f2512007-05-08 00:31:57 -07001141 retval = IS_ERR((void *)error) ?
1142 PTR_ERR((void*)error) : -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001143 goto out_free_dentry;
1144 }
1145
1146 if (!load_addr_set) {
1147 load_addr_set = 1;
1148 load_addr = (elf_ppnt->p_vaddr - elf_ppnt->p_offset);
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001149 if (elf_ex->e_type == ET_DYN) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001150 load_bias += error -
1151 ELF_PAGESTART(load_bias + vaddr);
1152 load_addr += load_bias;
1153 reloc_func_desc = load_bias;
1154 }
1155 }
1156 k = elf_ppnt->p_vaddr;
Alexey Dobriyanf67ef442020-01-30 22:16:52 -08001157 if ((elf_ppnt->p_flags & PF_X) && k < start_code)
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001158 start_code = k;
1159 if (start_data < k)
1160 start_data = k;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001161
1162 /*
1163 * Check to see if the section's size will overflow the
1164 * allowed task size. Note that p_filesz must always be
1165 * <= p_memsz so it is only necessary to check p_memsz.
1166 */
Chuck Ebbertce510592006-07-03 00:24:14 -07001167 if (BAD_ADDR(k) || elf_ppnt->p_filesz > elf_ppnt->p_memsz ||
Linus Torvalds1da177e2005-04-16 15:20:36 -07001168 elf_ppnt->p_memsz > TASK_SIZE ||
1169 TASK_SIZE - elf_ppnt->p_memsz < k) {
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001170 /* set_brk can never work. Avoid overflows. */
Alexey Kuznetsovb140f2512007-05-08 00:31:57 -07001171 retval = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001172 goto out_free_dentry;
1173 }
1174
1175 k = elf_ppnt->p_vaddr + elf_ppnt->p_filesz;
1176
1177 if (k > elf_bss)
1178 elf_bss = k;
1179 if ((elf_ppnt->p_flags & PF_X) && end_code < k)
1180 end_code = k;
1181 if (end_data < k)
1182 end_data = k;
1183 k = elf_ppnt->p_vaddr + elf_ppnt->p_memsz;
Denys Vlasenko16e72e92017-02-22 15:45:16 -08001184 if (k > elf_brk) {
1185 bss_prot = elf_prot;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001186 elf_brk = k;
Denys Vlasenko16e72e92017-02-22 15:45:16 -08001187 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001188 }
1189
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001190 e_entry = elf_ex->e_entry + load_bias;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001191 elf_bss += load_bias;
1192 elf_brk += load_bias;
1193 start_code += load_bias;
1194 end_code += load_bias;
1195 start_data += load_bias;
1196 end_data += load_bias;
1197
1198 /* Calling set_brk effectively mmaps the pages that we need
1199 * for the bss and break sections. We must do this before
1200 * mapping in the interpreter, to make sure it doesn't wind
1201 * up getting placed where the bss needs to go.
1202 */
Denys Vlasenko16e72e92017-02-22 15:45:16 -08001203 retval = set_brk(elf_bss, elf_brk, bss_prot);
Al Viro19d860a2014-05-04 20:11:36 -04001204 if (retval)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001205 goto out_free_dentry;
akpm@osdl.org6de50512005-10-11 08:29:08 -07001206 if (likely(elf_bss != elf_brk) && unlikely(padzero(elf_bss))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001207 retval = -EFAULT; /* Nobody gets to see this, but.. */
1208 goto out_free_dentry;
1209 }
1210
Alexey Dobriyancc338012019-05-14 15:43:39 -07001211 if (interpreter) {
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -07001212 elf_entry = load_elf_interp(interp_elf_ex,
Andi Kleend20894a2008-02-08 04:21:54 -08001213 interpreter,
Dave Martinfe0f6762020-03-16 16:50:46 +00001214 load_bias, interp_elf_phdata,
1215 &arch_state);
Andi Kleend20894a2008-02-08 04:21:54 -08001216 if (!IS_ERR((void *)elf_entry)) {
1217 /*
1218 * load_elf_interp() returns relocation
1219 * adjustment
1220 */
1221 interp_load_addr = elf_entry;
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -07001222 elf_entry += interp_elf_ex->e_entry;
Jiri Kosinacc503c12008-01-30 13:31:07 +01001223 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001224 if (BAD_ADDR(elf_entry)) {
Chuck Ebbertce510592006-07-03 00:24:14 -07001225 retval = IS_ERR((void *)elf_entry) ?
1226 (int)elf_entry : -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001227 goto out_free_dentry;
1228 }
1229 reloc_func_desc = interp_load_addr;
1230
1231 allow_write_access(interpreter);
1232 fput(interpreter);
Alexey Dobriyan0693ffe2020-04-06 20:11:29 -07001233
1234 kfree(interp_elf_ex);
Alexey Dobriyanaa0d1562020-04-06 20:11:32 -07001235 kfree(interp_elf_phdata);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001236 } else {
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001237 elf_entry = e_entry;
Suresh Siddha5342fba2006-02-26 04:18:28 +01001238 if (BAD_ADDR(elf_entry)) {
Chuck Ebbertce510592006-07-03 00:24:14 -07001239 retval = -EINVAL;
Suresh Siddha5342fba2006-02-26 04:18:28 +01001240 goto out_free_dentry;
1241 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001242 }
1243
1244 kfree(elf_phdata);
1245
Linus Torvalds1da177e2005-04-16 15:20:36 -07001246 set_binfmt(&elf_format);
1247
Benjamin Herrenschmidt547ee842005-04-16 15:24:35 -07001248#ifdef ARCH_HAS_SETUP_ADDITIONAL_PAGES
Alexey Dobriyancc338012019-05-14 15:43:39 -07001249 retval = arch_setup_additional_pages(bprm, !!interpreter);
Al Viro19d860a2014-05-04 20:11:36 -04001250 if (retval < 0)
Roland McGrath18c8baff2005-04-28 15:17:19 -07001251 goto out;
Benjamin Herrenschmidt547ee842005-04-16 15:24:35 -07001252#endif /* ARCH_HAS_SETUP_ADDITIONAL_PAGES */
1253
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001254 retval = create_elf_tables(bprm, elf_ex,
1255 load_addr, interp_load_addr, e_entry);
Al Viro19d860a2014-05-04 20:11:36 -04001256 if (retval < 0)
Ollie Wildb6a2fea2007-07-19 01:48:16 -07001257 goto out;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001258
1259 mm = current->mm;
1260 mm->end_code = end_code;
1261 mm->start_code = start_code;
1262 mm->start_data = start_data;
1263 mm->end_data = end_data;
1264 mm->start_stack = bprm->p;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001265
Jiri Kosina4471a672011-04-14 15:22:09 -07001266 if ((current->flags & PF_RANDOMIZE) && (randomize_va_space > 1)) {
Kees Cookbbdc6072019-05-14 15:43:57 -07001267 /*
1268 * For architectures with ELF randomization, when executing
1269 * a loader directly (i.e. no interpreter listed in ELF
1270 * headers), move the brk area out of the mmap region
1271 * (since it grows up, and may collide early with the stack
1272 * growing down), and into the unused ELF_ET_DYN_BASE region.
1273 */
Kees Cook7be3cb02019-09-26 10:15:25 -07001274 if (IS_ENABLED(CONFIG_ARCH_HAS_ELF_RANDOMIZE) &&
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001275 elf_ex->e_type == ET_DYN && !interpreter) {
1276 mm->brk = mm->start_brk = ELF_ET_DYN_BASE;
1277 }
Kees Cookbbdc6072019-05-14 15:43:57 -07001278
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001279 mm->brk = mm->start_brk = arch_randomize_brk(mm);
Kees Cook204db6e2015-04-14 15:48:12 -07001280#ifdef compat_brk_randomized
Jiri Kosina4471a672011-04-14 15:22:09 -07001281 current->brk_randomized = 1;
1282#endif
1283 }
Jiri Kosinac1d171a2008-01-30 13:30:40 +01001284
Linus Torvalds1da177e2005-04-16 15:20:36 -07001285 if (current->personality & MMAP_PAGE_ZERO) {
1286 /* Why this, you ask??? Well SVr4 maps page 0 as read-only,
1287 and some applications "depend" upon this behavior.
1288 Since we do not have the power to recompile these, we
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001289 emulate the SVr4 behavior. Sigh. */
Linus Torvalds6be5ceb2012-04-20 17:13:58 -07001290 error = vm_mmap(NULL, 0, PAGE_SIZE, PROT_READ | PROT_EXEC,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001291 MAP_FIXED | MAP_PRIVATE, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001292 }
1293
Alexey Dobriyan249b08e2019-05-14 15:43:54 -07001294 regs = current_pt_regs();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001295#ifdef ELF_PLAT_INIT
1296 /*
1297 * The ABI may specify that certain registers be set up in special
1298 * ways (on i386 %edx is the address of a DT_FINI function, for
1299 * example. In addition, it may also specify (eg, PowerPC64 ELF)
1300 * that the e_entry field is the address of the function descriptor
1301 * for the startup routine, rather than the address of the startup
1302 * routine itself. This macro performs whatever initialization to
1303 * the regs structure is required as well as any relocations to the
1304 * function descriptor entries when executing dynamically links apps.
1305 */
1306 ELF_PLAT_INIT(regs, reloc_func_desc);
1307#endif
1308
Kees Cookb8383832018-04-10 16:34:57 -07001309 finalize_exec(bprm);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001310 start_thread(regs, elf_entry, bprm->p);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001311 retval = 0;
1312out:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001313 return retval;
1314
1315 /* error cleanup */
1316out_free_dentry:
Alexey Dobriyan0693ffe2020-04-06 20:11:29 -07001317 kfree(interp_elf_ex);
Paul Burtona9d9ef12014-09-11 08:30:15 +01001318 kfree(interp_elf_phdata);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001319 allow_write_access(interpreter);
1320 if (interpreter)
1321 fput(interpreter);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001322out_free_ph:
1323 kfree(elf_phdata);
1324 goto out;
1325}
1326
Josh Triplett69369a72014-04-03 14:48:27 -07001327#ifdef CONFIG_USELIB
Linus Torvalds1da177e2005-04-16 15:20:36 -07001328/* This is really simpleminded and specialized - we are loading an
1329 a.out library that is given an ELF header. */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001330static int load_elf_library(struct file *file)
1331{
1332 struct elf_phdr *elf_phdata;
1333 struct elf_phdr *eppnt;
1334 unsigned long elf_bss, bss, len;
1335 int retval, error, i, j;
1336 struct elfhdr elf_ex;
1337
1338 error = -ENOEXEC;
Alexey Dobriyan658c0332019-12-04 16:52:25 -08001339 retval = elf_read(file, &elf_ex, sizeof(elf_ex), 0);
1340 if (retval < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001341 goto out;
1342
1343 if (memcmp(elf_ex.e_ident, ELFMAG, SELFMAG) != 0)
1344 goto out;
1345
1346 /* First of all, some simple consistency checks */
1347 if (elf_ex.e_type != ET_EXEC || elf_ex.e_phnum > 2 ||
Al Viro72c2d532013-09-22 16:27:52 -04001348 !elf_check_arch(&elf_ex) || !file->f_op->mmap)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001349 goto out;
Nicolas Pitre47552002017-08-16 16:05:13 -04001350 if (elf_check_fdpic(&elf_ex))
1351 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001352
1353 /* Now read in all of the header information */
1354
1355 j = sizeof(struct elf_phdr) * elf_ex.e_phnum;
1356 /* j < ELF_MIN_ALIGN because elf_ex.e_phnum <= 2 */
1357
1358 error = -ENOMEM;
1359 elf_phdata = kmalloc(j, GFP_KERNEL);
1360 if (!elf_phdata)
1361 goto out;
1362
1363 eppnt = elf_phdata;
1364 error = -ENOEXEC;
Alexey Dobriyan658c0332019-12-04 16:52:25 -08001365 retval = elf_read(file, eppnt, j, elf_ex.e_phoff);
1366 if (retval < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001367 goto out_free_ph;
1368
1369 for (j = 0, i = 0; i<elf_ex.e_phnum; i++)
1370 if ((eppnt + i)->p_type == PT_LOAD)
1371 j++;
1372 if (j != 1)
1373 goto out_free_ph;
1374
1375 while (eppnt->p_type != PT_LOAD)
1376 eppnt++;
1377
1378 /* Now use mmap to map the library into memory. */
Linus Torvalds6be5ceb2012-04-20 17:13:58 -07001379 error = vm_mmap(file,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001380 ELF_PAGESTART(eppnt->p_vaddr),
1381 (eppnt->p_filesz +
1382 ELF_PAGEOFFSET(eppnt->p_vaddr)),
1383 PROT_READ | PROT_WRITE | PROT_EXEC,
Michal Hocko4ed28632018-04-10 16:36:01 -07001384 MAP_FIXED_NOREPLACE | MAP_PRIVATE | MAP_DENYWRITE,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001385 (eppnt->p_offset -
1386 ELF_PAGEOFFSET(eppnt->p_vaddr)));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001387 if (error != ELF_PAGESTART(eppnt->p_vaddr))
1388 goto out_free_ph;
1389
1390 elf_bss = eppnt->p_vaddr + eppnt->p_filesz;
1391 if (padzero(elf_bss)) {
1392 error = -EFAULT;
1393 goto out_free_ph;
1394 }
1395
Oscar Salvador24962af2018-07-13 16:59:13 -07001396 len = ELF_PAGEALIGN(eppnt->p_filesz + eppnt->p_vaddr);
1397 bss = ELF_PAGEALIGN(eppnt->p_memsz + eppnt->p_vaddr);
Michal Hockoecc2bc82016-05-23 16:25:39 -07001398 if (bss > len) {
1399 error = vm_brk(len, bss - len);
Linus Torvalds5d22fc22016-05-27 15:57:31 -07001400 if (error)
Michal Hockoecc2bc82016-05-23 16:25:39 -07001401 goto out_free_ph;
1402 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001403 error = 0;
1404
1405out_free_ph:
1406 kfree(elf_phdata);
1407out:
1408 return error;
1409}
Josh Triplett69369a72014-04-03 14:48:27 -07001410#endif /* #ifdef CONFIG_USELIB */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001411
Christoph Hellwig698ba7b2009-12-15 16:47:37 -08001412#ifdef CONFIG_ELF_CORE
Linus Torvalds1da177e2005-04-16 15:20:36 -07001413/*
1414 * ELF core dumper
1415 *
1416 * Modelled on fs/exec.c:aout_core_dump()
1417 * Jeremy Fitzhardinge <jeremy@sw.oz.au>
1418 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001419
/*
 * An ELF note in memory.
 *
 * Describes one note before it is serialized: writenote() emits a
 * struct elf_note header followed by the name (with its NUL) and then
 * datasz bytes taken from data.
 */
struct memelfnote
{
	const char *name;	/* NUL-terminated note name, e.g. "CORE" */
	int type;		/* note type, stored as n_type */
	unsigned int datasz;	/* payload size in bytes, stored as n_descsz */
	void *data;		/* payload */
};
1428
1429static int notesize(struct memelfnote *en)
1430{
1431 int sz;
1432
1433 sz = sizeof(struct elf_note);
1434 sz += roundup(strlen(en->name) + 1, 4);
1435 sz += roundup(en->datasz, 4);
1436
1437 return sz;
1438}
1439
Al Viroecc8c772013-10-05 15:32:35 -04001440static int writenote(struct memelfnote *men, struct coredump_params *cprm)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001441{
1442 struct elf_note en;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001443 en.n_namesz = strlen(men->name) + 1;
1444 en.n_descsz = men->datasz;
1445 en.n_type = men->type;
1446
Al Viroecc8c772013-10-05 15:32:35 -04001447 return dump_emit(cprm, &en, sizeof(en)) &&
Al Viro22a8cb82013-10-08 11:05:01 -04001448 dump_emit(cprm, men->name, en.n_namesz) && dump_align(cprm, 4) &&
1449 dump_emit(cprm, men->data, men->datasz) && dump_align(cprm, 4);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001450}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001451
Roland McGrath3aba4812008-01-30 13:31:44 +01001452static void fill_elf_header(struct elfhdr *elf, int segs,
Zhang Yanfeid3330cf2013-02-21 16:44:20 -08001453 u16 machine, u32 flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001454{
Cyrill Gorcunov6970c8e2008-04-29 01:01:18 -07001455 memset(elf, 0, sizeof(*elf));
1456
Linus Torvalds1da177e2005-04-16 15:20:36 -07001457 memcpy(elf->e_ident, ELFMAG, SELFMAG);
1458 elf->e_ident[EI_CLASS] = ELF_CLASS;
1459 elf->e_ident[EI_DATA] = ELF_DATA;
1460 elf->e_ident[EI_VERSION] = EV_CURRENT;
1461 elf->e_ident[EI_OSABI] = ELF_OSABI;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001462
1463 elf->e_type = ET_CORE;
Roland McGrath3aba4812008-01-30 13:31:44 +01001464 elf->e_machine = machine;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001465 elf->e_version = EV_CURRENT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001466 elf->e_phoff = sizeof(struct elfhdr);
Roland McGrath3aba4812008-01-30 13:31:44 +01001467 elf->e_flags = flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001468 elf->e_ehsize = sizeof(struct elfhdr);
1469 elf->e_phentsize = sizeof(struct elf_phdr);
1470 elf->e_phnum = segs;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001471}
1472
Andrew Morton8d6b5eee2006-09-25 23:32:04 -07001473static void fill_elf_note_phdr(struct elf_phdr *phdr, int sz, loff_t offset)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001474{
1475 phdr->p_type = PT_NOTE;
1476 phdr->p_offset = offset;
1477 phdr->p_vaddr = 0;
1478 phdr->p_paddr = 0;
1479 phdr->p_filesz = sz;
1480 phdr->p_memsz = 0;
1481 phdr->p_flags = 0;
1482 phdr->p_align = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001483}
1484
1485static void fill_note(struct memelfnote *note, const char *name, int type,
1486 unsigned int sz, void *data)
1487{
1488 note->name = name;
1489 note->type = type;
1490 note->datasz = sz;
1491 note->data = data;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001492}
1493
1494/*
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001495 * fill up all the fields in prstatus from the given task struct, except
1496 * registers which need to be filled up separately.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001497 */
1498static void fill_prstatus(struct elf_prstatus *prstatus,
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001499 struct task_struct *p, long signr)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001500{
1501 prstatus->pr_info.si_signo = prstatus->pr_cursig = signr;
1502 prstatus->pr_sigpend = p->pending.signal.sig[0];
1503 prstatus->pr_sighold = p->blocked.sig[0];
Oleg Nesterov3b34fc52009-06-17 16:27:38 -07001504 rcu_read_lock();
1505 prstatus->pr_ppid = task_pid_vnr(rcu_dereference(p->real_parent));
1506 rcu_read_unlock();
Pavel Emelyanovb4888932007-10-18 23:40:14 -07001507 prstatus->pr_pid = task_pid_vnr(p);
Pavel Emelyanovb4888932007-10-18 23:40:14 -07001508 prstatus->pr_pgrp = task_pgrp_vnr(p);
1509 prstatus->pr_sid = task_session_vnr(p);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001510 if (thread_group_leader(p)) {
Frederic Weisbeckercd19c362017-01-31 04:09:27 +01001511 struct task_cputime cputime;
Frank Mayharf06febc2008-09-12 09:54:39 -07001512
Linus Torvalds1da177e2005-04-16 15:20:36 -07001513 /*
Frank Mayharf06febc2008-09-12 09:54:39 -07001514 * This is the record for the group leader. It shows the
1515 * group-wide total, not its individual thread total.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001516 */
Frederic Weisbeckercd19c362017-01-31 04:09:27 +01001517 thread_group_cputime(p, &cputime);
Arnd Bergmanne2bb80d2017-11-23 13:46:33 +01001518 prstatus->pr_utime = ns_to_kernel_old_timeval(cputime.utime);
1519 prstatus->pr_stime = ns_to_kernel_old_timeval(cputime.stime);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001520 } else {
Frederic Weisbeckercd19c362017-01-31 04:09:27 +01001521 u64 utime, stime;
Frederic Weisbecker6fac4822012-11-13 14:20:55 +01001522
Frederic Weisbeckercd19c362017-01-31 04:09:27 +01001523 task_cputime(p, &utime, &stime);
Arnd Bergmanne2bb80d2017-11-23 13:46:33 +01001524 prstatus->pr_utime = ns_to_kernel_old_timeval(utime);
1525 prstatus->pr_stime = ns_to_kernel_old_timeval(stime);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001526 }
Frederic Weisbecker5613fda2017-01-31 04:09:23 +01001527
Arnd Bergmanne2bb80d2017-11-23 13:46:33 +01001528 prstatus->pr_cutime = ns_to_kernel_old_timeval(p->signal->cutime);
1529 prstatus->pr_cstime = ns_to_kernel_old_timeval(p->signal->cstime);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001530}
1531
1532static int fill_psinfo(struct elf_prpsinfo *psinfo, struct task_struct *p,
1533 struct mm_struct *mm)
1534{
David Howellsc69e8d92008-11-14 10:39:19 +11001535 const struct cred *cred;
Greg Kroah-Hartmana84a5052005-05-11 00:10:44 -07001536 unsigned int i, len;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001537
1538 /* first copy the parameters from user space */
1539 memset(psinfo, 0, sizeof(struct elf_prpsinfo));
1540
1541 len = mm->arg_end - mm->arg_start;
1542 if (len >= ELF_PRARGSZ)
1543 len = ELF_PRARGSZ-1;
1544 if (copy_from_user(&psinfo->pr_psargs,
1545 (const char __user *)mm->arg_start, len))
1546 return -EFAULT;
1547 for(i = 0; i < len; i++)
1548 if (psinfo->pr_psargs[i] == 0)
1549 psinfo->pr_psargs[i] = ' ';
1550 psinfo->pr_psargs[len] = 0;
1551
Oleg Nesterov3b34fc52009-06-17 16:27:38 -07001552 rcu_read_lock();
1553 psinfo->pr_ppid = task_pid_vnr(rcu_dereference(p->real_parent));
1554 rcu_read_unlock();
Pavel Emelyanovb4888932007-10-18 23:40:14 -07001555 psinfo->pr_pid = task_pid_vnr(p);
Pavel Emelyanovb4888932007-10-18 23:40:14 -07001556 psinfo->pr_pgrp = task_pgrp_vnr(p);
1557 psinfo->pr_sid = task_session_vnr(p);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001558
1559 i = p->state ? ffz(~p->state) + 1 : 0;
1560 psinfo->pr_state = i;
Carsten Otte55148542006-03-25 03:08:22 -08001561 psinfo->pr_sname = (i > 5) ? '.' : "RSDTZW"[i];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001562 psinfo->pr_zomb = psinfo->pr_sname == 'Z';
1563 psinfo->pr_nice = task_nice(p);
1564 psinfo->pr_flag = p->flags;
David Howellsc69e8d92008-11-14 10:39:19 +11001565 rcu_read_lock();
1566 cred = __task_cred(p);
Eric W. Biedermanebc887b2012-02-07 18:36:10 -08001567 SET_UID(psinfo->pr_uid, from_kuid_munged(cred->user_ns, cred->uid));
1568 SET_GID(psinfo->pr_gid, from_kgid_munged(cred->user_ns, cred->gid));
David Howellsc69e8d92008-11-14 10:39:19 +11001569 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001570 strncpy(psinfo->pr_fname, p->comm, sizeof(psinfo->pr_fname));
1571
1572 return 0;
1573}
1574
Roland McGrath3aba4812008-01-30 13:31:44 +01001575static void fill_auxv_note(struct memelfnote *note, struct mm_struct *mm)
1576{
1577 elf_addr_t *auxv = (elf_addr_t *) mm->saved_auxv;
1578 int i = 0;
1579 do
1580 i += 2;
1581 while (auxv[i - 2] != AT_NULL);
1582 fill_note(note, "CORE", NT_AUXV, i * sizeof(elf_addr_t), auxv);
1583}
1584
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001585static void fill_siginfo_note(struct memelfnote *note, user_siginfo_t *csigdata,
Eric W. Biedermanae7795b2018-09-25 11:27:20 +02001586 const kernel_siginfo_t *siginfo)
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001587{
Eric W. Biedermanfa4751f2020-05-05 12:12:54 +02001588 copy_siginfo_to_external(csigdata, siginfo);
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001589 fill_note(note, "CORE", NT_SIGINFO, sizeof(*csigdata), csigdata);
1590}
1591
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001592#define MAX_FILE_NOTE_SIZE (4*1024*1024)
1593/*
1594 * Format of NT_FILE note:
1595 *
1596 * long count -- how many files are mapped
1597 * long page_size -- units for file_ofs
1598 * array of [COUNT] elements of
1599 * long start
1600 * long end
1601 * long file_ofs
1602 * followed by COUNT filenames in ASCII: "FILE1" NUL "FILE2" NUL...
1603 */
Dan Aloni72023652013-09-30 13:45:02 -07001604static int fill_files_note(struct memelfnote *note)
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001605{
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001606 struct mm_struct *mm = current->mm;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001607 struct vm_area_struct *vma;
1608 unsigned count, size, names_ofs, remaining, n;
1609 user_long_t *data;
1610 user_long_t *start_end_ofs;
1611 char *name_base, *name_curpos;
1612
1613 /* *Estimated* file count and total data size needed */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001614 count = mm->map_count;
Alexey Dobriyan60c9d922018-02-06 15:39:13 -08001615 if (count > UINT_MAX / 64)
1616 return -EINVAL;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001617 size = count * 64;
1618
1619 names_ofs = (2 + 3 * count) * sizeof(data[0]);
1620 alloc:
1621 if (size >= MAX_FILE_NOTE_SIZE) /* paranoia check */
Dan Aloni72023652013-09-30 13:45:02 -07001622 return -EINVAL;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001623 size = round_up(size, PAGE_SIZE);
Alexey Dobriyan1fbede62020-01-30 22:17:10 -08001624 /*
1625 * "size" can be 0 here legitimately.
1626 * Let it ENOMEM and omit NT_FILE section which will be empty anyway.
1627 */
Alexey Dobriyan86a2bb52018-06-14 15:27:24 -07001628 data = kvmalloc(size, GFP_KERNEL);
1629 if (ZERO_OR_NULL_PTR(data))
Dan Aloni72023652013-09-30 13:45:02 -07001630 return -ENOMEM;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001631
1632 start_end_ofs = data + 2;
1633 name_base = name_curpos = ((char *)data) + names_ofs;
1634 remaining = size - names_ofs;
1635 count = 0;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001636 for (vma = mm->mmap; vma != NULL; vma = vma->vm_next) {
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001637 struct file *file;
1638 const char *filename;
1639
1640 file = vma->vm_file;
1641 if (!file)
1642 continue;
Miklos Szeredi9bf39ab2015-06-19 10:29:13 +02001643 filename = file_path(file, name_curpos, remaining);
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001644 if (IS_ERR(filename)) {
1645 if (PTR_ERR(filename) == -ENAMETOOLONG) {
Alexey Dobriyan86a2bb52018-06-14 15:27:24 -07001646 kvfree(data);
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001647 size = size * 5 / 4;
1648 goto alloc;
1649 }
1650 continue;
1651 }
1652
Miklos Szeredi9bf39ab2015-06-19 10:29:13 +02001653 /* file_path() fills at the end, move name down */
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001654 /* n = strlen(filename) + 1: */
1655 n = (name_curpos + remaining) - filename;
1656 remaining = filename - name_curpos;
1657 memmove(name_curpos, filename, n);
1658 name_curpos += n;
1659
1660 *start_end_ofs++ = vma->vm_start;
1661 *start_end_ofs++ = vma->vm_end;
1662 *start_end_ofs++ = vma->vm_pgoff;
1663 count++;
1664 }
1665
1666 /* Now we know exact count of files, can store it */
1667 data[0] = count;
1668 data[1] = PAGE_SIZE;
1669 /*
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001670 * Count usually is less than mm->map_count,
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001671 * we need to move filenames down.
1672 */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001673 n = mm->map_count - count;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001674 if (n != 0) {
1675 unsigned shift_bytes = n * 3 * sizeof(data[0]);
1676 memmove(name_base - shift_bytes, name_base,
1677 name_curpos - name_base);
1678 name_curpos -= shift_bytes;
1679 }
1680
1681 size = name_curpos - (char *)data;
1682 fill_note(note, "CORE", NT_FILE, size, data);
Dan Aloni72023652013-09-30 13:45:02 -07001683 return 0;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001684}
1685
Roland McGrath4206d3a2008-01-30 13:31:45 +01001686#ifdef CORE_DUMP_USE_REGSET
1687#include <linux/regset.h>
1688
1689struct elf_thread_core_info {
1690 struct elf_thread_core_info *next;
1691 struct task_struct *task;
1692 struct elf_prstatus prstatus;
Gustavo A. R. Silva5e01fdf2020-08-31 08:25:42 -05001693 struct memelfnote notes[];
Roland McGrath4206d3a2008-01-30 13:31:45 +01001694};
1695
1696struct elf_note_info {
1697 struct elf_thread_core_info *thread;
1698 struct memelfnote psinfo;
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001699 struct memelfnote signote;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001700 struct memelfnote auxv;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001701 struct memelfnote files;
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001702 user_siginfo_t csigdata;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001703 size_t size;
1704 int thread_notes;
1705};
1706
Roland McGrathd31472b2008-03-04 14:28:30 -08001707/*
1708 * When a regset has a writeback hook, we call it on each thread before
1709 * dumping user memory. On register window machines, this makes sure the
1710 * user memory backing the register data is up to date before we read it.
1711 */
1712static void do_thread_regset_writeback(struct task_struct *task,
1713 const struct user_regset *regset)
1714{
1715 if (regset->writeback)
1716 regset->writeback(task, regset, 1);
1717}
1718
/*
 * Fallback definitions, used only when nothing earlier has defined
 * these macros.
 */

/* Size of the NT_PRSTATUS payload; the fallback ignores R. */
#ifndef PRSTATUS_SIZE
#define PRSTATUS_SIZE(S, R) sizeof(S)
#endif

/* Store V in the pr_fpvalid field of prstatus S; the fallback ignores R. */
#ifndef SET_PR_FPVALID
#define SET_PR_FPVALID(S, V, R) ((S)->pr_fpvalid = (V))
#endif
1726
Roland McGrath4206d3a2008-01-30 13:31:45 +01001727static int fill_thread_core_info(struct elf_thread_core_info *t,
1728 const struct user_regset_view *view,
1729 long signr, size_t *total)
1730{
1731 unsigned int i;
Al Virob4e9c952020-06-01 19:42:40 -04001732 int regset0_size;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001733
1734 /*
1735 * NT_PRSTATUS is the one special case, because the regset data
1736 * goes into the pr_reg field inside the note contents, rather
1737 * than being the whole note contents. We fill the reset in here.
1738 * We assume that regset 0 is NT_PRSTATUS.
1739 */
1740 fill_prstatus(&t->prstatus, t->task, signr);
Al Virob4e9c952020-06-01 19:42:40 -04001741 regset0_size = regset_get(t->task, &view->regsets[0],
1742 sizeof(t->prstatus.pr_reg), &t->prstatus.pr_reg);
1743 if (regset0_size < 0)
1744 return 0;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001745
1746 fill_note(&t->notes[0], "CORE", NT_PRSTATUS,
Dave Martin27e64b42017-10-31 15:50:53 +00001747 PRSTATUS_SIZE(t->prstatus, regset0_size), &t->prstatus);
Roland McGrath4206d3a2008-01-30 13:31:45 +01001748 *total += notesize(&t->notes[0]);
1749
Roland McGrathd31472b2008-03-04 14:28:30 -08001750 do_thread_regset_writeback(t->task, &view->regsets[0]);
1751
Roland McGrath4206d3a2008-01-30 13:31:45 +01001752 /*
1753 * Each other regset might generate a note too. For each regset
1754 * that has no core_note_type or is inactive, we leave t->notes[i]
1755 * all zero and we'll know to skip writing it later.
1756 */
1757 for (i = 1; i < view->n; ++i) {
1758 const struct user_regset *regset = &view->regsets[i];
Al Virob4e9c952020-06-01 19:42:40 -04001759 int note_type = regset->core_note_type;
1760 bool is_fpreg = note_type == NT_PRFPREG;
1761 void *data;
1762 int ret;
1763
Roland McGrathd31472b2008-03-04 14:28:30 -08001764 do_thread_regset_writeback(t->task, regset);
Al Virob4e9c952020-06-01 19:42:40 -04001765 if (!note_type) // not for coredumps
1766 continue;
1767 if (regset->active && regset->active(t->task, regset) <= 0)
1768 continue;
1769
1770 ret = regset_get_alloc(t->task, regset, ~0U, &data);
1771 if (ret < 0)
1772 continue;
1773
1774 if (is_fpreg)
1775 SET_PR_FPVALID(&t->prstatus, 1, regset0_size);
1776
1777 fill_note(&t->notes[i], is_fpreg ? "CORE" : "LINUX",
1778 note_type, ret, data);
1779
1780 *total += notesize(&t->notes[i]);
Roland McGrath4206d3a2008-01-30 13:31:45 +01001781 }
1782
1783 return 1;
1784}
1785
1786static int fill_note_info(struct elfhdr *elf, int phdrs,
1787 struct elf_note_info *info,
Eric W. Biedermanae7795b2018-09-25 11:27:20 +02001788 const kernel_siginfo_t *siginfo, struct pt_regs *regs)
Roland McGrath4206d3a2008-01-30 13:31:45 +01001789{
1790 struct task_struct *dump_task = current;
1791 const struct user_regset_view *view = task_user_regset_view(dump_task);
1792 struct elf_thread_core_info *t;
1793 struct elf_prpsinfo *psinfo;
Oleg Nesterov83914442008-07-25 01:47:45 -07001794 struct core_thread *ct;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001795 unsigned int i;
1796
1797 info->size = 0;
1798 info->thread = NULL;
1799
1800 psinfo = kmalloc(sizeof(*psinfo), GFP_KERNEL);
Alan Cox6899e922012-12-17 16:02:09 -08001801 if (psinfo == NULL) {
1802 info->psinfo.data = NULL; /* So we don't free this wrongly */
Roland McGrath4206d3a2008-01-30 13:31:45 +01001803 return 0;
Alan Cox6899e922012-12-17 16:02:09 -08001804 }
Roland McGrath4206d3a2008-01-30 13:31:45 +01001805
Amerigo Wange2dbe122009-07-01 01:06:26 -04001806 fill_note(&info->psinfo, "CORE", NT_PRPSINFO, sizeof(*psinfo), psinfo);
1807
Roland McGrath4206d3a2008-01-30 13:31:45 +01001808 /*
1809 * Figure out how many notes we're going to need for each thread.
1810 */
1811 info->thread_notes = 0;
1812 for (i = 0; i < view->n; ++i)
1813 if (view->regsets[i].core_note_type != 0)
1814 ++info->thread_notes;
1815
1816 /*
1817 * Sanity check. We rely on regset 0 being in NT_PRSTATUS,
1818 * since it is our one special case.
1819 */
1820 if (unlikely(info->thread_notes == 0) ||
1821 unlikely(view->regsets[0].core_note_type != NT_PRSTATUS)) {
1822 WARN_ON(1);
1823 return 0;
1824 }
1825
1826 /*
1827 * Initialize the ELF file header.
1828 */
1829 fill_elf_header(elf, phdrs,
Zhang Yanfeid3330cf2013-02-21 16:44:20 -08001830 view->e_machine, view->e_flags);
Roland McGrath4206d3a2008-01-30 13:31:45 +01001831
1832 /*
1833 * Allocate a structure for each thread.
1834 */
Oleg Nesterov83914442008-07-25 01:47:45 -07001835 for (ct = &dump_task->mm->core_state->dumper; ct; ct = ct->next) {
1836 t = kzalloc(offsetof(struct elf_thread_core_info,
1837 notes[info->thread_notes]),
1838 GFP_KERNEL);
1839 if (unlikely(!t))
1840 return 0;
Oleg Nesterov24d52882008-07-25 01:47:40 -07001841
Oleg Nesterov83914442008-07-25 01:47:45 -07001842 t->task = ct->task;
1843 if (ct->task == dump_task || !info->thread) {
1844 t->next = info->thread;
1845 info->thread = t;
1846 } else {
1847 /*
1848 * Make sure to keep the original task at
1849 * the head of the list.
1850 */
1851 t->next = info->thread->next;
1852 info->thread->next = t;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001853 }
Oleg Nesterov83914442008-07-25 01:47:45 -07001854 }
Roland McGrath4206d3a2008-01-30 13:31:45 +01001855
1856 /*
1857 * Now fill in each thread's information.
1858 */
1859 for (t = info->thread; t != NULL; t = t->next)
Denys Vlasenko5ab1c302012-10-04 17:15:29 -07001860 if (!fill_thread_core_info(t, view, siginfo->si_signo, &info->size))
Roland McGrath4206d3a2008-01-30 13:31:45 +01001861 return 0;
1862
1863 /*
1864 * Fill in the two process-wide notes.
1865 */
1866 fill_psinfo(psinfo, dump_task->group_leader, dump_task->mm);
1867 info->size += notesize(&info->psinfo);
1868
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001869 fill_siginfo_note(&info->signote, &info->csigdata, siginfo);
1870 info->size += notesize(&info->signote);
1871
Roland McGrath4206d3a2008-01-30 13:31:45 +01001872 fill_auxv_note(&info->auxv, current->mm);
1873 info->size += notesize(&info->auxv);
1874
Dan Aloni72023652013-09-30 13:45:02 -07001875 if (fill_files_note(&info->files) == 0)
1876 info->size += notesize(&info->files);
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001877
Roland McGrath4206d3a2008-01-30 13:31:45 +01001878 return 1;
1879}
1880
1881static size_t get_note_info_size(struct elf_note_info *info)
1882{
1883 return info->size;
1884}
1885
1886/*
1887 * Write all the notes for each thread. When writing the first thread, the
1888 * process-wide notes are interleaved after the first thread-specific note.
1889 */
1890static int write_note_info(struct elf_note_info *info,
Al Viroecc8c772013-10-05 15:32:35 -04001891 struct coredump_params *cprm)
Roland McGrath4206d3a2008-01-30 13:31:45 +01001892{
Fabian Frederickb219e252014-06-04 16:12:14 -07001893 bool first = true;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001894 struct elf_thread_core_info *t = info->thread;
1895
1896 do {
1897 int i;
1898
Al Viroecc8c772013-10-05 15:32:35 -04001899 if (!writenote(&t->notes[0], cprm))
Roland McGrath4206d3a2008-01-30 13:31:45 +01001900 return 0;
1901
Al Viroecc8c772013-10-05 15:32:35 -04001902 if (first && !writenote(&info->psinfo, cprm))
Roland McGrath4206d3a2008-01-30 13:31:45 +01001903 return 0;
Al Viroecc8c772013-10-05 15:32:35 -04001904 if (first && !writenote(&info->signote, cprm))
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001905 return 0;
Al Viroecc8c772013-10-05 15:32:35 -04001906 if (first && !writenote(&info->auxv, cprm))
Roland McGrath4206d3a2008-01-30 13:31:45 +01001907 return 0;
Dan Aloni72023652013-09-30 13:45:02 -07001908 if (first && info->files.data &&
Al Viroecc8c772013-10-05 15:32:35 -04001909 !writenote(&info->files, cprm))
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001910 return 0;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001911
1912 for (i = 1; i < info->thread_notes; ++i)
1913 if (t->notes[i].data &&
Al Viroecc8c772013-10-05 15:32:35 -04001914 !writenote(&t->notes[i], cprm))
Roland McGrath4206d3a2008-01-30 13:31:45 +01001915 return 0;
1916
Fabian Frederickb219e252014-06-04 16:12:14 -07001917 first = false;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001918 t = t->next;
1919 } while (t);
1920
1921 return 1;
1922}
1923
1924static void free_note_info(struct elf_note_info *info)
1925{
1926 struct elf_thread_core_info *threads = info->thread;
1927 while (threads) {
1928 unsigned int i;
1929 struct elf_thread_core_info *t = threads;
1930 threads = t->next;
1931 WARN_ON(t->notes[0].data && t->notes[0].data != &t->prstatus);
1932 for (i = 1; i < info->thread_notes; ++i)
1933 kfree(t->notes[i].data);
1934 kfree(t);
1935 }
1936 kfree(info->psinfo.data);
Alexey Dobriyan86a2bb52018-06-14 15:27:24 -07001937 kvfree(info->files.data);
Roland McGrath4206d3a2008-01-30 13:31:45 +01001938}
1939
1940#else
1941
Linus Torvalds1da177e2005-04-16 15:20:36 -07001942/* Here is the structure in which status of each thread is captured. */
1943struct elf_thread_status
1944{
1945 struct list_head list;
1946 struct elf_prstatus prstatus; /* NT_PRSTATUS */
1947 elf_fpregset_t fpu; /* NT_PRFPREG */
1948 struct task_struct *thread;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001949 struct memelfnote notes[3];
1950 int num_notes;
1951};
1952
1953/*
1954 * In order to add the specific thread information for the elf file format,
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001955 * we need to keep a linked list of every threads pr_status and then create
1956 * a single section for them in the final core file.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001957 */
1958static int elf_dump_thread_status(long signr, struct elf_thread_status *t)
1959{
1960 int sz = 0;
1961 struct task_struct *p = t->thread;
1962 t->num_notes = 0;
1963
1964 fill_prstatus(&t->prstatus, p, signr);
1965 elf_core_copy_task_regs(p, &t->prstatus.pr_reg);
1966
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001967 fill_note(&t->notes[0], "CORE", NT_PRSTATUS, sizeof(t->prstatus),
1968 &(t->prstatus));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001969 t->num_notes++;
1970 sz += notesize(&t->notes[0]);
1971
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001972 if ((t->prstatus.pr_fpvalid = elf_core_copy_task_fpregs(p, NULL,
1973 &t->fpu))) {
1974 fill_note(&t->notes[1], "CORE", NT_PRFPREG, sizeof(t->fpu),
1975 &(t->fpu));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001976 t->num_notes++;
1977 sz += notesize(&t->notes[1]);
1978 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001979 return sz;
1980}
1981
Roland McGrath3aba4812008-01-30 13:31:44 +01001982struct elf_note_info {
1983 struct memelfnote *notes;
Dan Aloni72023652013-09-30 13:45:02 -07001984 struct memelfnote *notes_files;
Roland McGrath3aba4812008-01-30 13:31:44 +01001985 struct elf_prstatus *prstatus; /* NT_PRSTATUS */
1986 struct elf_prpsinfo *psinfo; /* NT_PRPSINFO */
1987 struct list_head thread_list;
1988 elf_fpregset_t *fpu;
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001989 user_siginfo_t csigdata;
Roland McGrath3aba4812008-01-30 13:31:44 +01001990 int thread_status_size;
1991 int numnote;
1992};
1993
Amerigo Wang0cf062d2009-09-23 15:57:05 -07001994static int elf_note_info_init(struct elf_note_info *info)
Roland McGrath3aba4812008-01-30 13:31:44 +01001995{
Amerigo Wang0cf062d2009-09-23 15:57:05 -07001996 memset(info, 0, sizeof(*info));
Roland McGrath3aba4812008-01-30 13:31:44 +01001997 INIT_LIST_HEAD(&info->thread_list);
1998
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001999 /* Allocate space for ELF notes */
Kees Cook6da2ec52018-06-12 13:55:00 -07002000 info->notes = kmalloc_array(8, sizeof(struct memelfnote), GFP_KERNEL);
Roland McGrath3aba4812008-01-30 13:31:44 +01002001 if (!info->notes)
2002 return 0;
2003 info->psinfo = kmalloc(sizeof(*info->psinfo), GFP_KERNEL);
2004 if (!info->psinfo)
Denys Vlasenkof34f9d12012-09-26 11:34:50 +10002005 return 0;
Roland McGrath3aba4812008-01-30 13:31:44 +01002006 info->prstatus = kmalloc(sizeof(*info->prstatus), GFP_KERNEL);
2007 if (!info->prstatus)
Denys Vlasenkof34f9d12012-09-26 11:34:50 +10002008 return 0;
Roland McGrath3aba4812008-01-30 13:31:44 +01002009 info->fpu = kmalloc(sizeof(*info->fpu), GFP_KERNEL);
2010 if (!info->fpu)
Denys Vlasenkof34f9d12012-09-26 11:34:50 +10002011 return 0;
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002012 return 1;
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002013}
Roland McGrath3aba4812008-01-30 13:31:44 +01002014
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002015static int fill_note_info(struct elfhdr *elf, int phdrs,
2016 struct elf_note_info *info,
Eric W. Biedermanae7795b2018-09-25 11:27:20 +02002017 const kernel_siginfo_t *siginfo, struct pt_regs *regs)
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002018{
Al Viroafabada2013-10-14 07:39:56 -04002019 struct core_thread *ct;
2020 struct elf_thread_status *ets;
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002021
2022 if (!elf_note_info_init(info))
2023 return 0;
2024
Al Viroafabada2013-10-14 07:39:56 -04002025 for (ct = current->mm->core_state->dumper.next;
2026 ct; ct = ct->next) {
2027 ets = kzalloc(sizeof(*ets), GFP_KERNEL);
2028 if (!ets)
2029 return 0;
Oleg Nesterov24d52882008-07-25 01:47:40 -07002030
Al Viroafabada2013-10-14 07:39:56 -04002031 ets->thread = ct->task;
2032 list_add(&ets->list, &info->thread_list);
2033 }
Oleg Nesterov83914442008-07-25 01:47:45 -07002034
Alexey Dobriyan93f044e2019-03-07 16:28:59 -08002035 list_for_each_entry(ets, &info->thread_list, list) {
Al Viroafabada2013-10-14 07:39:56 -04002036 int sz;
Oleg Nesterov83914442008-07-25 01:47:45 -07002037
Al Viroafabada2013-10-14 07:39:56 -04002038 sz = elf_dump_thread_status(siginfo->si_signo, ets);
2039 info->thread_status_size += sz;
Roland McGrath3aba4812008-01-30 13:31:44 +01002040 }
2041 /* now collect the dump for the current */
2042 memset(info->prstatus, 0, sizeof(*info->prstatus));
Denys Vlasenko5ab1c302012-10-04 17:15:29 -07002043 fill_prstatus(info->prstatus, current, siginfo->si_signo);
Roland McGrath3aba4812008-01-30 13:31:44 +01002044 elf_core_copy_regs(&info->prstatus->pr_reg, regs);
2045
2046 /* Set up header */
Zhang Yanfeid3330cf2013-02-21 16:44:20 -08002047 fill_elf_header(elf, phdrs, ELF_ARCH, ELF_CORE_EFLAGS);
Roland McGrath3aba4812008-01-30 13:31:44 +01002048
2049 /*
2050 * Set up the notes in similar form to SVR4 core dumps made
2051 * with info from their /proc.
2052 */
2053
2054 fill_note(info->notes + 0, "CORE", NT_PRSTATUS,
2055 sizeof(*info->prstatus), info->prstatus);
2056 fill_psinfo(info->psinfo, current->group_leader, current->mm);
2057 fill_note(info->notes + 1, "CORE", NT_PRPSINFO,
2058 sizeof(*info->psinfo), info->psinfo);
2059
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07002060 fill_siginfo_note(info->notes + 2, &info->csigdata, siginfo);
2061 fill_auxv_note(info->notes + 3, current->mm);
Dan Aloni72023652013-09-30 13:45:02 -07002062 info->numnote = 4;
Roland McGrath3aba4812008-01-30 13:31:44 +01002063
Dan Aloni72023652013-09-30 13:45:02 -07002064 if (fill_files_note(info->notes + info->numnote) == 0) {
2065 info->notes_files = info->notes + info->numnote;
2066 info->numnote++;
2067 }
Roland McGrath3aba4812008-01-30 13:31:44 +01002068
2069 /* Try to dump the FPU. */
2070 info->prstatus->pr_fpvalid = elf_core_copy_task_fpregs(current, regs,
2071 info->fpu);
2072 if (info->prstatus->pr_fpvalid)
2073 fill_note(info->notes + info->numnote++,
2074 "CORE", NT_PRFPREG, sizeof(*info->fpu), info->fpu);
Roland McGrath3aba4812008-01-30 13:31:44 +01002075 return 1;
Roland McGrath3aba4812008-01-30 13:31:44 +01002076}
2077
2078static size_t get_note_info_size(struct elf_note_info *info)
2079{
2080 int sz = 0;
2081 int i;
2082
2083 for (i = 0; i < info->numnote; i++)
2084 sz += notesize(info->notes + i);
2085
2086 sz += info->thread_status_size;
2087
2088 return sz;
2089}
2090
2091static int write_note_info(struct elf_note_info *info,
Al Viroecc8c772013-10-05 15:32:35 -04002092 struct coredump_params *cprm)
Roland McGrath3aba4812008-01-30 13:31:44 +01002093{
Alexey Dobriyan93f044e2019-03-07 16:28:59 -08002094 struct elf_thread_status *ets;
Roland McGrath3aba4812008-01-30 13:31:44 +01002095 int i;
Roland McGrath3aba4812008-01-30 13:31:44 +01002096
2097 for (i = 0; i < info->numnote; i++)
Al Viroecc8c772013-10-05 15:32:35 -04002098 if (!writenote(info->notes + i, cprm))
Roland McGrath3aba4812008-01-30 13:31:44 +01002099 return 0;
2100
2101 /* write out the thread status notes section */
Alexey Dobriyan93f044e2019-03-07 16:28:59 -08002102 list_for_each_entry(ets, &info->thread_list, list) {
2103 for (i = 0; i < ets->num_notes; i++)
2104 if (!writenote(&ets->notes[i], cprm))
Roland McGrath3aba4812008-01-30 13:31:44 +01002105 return 0;
2106 }
2107
2108 return 1;
2109}
2110
2111static void free_note_info(struct elf_note_info *info)
2112{
2113 while (!list_empty(&info->thread_list)) {
2114 struct list_head *tmp = info->thread_list.next;
2115 list_del(tmp);
2116 kfree(list_entry(tmp, struct elf_thread_status, list));
2117 }
2118
Dan Aloni72023652013-09-30 13:45:02 -07002119 /* Free data possibly allocated by fill_files_note(): */
2120 if (info->notes_files)
Alexey Dobriyan86a2bb52018-06-14 15:27:24 -07002121 kvfree(info->notes_files->data);
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07002122
Roland McGrath3aba4812008-01-30 13:31:44 +01002123 kfree(info->prstatus);
2124 kfree(info->psinfo);
2125 kfree(info->notes);
2126 kfree(info->fpu);
Roland McGrath3aba4812008-01-30 13:31:44 +01002127}
2128
Roland McGrath4206d3a2008-01-30 13:31:45 +01002129#endif
2130
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002131static void fill_extnum_info(struct elfhdr *elf, struct elf_shdr *shdr4extnum,
2132 elf_addr_t e_shoff, int segs)
2133{
2134 elf->e_shoff = e_shoff;
2135 elf->e_shentsize = sizeof(*shdr4extnum);
2136 elf->e_shnum = 1;
2137 elf->e_shstrndx = SHN_UNDEF;
2138
2139 memset(shdr4extnum, 0, sizeof(*shdr4extnum));
2140
2141 shdr4extnum->sh_type = SHT_NULL;
2142 shdr4extnum->sh_size = elf->e_shnum;
2143 shdr4extnum->sh_link = elf->e_shstrndx;
2144 shdr4extnum->sh_info = segs;
2145}
2146
Linus Torvalds1da177e2005-04-16 15:20:36 -07002147/*
2148 * Actual dumper
2149 *
2150 * This is a two-pass process; first we find the offsets of the bits,
2151 * and then they are actually written out. If we run out of core limit
2152 * we just truncate.
2153 */
Masami Hiramatsuf6151df2009-12-17 15:27:16 -08002154static int elf_core_dump(struct coredump_params *cprm)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002155{
Linus Torvalds1da177e2005-04-16 15:20:36 -07002156 int has_dumped = 0;
Jann Horna07279c2020-10-15 20:12:54 -07002157 int vma_count, segs, i;
2158 size_t vma_data_size;
Alexey Dobriyan225a3f52020-01-30 22:17:04 -08002159 struct elfhdr elf;
Al Virocdc3d562013-10-05 22:24:29 -04002160 loff_t offset = 0, dataoff;
Dan Aloni72023652013-09-30 13:45:02 -07002161 struct elf_note_info info = { };
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002162 struct elf_phdr *phdr4note = NULL;
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002163 struct elf_shdr *shdr4extnum = NULL;
2164 Elf_Half e_phnum;
2165 elf_addr_t e_shoff;
Jann Horna07279c2020-10-15 20:12:54 -07002166 struct core_vma_metadata *vma_meta;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002167
Jann Horna07279c2020-10-15 20:12:54 -07002168 if (dump_vma_snapshot(cprm, &vma_count, &vma_meta, &vma_data_size))
2169 return 0;
2170
KAMEZAWA Hiroyuki341c87b2009-06-30 11:41:23 -07002171 /*
2172 * The number of segs are recored into ELF header as 16bit value.
2173 * Please check DEFAULT_MAX_MAP_COUNT definition when you modify here.
2174 */
Jann Horna07279c2020-10-15 20:12:54 -07002175 segs = vma_count + elf_core_extra_phdrs();
Roland McGrathf47aef52007-01-26 00:56:49 -08002176
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002177 /* for notes section */
2178 segs++;
2179
2180 /* If segs > PN_XNUM(0xffff), then e_phnum overflows. To avoid
2181 * this, kernel supports extended numbering. Have a look at
2182 * include/linux/elf.h for further information. */
2183 e_phnum = segs > PN_XNUM ? PN_XNUM : segs;
2184
Roland McGrath3aba4812008-01-30 13:31:44 +01002185 /*
2186 * Collect all the non-memory information about the process for the
2187 * notes. This also sets up the file header.
2188 */
Alexey Dobriyan225a3f52020-01-30 22:17:04 -08002189 if (!fill_note_info(&elf, e_phnum, &info, cprm->siginfo, cprm->regs))
Christoph Hellwigd2530b42020-05-05 12:12:55 +02002190 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002191
2192 has_dumped = 1;
Oleg Nesterov079148b2013-04-30 15:28:16 -07002193
Alexey Dobriyan225a3f52020-01-30 22:17:04 -08002194 offset += sizeof(elf); /* Elf header */
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002195 offset += segs * sizeof(struct elf_phdr); /* Program headers */
Linus Torvalds1da177e2005-04-16 15:20:36 -07002196
2197 /* Write notes phdr entry */
2198 {
Roland McGrath3aba4812008-01-30 13:31:44 +01002199 size_t sz = get_note_info_size(&info);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002200
Michael Ellermane5501492007-09-19 14:38:12 +10002201 sz += elf_coredump_extra_notes_size();
Dwayne Grant McConnellbf1ab972006-11-23 00:46:37 +01002202
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002203 phdr4note = kmalloc(sizeof(*phdr4note), GFP_KERNEL);
2204 if (!phdr4note)
Daisuke HATAYAMA088e7af2010-03-05 13:44:06 -08002205 goto end_coredump;
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002206
2207 fill_elf_note_phdr(phdr4note, sz, offset);
2208 offset += sz;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002209 }
2210
Linus Torvalds1da177e2005-04-16 15:20:36 -07002211 dataoff = offset = roundup(offset, ELF_EXEC_PAGESIZE);
2212
Jungseung Lee52f5592e2014-12-10 15:52:16 -08002213 offset += vma_data_size;
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002214 offset += elf_core_extra_data_size();
2215 e_shoff = offset;
2216
2217 if (e_phnum == PN_XNUM) {
2218 shdr4extnum = kmalloc(sizeof(*shdr4extnum), GFP_KERNEL);
2219 if (!shdr4extnum)
2220 goto end_coredump;
Alexey Dobriyan225a3f52020-01-30 22:17:04 -08002221 fill_extnum_info(&elf, shdr4extnum, e_shoff, segs);
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002222 }
2223
2224 offset = dataoff;
2225
Alexey Dobriyan225a3f52020-01-30 22:17:04 -08002226 if (!dump_emit(cprm, &elf, sizeof(elf)))
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002227 goto end_coredump;
2228
Al Viroecc8c772013-10-05 15:32:35 -04002229 if (!dump_emit(cprm, phdr4note, sizeof(*phdr4note)))
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002230 goto end_coredump;
2231
Linus Torvalds1da177e2005-04-16 15:20:36 -07002232 /* Write program headers for segments dump */
Jann Horna07279c2020-10-15 20:12:54 -07002233 for (i = 0; i < vma_count; i++) {
2234 struct core_vma_metadata *meta = vma_meta + i;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002235 struct elf_phdr phdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002236
2237 phdr.p_type = PT_LOAD;
2238 phdr.p_offset = offset;
Jann Horna07279c2020-10-15 20:12:54 -07002239 phdr.p_vaddr = meta->start;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002240 phdr.p_paddr = 0;
Jann Horna07279c2020-10-15 20:12:54 -07002241 phdr.p_filesz = meta->dump_size;
2242 phdr.p_memsz = meta->end - meta->start;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002243 offset += phdr.p_filesz;
Jann Horna07279c2020-10-15 20:12:54 -07002244 phdr.p_flags = 0;
2245 if (meta->flags & VM_READ)
2246 phdr.p_flags |= PF_R;
2247 if (meta->flags & VM_WRITE)
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07002248 phdr.p_flags |= PF_W;
Jann Horna07279c2020-10-15 20:12:54 -07002249 if (meta->flags & VM_EXEC)
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07002250 phdr.p_flags |= PF_X;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002251 phdr.p_align = ELF_EXEC_PAGESIZE;
2252
Al Viroecc8c772013-10-05 15:32:35 -04002253 if (!dump_emit(cprm, &phdr, sizeof(phdr)))
Daisuke HATAYAMA088e7af2010-03-05 13:44:06 -08002254 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002255 }
2256
Al Viro506f21c2013-10-05 17:22:57 -04002257 if (!elf_core_write_extra_phdrs(cprm, offset))
Daisuke HATAYAMA1fcccba2010-03-05 13:44:07 -08002258 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002259
2260 /* write out the notes section */
Al Viroecc8c772013-10-05 15:32:35 -04002261 if (!write_note_info(&info, cprm))
Roland McGrath3aba4812008-01-30 13:31:44 +01002262 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002263
Al Virocdc3d562013-10-05 22:24:29 -04002264 if (elf_coredump_extra_notes_write(cprm))
Michael Ellermane5501492007-09-19 14:38:12 +10002265 goto end_coredump;
Dwayne Grant McConnellbf1ab972006-11-23 00:46:37 +01002266
Andi Kleend025c9d2006-09-30 23:29:28 -07002267 /* Align to page */
Mateusz Guzik1607f092016-06-05 23:14:14 +02002268 if (!dump_skip(cprm, dataoff - cprm->pos))
Hugh Dickinsf3e8fcc2009-09-21 17:03:25 -07002269 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002270
Jann Horna07279c2020-10-15 20:12:54 -07002271 for (i = 0; i < vma_count; i++) {
2272 struct core_vma_metadata *meta = vma_meta + i;
2273
2274 if (!dump_user_range(cprm, meta->start, meta->dump_size))
Jann Hornafc63a97b2020-10-15 20:12:46 -07002275 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002276 }
Dave Kleikamp4d22c752017-01-11 13:25:00 -06002277 dump_truncate(cprm);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002278
Al Viroaa3e7ea2013-10-05 17:50:15 -04002279 if (!elf_core_write_extra_data(cprm))
Daisuke HATAYAMA1fcccba2010-03-05 13:44:07 -08002280 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002281
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002282 if (e_phnum == PN_XNUM) {
Al Viro13046ec2013-10-05 18:08:47 -04002283 if (!dump_emit(cprm, shdr4extnum, sizeof(*shdr4extnum)))
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002284 goto end_coredump;
2285 }
2286
Linus Torvalds1da177e2005-04-16 15:20:36 -07002287end_coredump:
Roland McGrath3aba4812008-01-30 13:31:44 +01002288 free_note_info(&info);
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002289 kfree(shdr4extnum);
Jann Horna07279c2020-10-15 20:12:54 -07002290 kvfree(vma_meta);
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002291 kfree(phdr4note);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002292 return has_dumped;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002293}
2294
Christoph Hellwig698ba7b2009-12-15 16:47:37 -08002295#endif /* CONFIG_ELF_CORE */
Linus Torvalds1da177e2005-04-16 15:20:36 -07002296
2297static int __init init_elf_binfmt(void)
2298{
Al Viro8fc3dc52012-03-17 03:05:16 -04002299 register_binfmt(&elf_format);
2300 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002301}
2302
2303static void __exit exit_elf_binfmt(void)
2304{
2305 /* Remove the COFF and ELF loaders. */
2306 unregister_binfmt(&elf_format);
2307}
2308
2309core_initcall(init_elf_binfmt);
2310module_exit(exit_elf_binfmt);
2311MODULE_LICENSE("GPL");