// SPDX-License-Identifier: GPL-2.0-only
/*
 * linux/fs/binfmt_elf.c
 *
 * These are the functions used to load ELF format executables as used
 * on SVr4 machines.  Information on the format may be found in the book
 * "UNIX SYSTEM V RELEASE 4 Programmers Guide: Ansi C and Programming Support
 * Tools".
 *
 * Copyright 1993, 1994: Eric Youngdale (ericy@cais.com).
 */
12
13#include <linux/module.h>
14#include <linux/kernel.h>
15#include <linux/fs.h>
Chris Kennellyce81bb22020-10-15 20:12:32 -070016#include <linux/log2.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/mm.h>
18#include <linux/mman.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070019#include <linux/errno.h>
20#include <linux/signal.h>
21#include <linux/binfmts.h>
22#include <linux/string.h>
23#include <linux/file.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070024#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025#include <linux/personality.h>
26#include <linux/elfcore.h>
27#include <linux/init.h>
28#include <linux/highuid.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070029#include <linux/compiler.h>
30#include <linux/highmem.h>
Anshuman Khandual03911132020-04-06 20:03:51 -070031#include <linux/hugetlb.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <linux/pagemap.h>
Denys Vlasenko2aa362c2012-10-04 17:15:36 -070033#include <linux/vmalloc.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070034#include <linux/security.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035#include <linux/random.h>
Jesper Juhlf4e5cc22006-06-23 02:05:35 -070036#include <linux/elf.h>
Kees Cookd1fd8362015-04-14 15:48:07 -070037#include <linux/elf-randomize.h>
Alexey Dobriyan7e80d0d2007-05-08 00:28:59 -070038#include <linux/utsname.h>
Daisuke HATAYAMA088e7af2010-03-05 13:44:06 -080039#include <linux/coredump.h>
Frederic Weisbecker6fac4822012-11-13 14:20:55 +010040#include <linux/sched.h>
Ingo Molnarf7ccbae2017-02-08 18:51:30 +010041#include <linux/sched/coredump.h>
Ingo Molnar68db0cf2017-02-08 18:51:37 +010042#include <linux/sched/task_stack.h>
Ingo Molnar32ef5512017-02-05 11:48:36 +010043#include <linux/sched/cputime.h>
Dave Martin00e19ce2020-03-16 16:50:44 +000044#include <linux/sizes.h>
45#include <linux/types.h>
Ingo Molnar5b825c32017-02-02 17:54:15 +010046#include <linux/cred.h>
Ross Zwisler50378352015-10-05 16:33:36 -060047#include <linux/dax.h>
Linus Torvalds7c0f6ba2016-12-24 11:46:01 -080048#include <linux/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070049#include <asm/param.h>
50#include <asm/page.h>
51
/* Default ELF_COMPAT to 0 when nothing has defined it before this point. */
#if !defined(ELF_COMPAT)
#define ELF_COMPAT 0
#endif

/* Fallback spellings for the user-visible long and siginfo types. */
#if !defined(user_long_t)
#define user_long_t long
#endif
#if !defined(user_siginfo_t)
#define user_siginfo_t siginfo_t
#endif

/* That's for binfmt_elf_fdpic to deal with */
#if !defined(elf_check_fdpic)
#define elf_check_fdpic(ex) false
#endif
67
static int load_elf_binary(struct linux_binprm *bprm);

/*
 * The shared-library loader only exists with CONFIG_USELIB; otherwise the
 * name expands to NULL so it can still be used in an initializer.
 */
#ifndef CONFIG_USELIB
#define load_elf_library NULL
#else
static int load_elf_library(struct file *);
#endif

/*
 * If we don't support core dumping, then supply a NULL so we
 * don't even try.
 */
#ifndef CONFIG_ELF_CORE
#define elf_core_dump NULL
#else
static int elf_core_dump(struct coredump_params *cprm);
#endif
85
/* ELF_MIN_ALIGN is whichever of ELF_EXEC_PAGESIZE and PAGE_SIZE is larger. */
#if ELF_EXEC_PAGESIZE <= PAGE_SIZE
#define ELF_MIN_ALIGN	PAGE_SIZE
#else
#define ELF_MIN_ALIGN	ELF_EXEC_PAGESIZE
#endif

#if !defined(ELF_CORE_EFLAGS)
#define ELF_CORE_EFLAGS	0
#endif

/*
 * Mask helpers built on ELF_MIN_ALIGN:
 *   ELF_PAGESTART  - clear the bits below ELF_MIN_ALIGN
 *   ELF_PAGEOFFSET - keep only the bits below ELF_MIN_ALIGN
 *   ELF_PAGEALIGN  - add ELF_MIN_ALIGN - 1, then clear the low bits
 */
#define ELF_PAGESTART(_v) ((_v) & ~(unsigned long)(ELF_MIN_ALIGN-1))
#define ELF_PAGEOFFSET(_v) ((_v) & (ELF_MIN_ALIGN-1))
#define ELF_PAGEALIGN(_v) (((_v) + ELF_MIN_ALIGN - 1) & ~(ELF_MIN_ALIGN - 1))
99
100static struct linux_binfmt elf_format = {
Mikael Petterssonf670d0e2011-01-12 17:00:02 -0800101 .module = THIS_MODULE,
102 .load_binary = load_elf_binary,
103 .load_shlib = load_elf_library,
104 .core_dump = elf_core_dump,
105 .min_coredump = ELF_EXEC_PAGESIZE,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106};
107
Alexey Dobriyan18676ff2020-01-30 22:17:01 -0800108#define BAD_ADDR(x) (unlikely((unsigned long)(x) >= TASK_SIZE))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800110static int set_brk(unsigned long start, unsigned long end, int prot)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111{
112 start = ELF_PAGEALIGN(start);
113 end = ELF_PAGEALIGN(end);
114 if (end > start) {
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800115 /*
116 * Map the last of the bss segment.
117 * If the header is requesting these pages to be
118 * executable, honour that (ppc32 needs this).
119 */
120 int error = vm_brk_flags(start, end - start,
121 prot & PROT_EXEC ? VM_EXEC : 0);
Linus Torvalds5d22fc22016-05-27 15:57:31 -0700122 if (error)
123 return error;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124 }
125 current->mm->start_brk = current->mm->brk = end;
126 return 0;
127}
128
Linus Torvalds1da177e2005-04-16 15:20:36 -0700129/* We need to explicitly zero any fractional pages
130 after the data section (i.e. bss). This would
131 contain the junk from the file that should not
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700132 be in memory
133 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134static int padzero(unsigned long elf_bss)
135{
136 unsigned long nbyte;
137
138 nbyte = ELF_PAGEOFFSET(elf_bss);
139 if (nbyte) {
140 nbyte = ELF_MIN_ALIGN - nbyte;
141 if (clear_user((void __user *) elf_bss, nbyte))
142 return -EFAULT;
143 }
144 return 0;
145}
146
/*
 * Stack manipulation helpers; which set is used depends on the direction
 * in which the stack grows.
 *
 *   STACK_ADD(sp, items)   - sp moved by @items elf_addr_t slots in the
 *                            growth direction, as an elf_addr_t pointer
 *   STACK_ROUND(sp, items) - address of sp moved by @items elements,
 *                            rounded to a 16-byte boundary (up when the
 *                            stack grows up, down otherwise)
 *   STACK_ALLOC(sp, len)   - move sp by @len and yield the start of the
 *                            newly reserved area; sp must be an lvalue
 *
 * Every macro argument is parenthesized in the expansion so that callers
 * may pass arbitrary expressions (e.g. "a + b") without precedence
 * surprises.
 */
#ifdef CONFIG_STACK_GROWSUP
#define STACK_ADD(sp, items) ((elf_addr_t __user *)(sp) + (items))
#define STACK_ROUND(sp, items) \
	((15 + (unsigned long) ((sp) + (items))) &~ 15UL)
#define STACK_ALLOC(sp, len) ({ \
	elf_addr_t __user *old_sp = (elf_addr_t __user *)(sp); \
	(sp) += (len); \
	old_sp; })
#else
#define STACK_ADD(sp, items) ((elf_addr_t __user *)(sp) - (items))
#define STACK_ROUND(sp, items) \
	(((unsigned long) ((sp) - (items))) &~ 15UL)
#define STACK_ALLOC(sp, len) ((sp) -= (len))
#endif
161
/*
 * AT_BASE_PLATFORM indicates the "real" hardware/microarchitecture.
 * If the arch defines ELF_BASE_PLATFORM (in asm/elf.h), the value
 * will be copied to the user stack in the same manner as AT_PLATFORM.
 * Without an arch definition it falls back to NULL.
 */
#if !defined(ELF_BASE_PLATFORM)
#define ELF_BASE_PLATFORM NULL
#endif
170
Linus Torvalds1da177e2005-04-16 15:20:36 -0700171static int
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800172create_elf_tables(struct linux_binprm *bprm, const struct elfhdr *exec,
173 unsigned long load_addr, unsigned long interp_load_addr,
174 unsigned long e_entry)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700175{
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800176 struct mm_struct *mm = current->mm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177 unsigned long p = bprm->p;
178 int argc = bprm->argc;
179 int envc = bprm->envc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180 elf_addr_t __user *sp;
181 elf_addr_t __user *u_platform;
Nathan Lynch483fad12008-07-22 04:48:46 +1000182 elf_addr_t __user *u_base_platform;
Kees Cookf06295b2009-01-07 18:08:52 -0800183 elf_addr_t __user *u_rand_bytes;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184 const char *k_platform = ELF_PLATFORM;
Nathan Lynch483fad12008-07-22 04:48:46 +1000185 const char *k_base_platform = ELF_BASE_PLATFORM;
Kees Cookf06295b2009-01-07 18:08:52 -0800186 unsigned char k_rand_bytes[16];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700187 int items;
188 elf_addr_t *elf_info;
Laurent Vivier23479612020-01-28 14:25:39 +0100189 elf_addr_t flags = 0;
Alexey Dobriyan1f83d802020-01-30 22:16:50 -0800190 int ei_index;
David Howells86a264a2008-11-14 10:39:18 +1100191 const struct cred *cred = current_cred();
Ollie Wildb6a2fea2007-07-19 01:48:16 -0700192 struct vm_area_struct *vma;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700193
194 /*
Franck Bui-Huud68c9d62007-10-16 23:30:24 -0700195 * In some cases (e.g. Hyper-Threading), we want to avoid L1
196 * evictions by the processes running on the same package. One
197 * thing we can do is to shuffle the initial stack for them.
198 */
199
200 p = arch_align_stack(p);
201
202 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203 * If this architecture has a platform capability string, copy it
204 * to userspace. In some cases (Sparc), this info is impossible
205 * for userspace to get any other way, in others (i386) it is
206 * merely difficult.
207 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700208 u_platform = NULL;
209 if (k_platform) {
210 size_t len = strlen(k_platform) + 1;
211
Linus Torvalds1da177e2005-04-16 15:20:36 -0700212 u_platform = (elf_addr_t __user *)STACK_ALLOC(p, len);
Al Viro646e84d2020-02-19 09:23:34 -0500213 if (copy_to_user(u_platform, k_platform, len))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214 return -EFAULT;
215 }
216
Nathan Lynch483fad12008-07-22 04:48:46 +1000217 /*
218 * If this architecture has a "base" platform capability
219 * string, copy it to userspace.
220 */
221 u_base_platform = NULL;
222 if (k_base_platform) {
223 size_t len = strlen(k_base_platform) + 1;
224
225 u_base_platform = (elf_addr_t __user *)STACK_ALLOC(p, len);
Al Viro646e84d2020-02-19 09:23:34 -0500226 if (copy_to_user(u_base_platform, k_base_platform, len))
Nathan Lynch483fad12008-07-22 04:48:46 +1000227 return -EFAULT;
228 }
229
Kees Cookf06295b2009-01-07 18:08:52 -0800230 /*
231 * Generate 16 random bytes for userspace PRNG seeding.
232 */
233 get_random_bytes(k_rand_bytes, sizeof(k_rand_bytes));
234 u_rand_bytes = (elf_addr_t __user *)
235 STACK_ALLOC(p, sizeof(k_rand_bytes));
Al Viro646e84d2020-02-19 09:23:34 -0500236 if (copy_to_user(u_rand_bytes, k_rand_bytes, sizeof(k_rand_bytes)))
Kees Cookf06295b2009-01-07 18:08:52 -0800237 return -EFAULT;
238
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239 /* Create the ELF interpreter info */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800240 elf_info = (elf_addr_t *)mm->saved_auxv;
Olaf Hering4f9a58d2007-10-16 23:30:12 -0700241 /* update AT_VECTOR_SIZE_BASE if the number of NEW_AUX_ENT() changes */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700242#define NEW_AUX_ENT(id, val) \
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700243 do { \
Alexey Dobriyan1f83d802020-01-30 22:16:50 -0800244 *elf_info++ = id; \
245 *elf_info++ = val; \
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700246 } while (0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247
248#ifdef ARCH_DLINFO
249 /*
250 * ARCH_DLINFO must come first so PPC can do its special alignment of
251 * AUXV.
Olaf Hering4f9a58d2007-10-16 23:30:12 -0700252 * update AT_VECTOR_SIZE_ARCH if the number of NEW_AUX_ENT() in
253 * ARCH_DLINFO changes
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254 */
255 ARCH_DLINFO;
256#endif
257 NEW_AUX_ENT(AT_HWCAP, ELF_HWCAP);
258 NEW_AUX_ENT(AT_PAGESZ, ELF_EXEC_PAGESIZE);
259 NEW_AUX_ENT(AT_CLKTCK, CLOCKS_PER_SEC);
260 NEW_AUX_ENT(AT_PHDR, load_addr + exec->e_phoff);
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700261 NEW_AUX_ENT(AT_PHENT, sizeof(struct elf_phdr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262 NEW_AUX_ENT(AT_PHNUM, exec->e_phnum);
263 NEW_AUX_ENT(AT_BASE, interp_load_addr);
Laurent Vivier23479612020-01-28 14:25:39 +0100264 if (bprm->interp_flags & BINPRM_FLAGS_PRESERVE_ARGV0)
265 flags |= AT_FLAGS_PRESERVE_ARGV0;
266 NEW_AUX_ENT(AT_FLAGS, flags);
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800267 NEW_AUX_ENT(AT_ENTRY, e_entry);
Eric W. Biedermanebc887b2012-02-07 18:36:10 -0800268 NEW_AUX_ENT(AT_UID, from_kuid_munged(cred->user_ns, cred->uid));
269 NEW_AUX_ENT(AT_EUID, from_kuid_munged(cred->user_ns, cred->euid));
270 NEW_AUX_ENT(AT_GID, from_kgid_munged(cred->user_ns, cred->gid));
271 NEW_AUX_ENT(AT_EGID, from_kgid_munged(cred->user_ns, cred->egid));
Kees Cookc425e182017-07-18 15:25:22 -0700272 NEW_AUX_ENT(AT_SECURE, bprm->secureexec);
Kees Cookf06295b2009-01-07 18:08:52 -0800273 NEW_AUX_ENT(AT_RANDOM, (elf_addr_t)(unsigned long)u_rand_bytes);
Michael Neuling21713642013-04-17 17:33:11 +0000274#ifdef ELF_HWCAP2
275 NEW_AUX_ENT(AT_HWCAP2, ELF_HWCAP2);
276#endif
John Reiser65191082008-07-21 14:21:32 -0700277 NEW_AUX_ENT(AT_EXECFN, bprm->exec);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700278 if (k_platform) {
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700279 NEW_AUX_ENT(AT_PLATFORM,
Jesper Juhl785d5572006-06-23 02:05:35 -0700280 (elf_addr_t)(unsigned long)u_platform);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700281 }
Nathan Lynch483fad12008-07-22 04:48:46 +1000282 if (k_base_platform) {
283 NEW_AUX_ENT(AT_BASE_PLATFORM,
284 (elf_addr_t)(unsigned long)u_base_platform);
285 }
Eric W. Biedermanb8a61c92020-05-14 15:17:40 -0500286 if (bprm->have_execfd) {
287 NEW_AUX_ENT(AT_EXECFD, bprm->execfd);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288 }
289#undef NEW_AUX_ENT
290 /* AT_NULL is zero; clear the rest too */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800291 memset(elf_info, 0, (char *)mm->saved_auxv +
292 sizeof(mm->saved_auxv) - (char *)elf_info);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293
294 /* And advance past the AT_NULL entry. */
Alexey Dobriyan1f83d802020-01-30 22:16:50 -0800295 elf_info += 2;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700296
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800297 ei_index = elf_info - (elf_addr_t *)mm->saved_auxv;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298 sp = STACK_ADD(p, ei_index);
299
Andi Kleend20894a2008-02-08 04:21:54 -0800300 items = (argc + 1) + (envc + 1) + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301 bprm->p = STACK_ROUND(sp, items);
302
303 /* Point sp at the lowest address on the stack */
304#ifdef CONFIG_STACK_GROWSUP
305 sp = (elf_addr_t __user *)bprm->p - items - ei_index;
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700306 bprm->exec = (unsigned long)sp; /* XXX: PARISC HACK */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700307#else
308 sp = (elf_addr_t __user *)bprm->p;
309#endif
310
Ollie Wildb6a2fea2007-07-19 01:48:16 -0700311
312 /*
313 * Grow the stack manually; some architectures have a limit on how
314 * far ahead a user-space access may be in order to grow the stack.
315 */
Jann Hornb2767d92020-10-17 16:14:15 -0700316 if (mmap_read_lock_killable(mm))
317 return -EINTR;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800318 vma = find_extend_vma(mm, bprm->p);
Jann Hornb2767d92020-10-17 16:14:15 -0700319 mmap_read_unlock(mm);
Ollie Wildb6a2fea2007-07-19 01:48:16 -0700320 if (!vma)
321 return -EFAULT;
322
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323 /* Now, let's put argc (and argv, envp if appropriate) on the stack */
Al Viro646e84d2020-02-19 09:23:34 -0500324 if (put_user(argc, sp++))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700325 return -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700326
Kees Cook67c67772017-07-10 15:52:54 -0700327 /* Populate list of argv pointers back to argv strings. */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800328 p = mm->arg_end = mm->arg_start;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700329 while (argc-- > 0) {
330 size_t len;
Al Viro646e84d2020-02-19 09:23:34 -0500331 if (put_user((elf_addr_t)p, sp++))
Heiko Carstens841d5fb2006-12-06 20:36:35 -0800332 return -EFAULT;
Ollie Wildb6a2fea2007-07-19 01:48:16 -0700333 len = strnlen_user((void __user *)p, MAX_ARG_STRLEN);
334 if (!len || len > MAX_ARG_STRLEN)
WANG Cong23c49712008-05-08 21:52:33 +0800335 return -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336 p += len;
337 }
Al Viro646e84d2020-02-19 09:23:34 -0500338 if (put_user(0, sp++))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 return -EFAULT;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800340 mm->arg_end = p;
Kees Cook67c67772017-07-10 15:52:54 -0700341
342 /* Populate list of envp pointers back to envp strings. */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800343 mm->env_end = mm->env_start = p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344 while (envc-- > 0) {
345 size_t len;
Al Viro646e84d2020-02-19 09:23:34 -0500346 if (put_user((elf_addr_t)p, sp++))
Heiko Carstens841d5fb2006-12-06 20:36:35 -0800347 return -EFAULT;
Ollie Wildb6a2fea2007-07-19 01:48:16 -0700348 len = strnlen_user((void __user *)p, MAX_ARG_STRLEN);
349 if (!len || len > MAX_ARG_STRLEN)
WANG Cong23c49712008-05-08 21:52:33 +0800350 return -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351 p += len;
352 }
Al Viro646e84d2020-02-19 09:23:34 -0500353 if (put_user(0, sp++))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354 return -EFAULT;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800355 mm->env_end = p;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356
357 /* Put the elf_info on the stack in the right place. */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800358 if (copy_to_user(sp, mm->saved_auxv, ei_index * sizeof(elf_addr_t)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359 return -EFAULT;
360 return 0;
361}
362
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363static unsigned long elf_map(struct file *filep, unsigned long addr,
Alexey Dobriyan49ac9812019-03-07 16:29:03 -0800364 const struct elf_phdr *eppnt, int prot, int type,
Jiri Kosinacc503c12008-01-30 13:31:07 +0100365 unsigned long total_size)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700366{
367 unsigned long map_addr;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100368 unsigned long size = eppnt->p_filesz + ELF_PAGEOFFSET(eppnt->p_vaddr);
369 unsigned long off = eppnt->p_offset - ELF_PAGEOFFSET(eppnt->p_vaddr);
370 addr = ELF_PAGESTART(addr);
371 size = ELF_PAGEALIGN(size);
Jan Kratochvil60bfba72007-07-15 23:40:06 -0700372
Andrew Mortond4e3cc32007-07-21 04:37:32 -0700373 /* mmap() will return -EINVAL if given a zero size, but a
374 * segment with zero filesize is perfectly valid */
Jiri Kosinacc503c12008-01-30 13:31:07 +0100375 if (!size)
376 return addr;
377
Jiri Kosinacc503c12008-01-30 13:31:07 +0100378 /*
379 * total_size is the size of the ELF (interpreter) image.
380 * The _first_ mmap needs to know the full size, otherwise
381 * randomization might put this image into an overlapping
382 * position with the ELF binary image. (since size < total_size)
383 * So we first map the 'big' image - and unmap the remainder at
384 * the end. (which unmap is needed for ELF images with holes.)
385 */
386 if (total_size) {
387 total_size = ELF_PAGEALIGN(total_size);
Al Viro5a5e4c22012-05-30 01:49:38 -0400388 map_addr = vm_mmap(filep, addr, total_size, prot, type, off);
Jiri Kosinacc503c12008-01-30 13:31:07 +0100389 if (!BAD_ADDR(map_addr))
Al Viro5a5e4c22012-05-30 01:49:38 -0400390 vm_munmap(map_addr+size, total_size-size);
Jiri Kosinacc503c12008-01-30 13:31:07 +0100391 } else
Al Viro5a5e4c22012-05-30 01:49:38 -0400392 map_addr = vm_mmap(filep, addr, size, prot, type, off);
Jiri Kosinacc503c12008-01-30 13:31:07 +0100393
Tetsuo Handad23a61e2018-04-20 14:56:13 -0700394 if ((type & MAP_FIXED_NOREPLACE) &&
395 PTR_ERR((void *)map_addr) == -EEXIST)
396 pr_info("%d (%s): Uhuuh, elf segment at %px requested but the memory is mapped already\n",
397 task_pid_nr(current), current->comm, (void *)addr);
Michal Hocko4ed28632018-04-10 16:36:01 -0700398
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399 return(map_addr);
400}
401
Alexey Dobriyan49ac9812019-03-07 16:29:03 -0800402static unsigned long total_mapping_size(const struct elf_phdr *cmds, int nr)
Jiri Kosinacc503c12008-01-30 13:31:07 +0100403{
404 int i, first_idx = -1, last_idx = -1;
405
406 for (i = 0; i < nr; i++) {
407 if (cmds[i].p_type == PT_LOAD) {
408 last_idx = i;
409 if (first_idx == -1)
410 first_idx = i;
411 }
412 }
413 if (first_idx == -1)
414 return 0;
415
416 return cmds[last_idx].p_vaddr + cmds[last_idx].p_memsz -
417 ELF_PAGESTART(cmds[first_idx].p_vaddr);
418}
419
Alexey Dobriyan658c0332019-12-04 16:52:25 -0800420static int elf_read(struct file *file, void *buf, size_t len, loff_t pos)
421{
422 ssize_t rv;
423
424 rv = kernel_read(file, buf, len, &pos);
425 if (unlikely(rv != len)) {
426 return (rv < 0) ? rv : -EIO;
427 }
428 return 0;
429}
430
Chris Kennellyce81bb22020-10-15 20:12:32 -0700431static unsigned long maximum_alignment(struct elf_phdr *cmds, int nr)
432{
433 unsigned long alignment = 0;
434 int i;
435
436 for (i = 0; i < nr; i++) {
437 if (cmds[i].p_type == PT_LOAD) {
438 unsigned long p_align = cmds[i].p_align;
439
440 /* skip non-power of two alignments as invalid */
441 if (!is_power_of_2(p_align))
442 continue;
443 alignment = max(alignment, p_align);
444 }
445 }
446
447 /* ensure we align to at least one page */
448 return ELF_PAGEALIGN(alignment);
449}
450
Paul Burton6a8d3892014-09-11 08:30:14 +0100451/**
452 * load_elf_phdrs() - load ELF program headers
453 * @elf_ex: ELF header of the binary whose program headers should be loaded
454 * @elf_file: the opened ELF binary file
455 *
456 * Loads ELF program headers from the binary file elf_file, which has the ELF
457 * header pointed to by elf_ex, into a newly allocated array. The caller is
458 * responsible for freeing the allocated data. Returns an ERR_PTR upon failure.
459 */
Alexey Dobriyan49ac9812019-03-07 16:29:03 -0800460static struct elf_phdr *load_elf_phdrs(const struct elfhdr *elf_ex,
Paul Burton6a8d3892014-09-11 08:30:14 +0100461 struct file *elf_file)
462{
463 struct elf_phdr *elf_phdata = NULL;
Alexey Dobriyanfaf1c312019-03-07 16:28:56 -0800464 int retval, err = -1;
Alexey Dobriyanfaf1c312019-03-07 16:28:56 -0800465 unsigned int size;
Paul Burton6a8d3892014-09-11 08:30:14 +0100466
467 /*
468 * If the size of this structure has changed, then punt, since
469 * we will be doing the wrong thing.
470 */
471 if (elf_ex->e_phentsize != sizeof(struct elf_phdr))
472 goto out;
473
474 /* Sanity check the number of program headers... */
Paul Burton6a8d3892014-09-11 08:30:14 +0100475 /* ...and their total size. */
476 size = sizeof(struct elf_phdr) * elf_ex->e_phnum;
Alexey Dobriyanfaf1c312019-03-07 16:28:56 -0800477 if (size == 0 || size > 65536 || size > ELF_MIN_ALIGN)
Paul Burton6a8d3892014-09-11 08:30:14 +0100478 goto out;
479
480 elf_phdata = kmalloc(size, GFP_KERNEL);
481 if (!elf_phdata)
482 goto out;
483
484 /* Read in the program headers */
Alexey Dobriyan658c0332019-12-04 16:52:25 -0800485 retval = elf_read(elf_file, elf_phdata, size, elf_ex->e_phoff);
486 if (retval < 0) {
487 err = retval;
Paul Burton6a8d3892014-09-11 08:30:14 +0100488 goto out;
489 }
490
491 /* Success! */
492 err = 0;
493out:
494 if (err) {
495 kfree(elf_phdata);
496 elf_phdata = NULL;
497 }
498 return elf_phdata;
499}
Jiri Kosinacc503c12008-01-30 13:31:07 +0100500
Paul Burton774c1052014-09-11 08:30:16 +0100501#ifndef CONFIG_ARCH_BINFMT_ELF_STATE
502
503/**
504 * struct arch_elf_state - arch-specific ELF loading state
505 *
506 * This structure is used to preserve architecture specific data during
507 * the loading of an ELF file, throughout the checking of architecture
508 * specific ELF headers & through to the point where the ELF load is
509 * known to be proceeding (ie. SET_PERSONALITY).
510 *
511 * This implementation is a dummy for architectures which require no
512 * specific state.
513 */
514struct arch_elf_state {
515};
516
517#define INIT_ARCH_ELF_STATE {}
518
519/**
520 * arch_elf_pt_proc() - check a PT_LOPROC..PT_HIPROC ELF program header
521 * @ehdr: The main ELF header
522 * @phdr: The program header to check
523 * @elf: The open ELF file
524 * @is_interp: True if the phdr is from the interpreter of the ELF being
525 * loaded, else false.
526 * @state: Architecture-specific state preserved throughout the process
527 * of loading the ELF.
528 *
529 * Inspects the program header phdr to validate its correctness and/or
530 * suitability for the system. Called once per ELF program header in the
531 * range PT_LOPROC to PT_HIPROC, for both the ELF being loaded and its
532 * interpreter.
533 *
534 * Return: Zero to proceed with the ELF load, non-zero to fail the ELF load
535 * with that return code.
536 */
537static inline int arch_elf_pt_proc(struct elfhdr *ehdr,
538 struct elf_phdr *phdr,
539 struct file *elf, bool is_interp,
540 struct arch_elf_state *state)
541{
542 /* Dummy implementation, always proceed */
543 return 0;
544}
545
546/**
Maciej W. Rozycki54d157142015-10-26 15:47:57 +0000547 * arch_check_elf() - check an ELF executable
Paul Burton774c1052014-09-11 08:30:16 +0100548 * @ehdr: The main ELF header
549 * @has_interp: True if the ELF has an interpreter, else false.
Maciej W. Rozyckieb4bc072015-11-13 00:47:48 +0000550 * @interp_ehdr: The interpreter's ELF header
Paul Burton774c1052014-09-11 08:30:16 +0100551 * @state: Architecture-specific state preserved throughout the process
552 * of loading the ELF.
553 *
554 * Provides a final opportunity for architecture code to reject the loading
555 * of the ELF & cause an exec syscall to return an error. This is called after
556 * all program headers to be checked by arch_elf_pt_proc have been.
557 *
558 * Return: Zero to proceed with the ELF load, non-zero to fail the ELF load
559 * with that return code.
560 */
561static inline int arch_check_elf(struct elfhdr *ehdr, bool has_interp,
Maciej W. Rozyckieb4bc072015-11-13 00:47:48 +0000562 struct elfhdr *interp_ehdr,
Paul Burton774c1052014-09-11 08:30:16 +0100563 struct arch_elf_state *state)
564{
565 /* Dummy implementation, always proceed */
566 return 0;
567}
568
569#endif /* !CONFIG_ARCH_BINFMT_ELF_STATE */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700570
Dave Martinfe0f6762020-03-16 16:50:46 +0000571static inline int make_prot(u32 p_flags, struct arch_elf_state *arch_state,
572 bool has_interp, bool is_interp)
Alexey Dobriyand8e7cb32019-05-14 15:43:51 -0700573{
574 int prot = 0;
575
576 if (p_flags & PF_R)
577 prot |= PROT_READ;
578 if (p_flags & PF_W)
579 prot |= PROT_WRITE;
580 if (p_flags & PF_X)
581 prot |= PROT_EXEC;
Dave Martinfe0f6762020-03-16 16:50:46 +0000582
583 return arch_elf_adjust_prot(prot, arch_state, has_interp, is_interp);
Alexey Dobriyand8e7cb32019-05-14 15:43:51 -0700584}
585
Linus Torvalds1da177e2005-04-16 15:20:36 -0700586/* This is much more generalized than the library routine read function,
587 so we keep this separate. Technically the library read function
588 is only provided so that we can read a.out libraries that have
589 an ELF header */
590
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700591static unsigned long load_elf_interp(struct elfhdr *interp_elf_ex,
Alexey Dobriyan81696d52019-12-04 16:52:22 -0800592 struct file *interpreter,
Dave Martinfe0f6762020-03-16 16:50:46 +0000593 unsigned long no_base, struct elf_phdr *interp_elf_phdata,
594 struct arch_elf_state *arch_state)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700596 struct elf_phdr *eppnt;
597 unsigned long load_addr = 0;
598 int load_addr_set = 0;
599 unsigned long last_bss = 0, elf_bss = 0;
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800600 int bss_prot = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700601 unsigned long error = ~0UL;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100602 unsigned long total_size;
Paul Burton6a8d3892014-09-11 08:30:14 +0100603 int i;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700604
605 /* First of all, some simple consistency checks */
606 if (interp_elf_ex->e_type != ET_EXEC &&
607 interp_elf_ex->e_type != ET_DYN)
608 goto out;
Nicolas Pitre47552002017-08-16 16:05:13 -0400609 if (!elf_check_arch(interp_elf_ex) ||
610 elf_check_fdpic(interp_elf_ex))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700611 goto out;
Al Viro72c2d532013-09-22 16:27:52 -0400612 if (!interpreter->f_op->mmap)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700613 goto out;
614
Paul Burtona9d9ef12014-09-11 08:30:15 +0100615 total_size = total_mapping_size(interp_elf_phdata,
616 interp_elf_ex->e_phnum);
Jiri Kosinacc503c12008-01-30 13:31:07 +0100617 if (!total_size) {
618 error = -EINVAL;
Paul Burtona9d9ef12014-09-11 08:30:15 +0100619 goto out;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100620 }
621
Paul Burtona9d9ef12014-09-11 08:30:15 +0100622 eppnt = interp_elf_phdata;
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700623 for (i = 0; i < interp_elf_ex->e_phnum; i++, eppnt++) {
624 if (eppnt->p_type == PT_LOAD) {
David Hildenbrand4589ff72021-04-23 09:42:41 +0200625 int elf_type = MAP_PRIVATE;
Dave Martinfe0f6762020-03-16 16:50:46 +0000626 int elf_prot = make_prot(eppnt->p_flags, arch_state,
627 true, true);
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700628 unsigned long vaddr = 0;
629 unsigned long k, map_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700630
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700631 vaddr = eppnt->p_vaddr;
632 if (interp_elf_ex->e_type == ET_EXEC || load_addr_set)
Chen Jingwen9b2f72c2021-09-28 20:56:57 +0800633 elf_type |= MAP_FIXED;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100634 else if (no_base && interp_elf_ex->e_type == ET_DYN)
635 load_addr = -vaddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700636
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700637 map_addr = elf_map(interpreter, load_addr + vaddr,
Andrew Mortonbb1ad822008-01-30 13:31:07 +0100638 eppnt, elf_prot, elf_type, total_size);
Jiri Kosinacc503c12008-01-30 13:31:07 +0100639 total_size = 0;
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700640 error = map_addr;
641 if (BAD_ADDR(map_addr))
Paul Burtona9d9ef12014-09-11 08:30:15 +0100642 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700643
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700644 if (!load_addr_set &&
645 interp_elf_ex->e_type == ET_DYN) {
646 load_addr = map_addr - ELF_PAGESTART(vaddr);
647 load_addr_set = 1;
648 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700649
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700650 /*
651 * Check to see if the section's size will overflow the
652 * allowed task size. Note that p_filesz must always be
653 * <= p_memsize so it's only necessary to check p_memsz.
654 */
655 k = load_addr + eppnt->p_vaddr;
Chuck Ebbertce510592006-07-03 00:24:14 -0700656 if (BAD_ADDR(k) ||
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700657 eppnt->p_filesz > eppnt->p_memsz ||
658 eppnt->p_memsz > TASK_SIZE ||
659 TASK_SIZE - eppnt->p_memsz < k) {
660 error = -ENOMEM;
Paul Burtona9d9ef12014-09-11 08:30:15 +0100661 goto out;
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700662 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700663
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700664 /*
665 * Find the end of the file mapping for this phdr, and
666 * keep track of the largest address we see for this.
667 */
668 k = load_addr + eppnt->p_vaddr + eppnt->p_filesz;
669 if (k > elf_bss)
670 elf_bss = k;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700671
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700672 /*
673 * Do the same thing for the memory mapping - between
674 * elf_bss and last_bss is the bss section.
675 */
Kees Cook0036d1f2016-08-02 14:04:51 -0700676 k = load_addr + eppnt->p_vaddr + eppnt->p_memsz;
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800677 if (k > last_bss) {
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700678 last_bss = k;
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800679 bss_prot = elf_prot;
680 }
Jesper Juhlf4e5cc22006-06-23 02:05:35 -0700681 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700682 }
683
Kees Cook0036d1f2016-08-02 14:04:51 -0700684 /*
685 * Now fill out the bss section: first pad the last page from
686 * the file up to the page boundary, and zero it from elf_bss
687 * up to the end of the page.
688 */
689 if (padzero(elf_bss)) {
690 error = -EFAULT;
691 goto out;
692 }
693 /*
694 * Next, align both the file and mem bss up to the page size,
695 * since this is where elf_bss was just zeroed up to, and where
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800696 * last_bss will end after the vm_brk_flags() below.
Kees Cook0036d1f2016-08-02 14:04:51 -0700697 */
698 elf_bss = ELF_PAGEALIGN(elf_bss);
699 last_bss = ELF_PAGEALIGN(last_bss);
700 /* Finally, if there is still more bss to allocate, do it. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700701 if (last_bss > elf_bss) {
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800702 error = vm_brk_flags(elf_bss, last_bss - elf_bss,
703 bss_prot & PROT_EXEC ? VM_EXEC : 0);
Linus Torvalds5d22fc22016-05-27 15:57:31 -0700704 if (error)
Paul Burtona9d9ef12014-09-11 08:30:15 +0100705 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700706 }
707
Jiri Kosinacc503c12008-01-30 13:31:07 +0100708 error = load_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700709out:
710 return error;
711}
712
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713/*
714 * These are the functions used to load ELF style executables and shared
715 * libraries. There is no binary dependent code anywhere else.
716 */
717
Dave Martin00e19ce2020-03-16 16:50:44 +0000718static int parse_elf_property(const char *data, size_t *off, size_t datasz,
719 struct arch_elf_state *arch,
720 bool have_prev_type, u32 *prev_type)
721{
722 size_t o, step;
723 const struct gnu_property *pr;
724 int ret;
725
726 if (*off == datasz)
727 return -ENOENT;
728
729 if (WARN_ON_ONCE(*off > datasz || *off % ELF_GNU_PROPERTY_ALIGN))
730 return -EIO;
731 o = *off;
732 datasz -= *off;
733
734 if (datasz < sizeof(*pr))
735 return -ENOEXEC;
736 pr = (const struct gnu_property *)(data + o);
737 o += sizeof(*pr);
738 datasz -= sizeof(*pr);
739
740 if (pr->pr_datasz > datasz)
741 return -ENOEXEC;
742
743 WARN_ON_ONCE(o % ELF_GNU_PROPERTY_ALIGN);
744 step = round_up(pr->pr_datasz, ELF_GNU_PROPERTY_ALIGN);
745 if (step > datasz)
746 return -ENOEXEC;
747
748 /* Properties are supposed to be unique and sorted on pr_type: */
749 if (have_prev_type && pr->pr_type <= *prev_type)
750 return -ENOEXEC;
751 *prev_type = pr->pr_type;
752
753 ret = arch_parse_elf_property(pr->pr_type, data + o,
754 pr->pr_datasz, ELF_COMPAT, arch);
755 if (ret)
756 return ret;
757
758 *off = o + step;
759 return 0;
760}
761
762#define NOTE_DATA_SZ SZ_1K
763#define GNU_PROPERTY_TYPE_0_NAME "GNU"
764#define NOTE_NAME_SZ (sizeof(GNU_PROPERTY_TYPE_0_NAME))
765
766static int parse_elf_properties(struct file *f, const struct elf_phdr *phdr,
767 struct arch_elf_state *arch)
768{
769 union {
770 struct elf_note nhdr;
771 char data[NOTE_DATA_SZ];
772 } note;
773 loff_t pos;
774 ssize_t n;
775 size_t off, datasz;
776 int ret;
777 bool have_prev_type;
778 u32 prev_type;
779
780 if (!IS_ENABLED(CONFIG_ARCH_USE_GNU_PROPERTY) || !phdr)
781 return 0;
782
783 /* load_elf_binary() shouldn't call us unless this is true... */
784 if (WARN_ON_ONCE(phdr->p_type != PT_GNU_PROPERTY))
785 return -ENOEXEC;
786
787 /* If the properties are crazy large, that's too bad (for now): */
788 if (phdr->p_filesz > sizeof(note))
789 return -ENOEXEC;
790
791 pos = phdr->p_offset;
792 n = kernel_read(f, &note, phdr->p_filesz, &pos);
793
794 BUILD_BUG_ON(sizeof(note) < sizeof(note.nhdr) + NOTE_NAME_SZ);
795 if (n < 0 || n < sizeof(note.nhdr) + NOTE_NAME_SZ)
796 return -EIO;
797
798 if (note.nhdr.n_type != NT_GNU_PROPERTY_TYPE_0 ||
799 note.nhdr.n_namesz != NOTE_NAME_SZ ||
800 strncmp(note.data + sizeof(note.nhdr),
801 GNU_PROPERTY_TYPE_0_NAME, n - sizeof(note.nhdr)))
802 return -ENOEXEC;
803
804 off = round_up(sizeof(note.nhdr) + NOTE_NAME_SZ,
805 ELF_GNU_PROPERTY_ALIGN);
806 if (off > n)
807 return -ENOEXEC;
808
809 if (note.nhdr.n_descsz > n - off)
810 return -ENOEXEC;
811 datasz = off + note.nhdr.n_descsz;
812
813 have_prev_type = false;
814 do {
815 ret = parse_elf_property(note.data, &off, datasz, arch,
816 have_prev_type, &prev_type);
817 have_prev_type = true;
818 } while (!ret);
819
820 return ret == -ENOENT ? 0 : ret;
821}
822
Al Viro71613c32012-10-20 22:00:48 -0400823static int load_elf_binary(struct linux_binprm *bprm)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700824{
825 struct file *interpreter = NULL; /* to shut gcc up */
826 unsigned long load_addr = 0, load_bias = 0;
827 int load_addr_set = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700828 unsigned long error;
Paul Burtona9d9ef12014-09-11 08:30:15 +0100829 struct elf_phdr *elf_ppnt, *elf_phdata, *interp_elf_phdata = NULL;
Dave Martin00e19ce2020-03-16 16:50:44 +0000830 struct elf_phdr *elf_property_phdata = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700831 unsigned long elf_bss, elf_brk;
Denys Vlasenko16e72e92017-02-22 15:45:16 -0800832 int bss_prot = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700833 int retval, i;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100834 unsigned long elf_entry;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800835 unsigned long e_entry;
Jiri Kosinacc503c12008-01-30 13:31:07 +0100836 unsigned long interp_load_addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700837 unsigned long start_code, end_code, start_data, end_data;
David Daney1a530a62011-03-22 16:34:48 -0700838 unsigned long reloc_func_desc __maybe_unused = 0;
David Rientjes8de61e62006-12-06 20:40:16 -0800839 int executable_stack = EXSTACK_DEFAULT;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800840 struct elfhdr *elf_ex = (struct elfhdr *)bprm->buf;
Alexey Dobriyan0693ffe2020-04-06 20:11:29 -0700841 struct elfhdr *interp_elf_ex = NULL;
Paul Burton774c1052014-09-11 08:30:16 +0100842 struct arch_elf_state arch_state = INIT_ARCH_ELF_STATE;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -0800843 struct mm_struct *mm;
Alexey Dobriyan249b08e2019-05-14 15:43:54 -0700844 struct pt_regs *regs;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700845
Linus Torvalds1da177e2005-04-16 15:20:36 -0700846 retval = -ENOEXEC;
847 /* First of all, some simple consistency checks */
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800848 if (memcmp(elf_ex->e_ident, ELFMAG, SELFMAG) != 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700849 goto out;
850
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800851 if (elf_ex->e_type != ET_EXEC && elf_ex->e_type != ET_DYN)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700852 goto out;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800853 if (!elf_check_arch(elf_ex))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700854 goto out;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800855 if (elf_check_fdpic(elf_ex))
Nicolas Pitre47552002017-08-16 16:05:13 -0400856 goto out;
Al Viro72c2d532013-09-22 16:27:52 -0400857 if (!bprm->file->f_op->mmap)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700858 goto out;
859
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800860 elf_phdata = load_elf_phdrs(elf_ex, bprm->file);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700861 if (!elf_phdata)
862 goto out;
863
Linus Torvalds1da177e2005-04-16 15:20:36 -0700864 elf_ppnt = elf_phdata;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800865 for (i = 0; i < elf_ex->e_phnum; i++, elf_ppnt++) {
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700866 char *elf_interpreter;
Alexey Dobriyan5cf4a362019-05-14 15:43:36 -0700867
Dave Martin00e19ce2020-03-16 16:50:44 +0000868 if (elf_ppnt->p_type == PT_GNU_PROPERTY) {
869 elf_property_phdata = elf_ppnt;
870 continue;
871 }
872
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700873 if (elf_ppnt->p_type != PT_INTERP)
874 continue;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700875
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700876 /*
877 * This is the program interpreter used for shared libraries -
878 * for now assume that this is an a.out format binary.
879 */
880 retval = -ENOEXEC;
881 if (elf_ppnt->p_filesz > PATH_MAX || elf_ppnt->p_filesz < 2)
882 goto out_free_ph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700883
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700884 retval = -ENOMEM;
885 elf_interpreter = kmalloc(elf_ppnt->p_filesz, GFP_KERNEL);
886 if (!elf_interpreter)
887 goto out_free_ph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700888
Alexey Dobriyan658c0332019-12-04 16:52:25 -0800889 retval = elf_read(bprm->file, elf_interpreter, elf_ppnt->p_filesz,
890 elf_ppnt->p_offset);
891 if (retval < 0)
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700892 goto out_free_interp;
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700893 /* make sure path is NULL terminated */
894 retval = -ENOEXEC;
895 if (elf_interpreter[elf_ppnt->p_filesz - 1] != '\0')
896 goto out_free_interp;
Alexey Dobriyan1fb84492007-01-26 00:57:16 -0800897
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700898 interpreter = open_exec(elf_interpreter);
899 kfree(elf_interpreter);
900 retval = PTR_ERR(interpreter);
901 if (IS_ERR(interpreter))
902 goto out_free_ph;
Alexey Dobriyan1fb84492007-01-26 00:57:16 -0800903
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700904 /*
905 * If the binary is not readable then enforce mm->dumpable = 0
906 * regardless of the interpreter's permissions.
907 */
908 would_dump(bprm, interpreter);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700909
Alexey Dobriyan0693ffe2020-04-06 20:11:29 -0700910 interp_elf_ex = kmalloc(sizeof(*interp_elf_ex), GFP_KERNEL);
911 if (!interp_elf_ex) {
912 retval = -ENOMEM;
913 goto out_free_ph;
914 }
915
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700916 /* Get the exec headers */
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700917 retval = elf_read(interpreter, interp_elf_ex,
918 sizeof(*interp_elf_ex), 0);
Alexey Dobriyan658c0332019-12-04 16:52:25 -0800919 if (retval < 0)
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700920 goto out_free_dentry;
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700921
922 break;
Alexey Dobriyancc338012019-05-14 15:43:39 -0700923
924out_free_interp:
Alexey Dobriyanbe0deb52019-05-14 15:43:45 -0700925 kfree(elf_interpreter);
926 goto out_free_ph;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700927 }
928
929 elf_ppnt = elf_phdata;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800930 for (i = 0; i < elf_ex->e_phnum; i++, elf_ppnt++)
Paul Burton774c1052014-09-11 08:30:16 +0100931 switch (elf_ppnt->p_type) {
932 case PT_GNU_STACK:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700933 if (elf_ppnt->p_flags & PF_X)
934 executable_stack = EXSTACK_ENABLE_X;
935 else
936 executable_stack = EXSTACK_DISABLE_X;
937 break;
Paul Burton774c1052014-09-11 08:30:16 +0100938
939 case PT_LOPROC ... PT_HIPROC:
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800940 retval = arch_elf_pt_proc(elf_ex, elf_ppnt,
Paul Burton774c1052014-09-11 08:30:16 +0100941 bprm->file, false,
942 &arch_state);
943 if (retval)
944 goto out_free_dentry;
945 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700946 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700947
948 /* Some simple consistency checks for the interpreter */
Alexey Dobriyancc338012019-05-14 15:43:39 -0700949 if (interpreter) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700950 retval = -ELIBBAD;
Andi Kleend20894a2008-02-08 04:21:54 -0800951 /* Not an ELF interpreter */
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700952 if (memcmp(interp_elf_ex->e_ident, ELFMAG, SELFMAG) != 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700953 goto out_free_dentry;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700954 /* Verify the interpreter has a valid arch */
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700955 if (!elf_check_arch(interp_elf_ex) ||
956 elf_check_fdpic(interp_elf_ex))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700957 goto out_free_dentry;
Paul Burtona9d9ef12014-09-11 08:30:15 +0100958
959 /* Load the interpreter program headers */
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700960 interp_elf_phdata = load_elf_phdrs(interp_elf_ex,
Paul Burtona9d9ef12014-09-11 08:30:15 +0100961 interpreter);
962 if (!interp_elf_phdata)
963 goto out_free_dentry;
Paul Burton774c1052014-09-11 08:30:16 +0100964
965 /* Pass PT_LOPROC..PT_HIPROC headers to arch code */
Dave Martin00e19ce2020-03-16 16:50:44 +0000966 elf_property_phdata = NULL;
Paul Burton774c1052014-09-11 08:30:16 +0100967 elf_ppnt = interp_elf_phdata;
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700968 for (i = 0; i < interp_elf_ex->e_phnum; i++, elf_ppnt++)
Paul Burton774c1052014-09-11 08:30:16 +0100969 switch (elf_ppnt->p_type) {
Dave Martin00e19ce2020-03-16 16:50:44 +0000970 case PT_GNU_PROPERTY:
971 elf_property_phdata = elf_ppnt;
972 break;
973
Paul Burton774c1052014-09-11 08:30:16 +0100974 case PT_LOPROC ... PT_HIPROC:
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700975 retval = arch_elf_pt_proc(interp_elf_ex,
Paul Burton774c1052014-09-11 08:30:16 +0100976 elf_ppnt, interpreter,
977 true, &arch_state);
978 if (retval)
979 goto out_free_dentry;
980 break;
981 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700982 }
983
Dave Martin00e19ce2020-03-16 16:50:44 +0000984 retval = parse_elf_properties(interpreter ?: bprm->file,
985 elf_property_phdata, &arch_state);
986 if (retval)
987 goto out_free_dentry;
988
Paul Burton774c1052014-09-11 08:30:16 +0100989 /*
990 * Allow arch code to reject the ELF at this point, whilst it's
991 * still possible to return an error to the code that invoked
992 * the exec syscall.
993 */
Alexey Dobriyana62c5b12020-01-30 22:16:55 -0800994 retval = arch_check_elf(elf_ex,
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -0700995 !!interpreter, interp_elf_ex,
Maciej W. Rozyckieb4bc072015-11-13 00:47:48 +0000996 &arch_state);
Paul Burton774c1052014-09-11 08:30:16 +0100997 if (retval)
998 goto out_free_dentry;
999
Linus Torvalds1da177e2005-04-16 15:20:36 -07001000 /* Flush all traces of the currently running executable */
Eric W. Biederman23887772020-05-03 07:54:10 -05001001 retval = begin_new_exec(bprm);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001002 if (retval)
1003 goto out_free_dentry;
1004
Linus Torvalds1da177e2005-04-16 15:20:36 -07001005 /* Do this immediately, since STACK_TOP as used in setup_arg_pages
1006 may depend on the personality. */
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001007 SET_PERSONALITY2(*elf_ex, &arch_state);
1008 if (elf_read_implies_exec(*elf_ex, executable_stack))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001009 current->personality |= READ_IMPLIES_EXEC;
1010
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001011 if (!(current->personality & ADDR_NO_RANDOMIZE) && randomize_va_space)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001012 current->flags |= PF_RANDOMIZE;
Linus Torvalds221af7f2010-01-28 22:14:42 -08001013
1014 setup_new_exec(bprm);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001015
1016 /* Do this so that we can load the interpreter, if need be. We will
1017 change some of these later */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001018 retval = setup_arg_pages(bprm, randomize_stack_top(STACK_TOP),
1019 executable_stack);
Al Viro19d860a2014-05-04 20:11:36 -04001020 if (retval < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001021 goto out_free_dentry;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001022
Alexey Dobriyan852643162019-05-14 15:43:48 -07001023 elf_bss = 0;
1024 elf_brk = 0;
1025
1026 start_code = ~0UL;
1027 end_code = 0;
1028 start_data = 0;
1029 end_data = 0;
1030
André Goddard Rosaaf901ca2009-11-14 13:09:05 -02001031 /* Now we do a little grungy work by mmapping the ELF image into
Jiri Kosinacc503c12008-01-30 13:31:07 +01001032 the correct location in memory. */
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001033 for(i = 0, elf_ppnt = elf_phdata;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001034 i < elf_ex->e_phnum; i++, elf_ppnt++) {
Linus Torvaldsb2129212019-10-06 13:53:27 -07001035 int elf_prot, elf_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001036 unsigned long k, vaddr;
Michael Davidsona87938b2015-04-14 15:47:38 -07001037 unsigned long total_size = 0;
Chris Kennellyce81bb22020-10-15 20:12:32 -07001038 unsigned long alignment;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001039
1040 if (elf_ppnt->p_type != PT_LOAD)
1041 continue;
1042
1043 if (unlikely (elf_brk > elf_bss)) {
1044 unsigned long nbyte;
1045
1046 /* There was a PT_LOAD segment with p_memsz > p_filesz
1047 before this one. Map anonymous pages, if needed,
1048 and clear the area. */
Mikael Petterssonf670d0e2011-01-12 17:00:02 -08001049 retval = set_brk(elf_bss + load_bias,
Denys Vlasenko16e72e92017-02-22 15:45:16 -08001050 elf_brk + load_bias,
1051 bss_prot);
Al Viro19d860a2014-05-04 20:11:36 -04001052 if (retval)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001053 goto out_free_dentry;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001054 nbyte = ELF_PAGEOFFSET(elf_bss);
1055 if (nbyte) {
1056 nbyte = ELF_MIN_ALIGN - nbyte;
1057 if (nbyte > elf_brk - elf_bss)
1058 nbyte = elf_brk - elf_bss;
1059 if (clear_user((void __user *)elf_bss +
1060 load_bias, nbyte)) {
1061 /*
1062 * This bss-zeroing can fail if the ELF
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001063 * file specifies odd protections. So
Linus Torvalds1da177e2005-04-16 15:20:36 -07001064 * we don't check the return value
1065 */
1066 }
1067 }
1068 }
1069
Dave Martinfe0f6762020-03-16 16:50:46 +00001070 elf_prot = make_prot(elf_ppnt->p_flags, &arch_state,
1071 !!interpreter, false);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001072
David Hildenbrand4589ff72021-04-23 09:42:41 +02001073 elf_flags = MAP_PRIVATE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001074
1075 vaddr = elf_ppnt->p_vaddr;
Kees Cookeab09532017-07-10 15:52:37 -07001076 /*
Kees Cook5f501d52021-11-08 18:33:37 -08001077 * The first time through the loop, load_addr_set is false:
1078 * layout will be calculated. Once set, use MAP_FIXED since
1079 * we know we've already safely mapped the entire region with
1080 * MAP_FIXED_NOREPLACE in the once-per-binary logic following.
Kees Cookeab09532017-07-10 15:52:37 -07001081 */
Kees Cook5f501d52021-11-08 18:33:37 -08001082 if (load_addr_set) {
Linus Torvaldsb2129212019-10-06 13:53:27 -07001083 elf_flags |= MAP_FIXED;
Kees Cook5f501d52021-11-08 18:33:37 -08001084 } else if (elf_ex->e_type == ET_EXEC) {
1085 /*
1086 * This logic is run once for the first LOAD Program
1087 * Header for ET_EXEC binaries. No special handling
1088 * is needed.
1089 */
1090 elf_flags |= MAP_FIXED_NOREPLACE;
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001091 } else if (elf_ex->e_type == ET_DYN) {
Kees Cookeab09532017-07-10 15:52:37 -07001092 /*
1093 * This logic is run once for the first LOAD Program
1094 * Header for ET_DYN binaries to calculate the
1095 * randomization (load_bias) for all the LOAD
Kees Cook5f501d52021-11-08 18:33:37 -08001096 * Program Headers.
Kees Cookeab09532017-07-10 15:52:37 -07001097 *
1098 * There are effectively two types of ET_DYN
1099 * binaries: programs (i.e. PIE: ET_DYN with INTERP)
1100 * and loaders (ET_DYN without INTERP, since they
1101 * _are_ the ELF interpreter). The loaders must
1102 * be loaded away from programs since the program
1103 * may otherwise collide with the loader (especially
1104 * for ET_EXEC which does not have a randomized
1105 * position). For example to handle invocations of
1106 * "./ld.so someprog" to test out a new version of
1107 * the loader, the subsequent program that the
1108 * loader loads must avoid the loader itself, so
1109 * they cannot share the same load range. Sufficient
1110 * room for the brk must be allocated with the
1111 * loader as well, since brk must be available with
1112 * the loader.
1113 *
1114 * Therefore, programs are loaded offset from
1115 * ELF_ET_DYN_BASE and loaders are loaded into the
1116 * independently randomized mmap region (0 load_bias
Kees Cook5f501d52021-11-08 18:33:37 -08001117 * without MAP_FIXED nor MAP_FIXED_NOREPLACE).
Kees Cookeab09532017-07-10 15:52:37 -07001118 */
Alexey Dobriyancc338012019-05-14 15:43:39 -07001119 if (interpreter) {
Kees Cookeab09532017-07-10 15:52:37 -07001120 load_bias = ELF_ET_DYN_BASE;
1121 if (current->flags & PF_RANDOMIZE)
1122 load_bias += arch_mmap_rnd();
Chris Kennellyce81bb22020-10-15 20:12:32 -07001123 alignment = maximum_alignment(elf_phdata, elf_ex->e_phnum);
1124 if (alignment)
1125 load_bias &= ~(alignment - 1);
Kees Cook5f501d52021-11-08 18:33:37 -08001126 elf_flags |= MAP_FIXED_NOREPLACE;
Kees Cookeab09532017-07-10 15:52:37 -07001127 } else
1128 load_bias = 0;
1129
1130 /*
1131 * Since load_bias is used for all subsequent loading
1132 * calculations, we must lower it by the first vaddr
1133 * so that the remaining calculations based on the
1134 * ELF vaddrs will be correctly offset. The result
1135 * is then page aligned.
1136 */
1137 load_bias = ELF_PAGESTART(load_bias - vaddr);
Kees Cook5f501d52021-11-08 18:33:37 -08001138 }
Kees Cookeab09532017-07-10 15:52:37 -07001139
Kees Cook5f501d52021-11-08 18:33:37 -08001140 /*
1141 * Calculate the entire size of the ELF mapping (total_size).
1142 * (Note that load_addr_set is set to true later once the
1143 * initial mapping is performed.)
1144 */
1145 if (!load_addr_set) {
Michael Davidsona87938b2015-04-14 15:47:38 -07001146 total_size = total_mapping_size(elf_phdata,
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001147 elf_ex->e_phnum);
Michael Davidsona87938b2015-04-14 15:47:38 -07001148 if (!total_size) {
Andrew Morton2b1d3ae2015-05-28 15:44:24 -07001149 retval = -EINVAL;
Michael Davidsona87938b2015-04-14 15:47:38 -07001150 goto out_free_dentry;
1151 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001152 }
1153
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001154 error = elf_map(bprm->file, load_bias + vaddr, elf_ppnt,
Michael Davidsona87938b2015-04-14 15:47:38 -07001155 elf_prot, elf_flags, total_size);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001156 if (BAD_ADDR(error)) {
Alexey Kuznetsovb140f2512007-05-08 00:31:57 -07001157 retval = IS_ERR((void *)error) ?
1158 PTR_ERR((void*)error) : -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001159 goto out_free_dentry;
1160 }
1161
1162 if (!load_addr_set) {
1163 load_addr_set = 1;
1164 load_addr = (elf_ppnt->p_vaddr - elf_ppnt->p_offset);
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001165 if (elf_ex->e_type == ET_DYN) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001166 load_bias += error -
1167 ELF_PAGESTART(load_bias + vaddr);
1168 load_addr += load_bias;
1169 reloc_func_desc = load_bias;
1170 }
1171 }
1172 k = elf_ppnt->p_vaddr;
Alexey Dobriyanf67ef442020-01-30 22:16:52 -08001173 if ((elf_ppnt->p_flags & PF_X) && k < start_code)
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001174 start_code = k;
1175 if (start_data < k)
1176 start_data = k;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001177
1178 /*
1179 * Check to see if the section's size will overflow the
1180 * allowed task size. Note that p_filesz must always be
1181 * <= p_memsz so it is only necessary to check p_memsz.
1182 */
Chuck Ebbertce510592006-07-03 00:24:14 -07001183 if (BAD_ADDR(k) || elf_ppnt->p_filesz > elf_ppnt->p_memsz ||
Linus Torvalds1da177e2005-04-16 15:20:36 -07001184 elf_ppnt->p_memsz > TASK_SIZE ||
1185 TASK_SIZE - elf_ppnt->p_memsz < k) {
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001186 /* set_brk can never work. Avoid overflows. */
Alexey Kuznetsovb140f2512007-05-08 00:31:57 -07001187 retval = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001188 goto out_free_dentry;
1189 }
1190
1191 k = elf_ppnt->p_vaddr + elf_ppnt->p_filesz;
1192
1193 if (k > elf_bss)
1194 elf_bss = k;
1195 if ((elf_ppnt->p_flags & PF_X) && end_code < k)
1196 end_code = k;
1197 if (end_data < k)
1198 end_data = k;
1199 k = elf_ppnt->p_vaddr + elf_ppnt->p_memsz;
Denys Vlasenko16e72e92017-02-22 15:45:16 -08001200 if (k > elf_brk) {
1201 bss_prot = elf_prot;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001202 elf_brk = k;
Denys Vlasenko16e72e92017-02-22 15:45:16 -08001203 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001204 }
1205
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001206 e_entry = elf_ex->e_entry + load_bias;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001207 elf_bss += load_bias;
1208 elf_brk += load_bias;
1209 start_code += load_bias;
1210 end_code += load_bias;
1211 start_data += load_bias;
1212 end_data += load_bias;
1213
1214 /* Calling set_brk effectively mmaps the pages that we need
1215 * for the bss and break sections. We must do this before
1216 * mapping in the interpreter, to make sure it doesn't wind
1217 * up getting placed where the bss needs to go.
1218 */
Denys Vlasenko16e72e92017-02-22 15:45:16 -08001219 retval = set_brk(elf_bss, elf_brk, bss_prot);
Al Viro19d860a2014-05-04 20:11:36 -04001220 if (retval)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001221 goto out_free_dentry;
akpm@osdl.org6de50512005-10-11 08:29:08 -07001222 if (likely(elf_bss != elf_brk) && unlikely(padzero(elf_bss))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001223 retval = -EFAULT; /* Nobody gets to see this, but.. */
1224 goto out_free_dentry;
1225 }
1226
Alexey Dobriyancc338012019-05-14 15:43:39 -07001227 if (interpreter) {
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -07001228 elf_entry = load_elf_interp(interp_elf_ex,
Andi Kleend20894a2008-02-08 04:21:54 -08001229 interpreter,
Dave Martinfe0f6762020-03-16 16:50:46 +00001230 load_bias, interp_elf_phdata,
1231 &arch_state);
Andi Kleend20894a2008-02-08 04:21:54 -08001232 if (!IS_ERR((void *)elf_entry)) {
1233 /*
1234 * load_elf_interp() returns relocation
1235 * adjustment
1236 */
1237 interp_load_addr = elf_entry;
Alexey Dobriyanc69bcc92020-04-06 20:11:26 -07001238 elf_entry += interp_elf_ex->e_entry;
Jiri Kosinacc503c12008-01-30 13:31:07 +01001239 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001240 if (BAD_ADDR(elf_entry)) {
Chuck Ebbertce510592006-07-03 00:24:14 -07001241 retval = IS_ERR((void *)elf_entry) ?
1242 (int)elf_entry : -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001243 goto out_free_dentry;
1244 }
1245 reloc_func_desc = interp_load_addr;
1246
1247 allow_write_access(interpreter);
1248 fput(interpreter);
Alexey Dobriyan0693ffe2020-04-06 20:11:29 -07001249
1250 kfree(interp_elf_ex);
Alexey Dobriyanaa0d1562020-04-06 20:11:32 -07001251 kfree(interp_elf_phdata);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001252 } else {
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001253 elf_entry = e_entry;
Suresh Siddha5342fba2006-02-26 04:18:28 +01001254 if (BAD_ADDR(elf_entry)) {
Chuck Ebbertce510592006-07-03 00:24:14 -07001255 retval = -EINVAL;
Suresh Siddha5342fba2006-02-26 04:18:28 +01001256 goto out_free_dentry;
1257 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001258 }
1259
1260 kfree(elf_phdata);
1261
Linus Torvalds1da177e2005-04-16 15:20:36 -07001262 set_binfmt(&elf_format);
1263
Benjamin Herrenschmidt547ee842005-04-16 15:24:35 -07001264#ifdef ARCH_HAS_SETUP_ADDITIONAL_PAGES
Gabriel Krisman Bertazi9a29a672020-10-03 23:25:33 -04001265 retval = ARCH_SETUP_ADDITIONAL_PAGES(bprm, elf_ex, !!interpreter);
Al Viro19d860a2014-05-04 20:11:36 -04001266 if (retval < 0)
Roland McGrath18c8baff2005-04-28 15:17:19 -07001267 goto out;
Benjamin Herrenschmidt547ee842005-04-16 15:24:35 -07001268#endif /* ARCH_HAS_SETUP_ADDITIONAL_PAGES */
1269
Alexey Dobriyana62c5b12020-01-30 22:16:55 -08001270 retval = create_elf_tables(bprm, elf_ex,
1271 load_addr, interp_load_addr, e_entry);
Al Viro19d860a2014-05-04 20:11:36 -04001272 if (retval < 0)
Ollie Wildb6a2fea2007-07-19 01:48:16 -07001273 goto out;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001274
1275 mm = current->mm;
1276 mm->end_code = end_code;
1277 mm->start_code = start_code;
1278 mm->start_data = start_data;
1279 mm->end_data = end_data;
1280 mm->start_stack = bprm->p;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001281
Jiri Kosina4471a672011-04-14 15:22:09 -07001282 if ((current->flags & PF_RANDOMIZE) && (randomize_va_space > 1)) {
Kees Cookbbdc6072019-05-14 15:43:57 -07001283 /*
1284 * For architectures with ELF randomization, when executing
1285 * a loader directly (i.e. no interpreter listed in ELF
1286 * headers), move the brk area out of the mmap region
1287 * (since it grows up, and may collide early with the stack
1288 * growing down), and into the unused ELF_ET_DYN_BASE region.
1289 */
Kees Cook7be3cb02019-09-26 10:15:25 -07001290 if (IS_ENABLED(CONFIG_ARCH_HAS_ELF_RANDOMIZE) &&
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001291 elf_ex->e_type == ET_DYN && !interpreter) {
1292 mm->brk = mm->start_brk = ELF_ET_DYN_BASE;
1293 }
Kees Cookbbdc6072019-05-14 15:43:57 -07001294
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001295 mm->brk = mm->start_brk = arch_randomize_brk(mm);
Kees Cook204db6e2015-04-14 15:48:12 -07001296#ifdef compat_brk_randomized
Jiri Kosina4471a672011-04-14 15:22:09 -07001297 current->brk_randomized = 1;
1298#endif
1299 }
Jiri Kosinac1d171a2008-01-30 13:30:40 +01001300
Linus Torvalds1da177e2005-04-16 15:20:36 -07001301 if (current->personality & MMAP_PAGE_ZERO) {
1302 /* Why this, you ask??? Well SVr4 maps page 0 as read-only,
1303 and some applications "depend" upon this behavior.
1304 Since we do not have the power to recompile these, we
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001305 emulate the SVr4 behavior. Sigh. */
Linus Torvalds6be5ceb2012-04-20 17:13:58 -07001306 error = vm_mmap(NULL, 0, PAGE_SIZE, PROT_READ | PROT_EXEC,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001307 MAP_FIXED | MAP_PRIVATE, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001308 }
1309
Alexey Dobriyan249b08e2019-05-14 15:43:54 -07001310 regs = current_pt_regs();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001311#ifdef ELF_PLAT_INIT
1312 /*
1313 * The ABI may specify that certain registers be set up in special
1314 * ways (on i386 %edx is the address of a DT_FINI function, for
1315 * example. In addition, it may also specify (eg, PowerPC64 ELF)
1316 * that the e_entry field is the address of the function descriptor
1317 * for the startup routine, rather than the address of the startup
1318 * routine itself. This macro performs whatever initialization to
1319 * the regs structure is required as well as any relocations to the
1320 * function descriptor entries when executing dynamically links apps.
1321 */
1322 ELF_PLAT_INIT(regs, reloc_func_desc);
1323#endif
1324
Kees Cookb8383832018-04-10 16:34:57 -07001325 finalize_exec(bprm);
Gabriel Krisman Bertazibc3d7bf2020-10-03 23:25:31 -04001326 START_THREAD(elf_ex, regs, elf_entry, bprm->p);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001327 retval = 0;
1328out:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001329 return retval;
1330
1331 /* error cleanup */
1332out_free_dentry:
Alexey Dobriyan0693ffe2020-04-06 20:11:29 -07001333 kfree(interp_elf_ex);
Paul Burtona9d9ef12014-09-11 08:30:15 +01001334 kfree(interp_elf_phdata);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001335 allow_write_access(interpreter);
1336 if (interpreter)
1337 fput(interpreter);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001338out_free_ph:
1339 kfree(elf_phdata);
1340 goto out;
1341}
1342
Josh Triplett69369a72014-04-03 14:48:27 -07001343#ifdef CONFIG_USELIB
Linus Torvalds1da177e2005-04-16 15:20:36 -07001344/* This is really simpleminded and specialized - we are loading an
1345 a.out library that is given an ELF header. */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001346static int load_elf_library(struct file *file)
1347{
1348 struct elf_phdr *elf_phdata;
1349 struct elf_phdr *eppnt;
1350 unsigned long elf_bss, bss, len;
1351 int retval, error, i, j;
1352 struct elfhdr elf_ex;
1353
1354 error = -ENOEXEC;
Alexey Dobriyan658c0332019-12-04 16:52:25 -08001355 retval = elf_read(file, &elf_ex, sizeof(elf_ex), 0);
1356 if (retval < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001357 goto out;
1358
1359 if (memcmp(elf_ex.e_ident, ELFMAG, SELFMAG) != 0)
1360 goto out;
1361
1362 /* First of all, some simple consistency checks */
1363 if (elf_ex.e_type != ET_EXEC || elf_ex.e_phnum > 2 ||
Al Viro72c2d532013-09-22 16:27:52 -04001364 !elf_check_arch(&elf_ex) || !file->f_op->mmap)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001365 goto out;
Nicolas Pitre47552002017-08-16 16:05:13 -04001366 if (elf_check_fdpic(&elf_ex))
1367 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001368
1369 /* Now read in all of the header information */
1370
1371 j = sizeof(struct elf_phdr) * elf_ex.e_phnum;
1372 /* j < ELF_MIN_ALIGN because elf_ex.e_phnum <= 2 */
1373
1374 error = -ENOMEM;
1375 elf_phdata = kmalloc(j, GFP_KERNEL);
1376 if (!elf_phdata)
1377 goto out;
1378
1379 eppnt = elf_phdata;
1380 error = -ENOEXEC;
Alexey Dobriyan658c0332019-12-04 16:52:25 -08001381 retval = elf_read(file, eppnt, j, elf_ex.e_phoff);
1382 if (retval < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001383 goto out_free_ph;
1384
1385 for (j = 0, i = 0; i<elf_ex.e_phnum; i++)
1386 if ((eppnt + i)->p_type == PT_LOAD)
1387 j++;
1388 if (j != 1)
1389 goto out_free_ph;
1390
1391 while (eppnt->p_type != PT_LOAD)
1392 eppnt++;
1393
1394 /* Now use mmap to map the library into memory. */
Linus Torvalds6be5ceb2012-04-20 17:13:58 -07001395 error = vm_mmap(file,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001396 ELF_PAGESTART(eppnt->p_vaddr),
1397 (eppnt->p_filesz +
1398 ELF_PAGEOFFSET(eppnt->p_vaddr)),
1399 PROT_READ | PROT_WRITE | PROT_EXEC,
David Hildenbrand42be8b42021-04-22 12:53:00 +02001400 MAP_FIXED_NOREPLACE | MAP_PRIVATE,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001401 (eppnt->p_offset -
1402 ELF_PAGEOFFSET(eppnt->p_vaddr)));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001403 if (error != ELF_PAGESTART(eppnt->p_vaddr))
1404 goto out_free_ph;
1405
1406 elf_bss = eppnt->p_vaddr + eppnt->p_filesz;
1407 if (padzero(elf_bss)) {
1408 error = -EFAULT;
1409 goto out_free_ph;
1410 }
1411
Oscar Salvador24962af2018-07-13 16:59:13 -07001412 len = ELF_PAGEALIGN(eppnt->p_filesz + eppnt->p_vaddr);
1413 bss = ELF_PAGEALIGN(eppnt->p_memsz + eppnt->p_vaddr);
Michal Hockoecc2bc82016-05-23 16:25:39 -07001414 if (bss > len) {
1415 error = vm_brk(len, bss - len);
Linus Torvalds5d22fc22016-05-27 15:57:31 -07001416 if (error)
Michal Hockoecc2bc82016-05-23 16:25:39 -07001417 goto out_free_ph;
1418 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001419 error = 0;
1420
1421out_free_ph:
1422 kfree(elf_phdata);
1423out:
1424 return error;
1425}
Josh Triplett69369a72014-04-03 14:48:27 -07001426#endif /* #ifdef CONFIG_USELIB */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001427
Christoph Hellwig698ba7b2009-12-15 16:47:37 -08001428#ifdef CONFIG_ELF_CORE
Linus Torvalds1da177e2005-04-16 15:20:36 -07001429/*
1430 * ELF core dumper
1431 *
1432 * Modelled on fs/exec.c:aout_core_dump()
1433 * Jeremy Fitzhardinge <jeremy@sw.oz.au>
1434 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001435
/*
 * An ELF note in memory.
 *
 * Describes one note before it is written out: writenote() emits a
 * struct elf_note header built from these fields, then the name, then
 * @datasz bytes from @data.
 */
struct memelfnote
{
	const char *name;	/* NUL-terminated note name, e.g. "CORE" */
	int type;		/* note type, stored in n_type */
	unsigned int datasz;	/* size of the payload in bytes */
	void *data;		/* payload; not owned by this struct */
};
1444
1445static int notesize(struct memelfnote *en)
1446{
1447 int sz;
1448
1449 sz = sizeof(struct elf_note);
1450 sz += roundup(strlen(en->name) + 1, 4);
1451 sz += roundup(en->datasz, 4);
1452
1453 return sz;
1454}
1455
Al Viroecc8c772013-10-05 15:32:35 -04001456static int writenote(struct memelfnote *men, struct coredump_params *cprm)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001457{
1458 struct elf_note en;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001459 en.n_namesz = strlen(men->name) + 1;
1460 en.n_descsz = men->datasz;
1461 en.n_type = men->type;
1462
Al Viroecc8c772013-10-05 15:32:35 -04001463 return dump_emit(cprm, &en, sizeof(en)) &&
Al Viro22a8cb82013-10-08 11:05:01 -04001464 dump_emit(cprm, men->name, en.n_namesz) && dump_align(cprm, 4) &&
1465 dump_emit(cprm, men->data, men->datasz) && dump_align(cprm, 4);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001466}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001467
Roland McGrath3aba4812008-01-30 13:31:44 +01001468static void fill_elf_header(struct elfhdr *elf, int segs,
Zhang Yanfeid3330cf2013-02-21 16:44:20 -08001469 u16 machine, u32 flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001470{
Cyrill Gorcunov6970c8e2008-04-29 01:01:18 -07001471 memset(elf, 0, sizeof(*elf));
1472
Linus Torvalds1da177e2005-04-16 15:20:36 -07001473 memcpy(elf->e_ident, ELFMAG, SELFMAG);
1474 elf->e_ident[EI_CLASS] = ELF_CLASS;
1475 elf->e_ident[EI_DATA] = ELF_DATA;
1476 elf->e_ident[EI_VERSION] = EV_CURRENT;
1477 elf->e_ident[EI_OSABI] = ELF_OSABI;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001478
1479 elf->e_type = ET_CORE;
Roland McGrath3aba4812008-01-30 13:31:44 +01001480 elf->e_machine = machine;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001481 elf->e_version = EV_CURRENT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001482 elf->e_phoff = sizeof(struct elfhdr);
Roland McGrath3aba4812008-01-30 13:31:44 +01001483 elf->e_flags = flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001484 elf->e_ehsize = sizeof(struct elfhdr);
1485 elf->e_phentsize = sizeof(struct elf_phdr);
1486 elf->e_phnum = segs;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001487}
1488
Andrew Morton8d6b5eee2006-09-25 23:32:04 -07001489static void fill_elf_note_phdr(struct elf_phdr *phdr, int sz, loff_t offset)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001490{
1491 phdr->p_type = PT_NOTE;
1492 phdr->p_offset = offset;
1493 phdr->p_vaddr = 0;
1494 phdr->p_paddr = 0;
1495 phdr->p_filesz = sz;
1496 phdr->p_memsz = 0;
1497 phdr->p_flags = 0;
1498 phdr->p_align = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001499}
1500
1501static void fill_note(struct memelfnote *note, const char *name, int type,
1502 unsigned int sz, void *data)
1503{
1504 note->name = name;
1505 note->type = type;
1506 note->datasz = sz;
1507 note->data = data;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001508}
1509
1510/*
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001511 * fill up all the fields in prstatus from the given task struct, except
1512 * registers which need to be filled up separately.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001513 */
Al Virof2485a22020-06-13 00:08:44 -04001514static void fill_prstatus(struct elf_prstatus_common *prstatus,
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001515 struct task_struct *p, long signr)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001516{
1517 prstatus->pr_info.si_signo = prstatus->pr_cursig = signr;
1518 prstatus->pr_sigpend = p->pending.signal.sig[0];
1519 prstatus->pr_sighold = p->blocked.sig[0];
Oleg Nesterov3b34fc52009-06-17 16:27:38 -07001520 rcu_read_lock();
1521 prstatus->pr_ppid = task_pid_vnr(rcu_dereference(p->real_parent));
1522 rcu_read_unlock();
Pavel Emelyanovb4888932007-10-18 23:40:14 -07001523 prstatus->pr_pid = task_pid_vnr(p);
Pavel Emelyanovb4888932007-10-18 23:40:14 -07001524 prstatus->pr_pgrp = task_pgrp_vnr(p);
1525 prstatus->pr_sid = task_session_vnr(p);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001526 if (thread_group_leader(p)) {
Frederic Weisbeckercd19c362017-01-31 04:09:27 +01001527 struct task_cputime cputime;
Frank Mayharf06febc2008-09-12 09:54:39 -07001528
Linus Torvalds1da177e2005-04-16 15:20:36 -07001529 /*
Frank Mayharf06febc2008-09-12 09:54:39 -07001530 * This is the record for the group leader. It shows the
1531 * group-wide total, not its individual thread total.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001532 */
Frederic Weisbeckercd19c362017-01-31 04:09:27 +01001533 thread_group_cputime(p, &cputime);
Arnd Bergmanne2bb80d2017-11-23 13:46:33 +01001534 prstatus->pr_utime = ns_to_kernel_old_timeval(cputime.utime);
1535 prstatus->pr_stime = ns_to_kernel_old_timeval(cputime.stime);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001536 } else {
Frederic Weisbeckercd19c362017-01-31 04:09:27 +01001537 u64 utime, stime;
Frederic Weisbecker6fac4822012-11-13 14:20:55 +01001538
Frederic Weisbeckercd19c362017-01-31 04:09:27 +01001539 task_cputime(p, &utime, &stime);
Arnd Bergmanne2bb80d2017-11-23 13:46:33 +01001540 prstatus->pr_utime = ns_to_kernel_old_timeval(utime);
1541 prstatus->pr_stime = ns_to_kernel_old_timeval(stime);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001542 }
Frederic Weisbecker5613fda2017-01-31 04:09:23 +01001543
Arnd Bergmanne2bb80d2017-11-23 13:46:33 +01001544 prstatus->pr_cutime = ns_to_kernel_old_timeval(p->signal->cutime);
1545 prstatus->pr_cstime = ns_to_kernel_old_timeval(p->signal->cstime);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001546}
1547
1548static int fill_psinfo(struct elf_prpsinfo *psinfo, struct task_struct *p,
1549 struct mm_struct *mm)
1550{
David Howellsc69e8d92008-11-14 10:39:19 +11001551 const struct cred *cred;
Greg Kroah-Hartmana84a5052005-05-11 00:10:44 -07001552 unsigned int i, len;
Peter Zijlstra2f064a52021-06-11 10:28:17 +02001553 unsigned int state;
1554
Linus Torvalds1da177e2005-04-16 15:20:36 -07001555 /* first copy the parameters from user space */
1556 memset(psinfo, 0, sizeof(struct elf_prpsinfo));
1557
1558 len = mm->arg_end - mm->arg_start;
1559 if (len >= ELF_PRARGSZ)
1560 len = ELF_PRARGSZ-1;
1561 if (copy_from_user(&psinfo->pr_psargs,
1562 (const char __user *)mm->arg_start, len))
1563 return -EFAULT;
1564 for(i = 0; i < len; i++)
1565 if (psinfo->pr_psargs[i] == 0)
1566 psinfo->pr_psargs[i] = ' ';
1567 psinfo->pr_psargs[len] = 0;
1568
Oleg Nesterov3b34fc52009-06-17 16:27:38 -07001569 rcu_read_lock();
1570 psinfo->pr_ppid = task_pid_vnr(rcu_dereference(p->real_parent));
1571 rcu_read_unlock();
Pavel Emelyanovb4888932007-10-18 23:40:14 -07001572 psinfo->pr_pid = task_pid_vnr(p);
Pavel Emelyanovb4888932007-10-18 23:40:14 -07001573 psinfo->pr_pgrp = task_pgrp_vnr(p);
1574 psinfo->pr_sid = task_session_vnr(p);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001575
Peter Zijlstra2f064a52021-06-11 10:28:17 +02001576 state = READ_ONCE(p->__state);
1577 i = state ? ffz(~state) + 1 : 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001578 psinfo->pr_state = i;
Carsten Otte55148542006-03-25 03:08:22 -08001579 psinfo->pr_sname = (i > 5) ? '.' : "RSDTZW"[i];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001580 psinfo->pr_zomb = psinfo->pr_sname == 'Z';
1581 psinfo->pr_nice = task_nice(p);
1582 psinfo->pr_flag = p->flags;
David Howellsc69e8d92008-11-14 10:39:19 +11001583 rcu_read_lock();
1584 cred = __task_cred(p);
Eric W. Biedermanebc887b2012-02-07 18:36:10 -08001585 SET_UID(psinfo->pr_uid, from_kuid_munged(cred->user_ns, cred->uid));
1586 SET_GID(psinfo->pr_gid, from_kgid_munged(cred->user_ns, cred->gid));
David Howellsc69e8d92008-11-14 10:39:19 +11001587 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001588 strncpy(psinfo->pr_fname, p->comm, sizeof(psinfo->pr_fname));
Peter Zijlstra2f064a52021-06-11 10:28:17 +02001589
Linus Torvalds1da177e2005-04-16 15:20:36 -07001590 return 0;
1591}
1592
Roland McGrath3aba4812008-01-30 13:31:44 +01001593static void fill_auxv_note(struct memelfnote *note, struct mm_struct *mm)
1594{
1595 elf_addr_t *auxv = (elf_addr_t *) mm->saved_auxv;
1596 int i = 0;
1597 do
1598 i += 2;
1599 while (auxv[i - 2] != AT_NULL);
1600 fill_note(note, "CORE", NT_AUXV, i * sizeof(elf_addr_t), auxv);
1601}
1602
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001603static void fill_siginfo_note(struct memelfnote *note, user_siginfo_t *csigdata,
Eric W. Biedermanae7795b2018-09-25 11:27:20 +02001604 const kernel_siginfo_t *siginfo)
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001605{
Eric W. Biedermanfa4751f2020-05-05 12:12:54 +02001606 copy_siginfo_to_external(csigdata, siginfo);
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001607 fill_note(note, "CORE", NT_SIGINFO, sizeof(*csigdata), csigdata);
1608}
1609
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001610#define MAX_FILE_NOTE_SIZE (4*1024*1024)
1611/*
1612 * Format of NT_FILE note:
1613 *
1614 * long count -- how many files are mapped
1615 * long page_size -- units for file_ofs
1616 * array of [COUNT] elements of
1617 * long start
1618 * long end
1619 * long file_ofs
1620 * followed by COUNT filenames in ASCII: "FILE1" NUL "FILE2" NUL...
1621 */
Dan Aloni72023652013-09-30 13:45:02 -07001622static int fill_files_note(struct memelfnote *note)
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001623{
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001624 struct mm_struct *mm = current->mm;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001625 struct vm_area_struct *vma;
1626 unsigned count, size, names_ofs, remaining, n;
1627 user_long_t *data;
1628 user_long_t *start_end_ofs;
1629 char *name_base, *name_curpos;
1630
1631 /* *Estimated* file count and total data size needed */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001632 count = mm->map_count;
Alexey Dobriyan60c9d922018-02-06 15:39:13 -08001633 if (count > UINT_MAX / 64)
1634 return -EINVAL;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001635 size = count * 64;
1636
1637 names_ofs = (2 + 3 * count) * sizeof(data[0]);
1638 alloc:
1639 if (size >= MAX_FILE_NOTE_SIZE) /* paranoia check */
Dan Aloni72023652013-09-30 13:45:02 -07001640 return -EINVAL;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001641 size = round_up(size, PAGE_SIZE);
Alexey Dobriyan1fbede62020-01-30 22:17:10 -08001642 /*
1643 * "size" can be 0 here legitimately.
1644 * Let it ENOMEM and omit NT_FILE section which will be empty anyway.
1645 */
Alexey Dobriyan86a2bb52018-06-14 15:27:24 -07001646 data = kvmalloc(size, GFP_KERNEL);
1647 if (ZERO_OR_NULL_PTR(data))
Dan Aloni72023652013-09-30 13:45:02 -07001648 return -ENOMEM;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001649
1650 start_end_ofs = data + 2;
1651 name_base = name_curpos = ((char *)data) + names_ofs;
1652 remaining = size - names_ofs;
1653 count = 0;
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001654 for (vma = mm->mmap; vma != NULL; vma = vma->vm_next) {
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001655 struct file *file;
1656 const char *filename;
1657
1658 file = vma->vm_file;
1659 if (!file)
1660 continue;
Miklos Szeredi9bf39ab2015-06-19 10:29:13 +02001661 filename = file_path(file, name_curpos, remaining);
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001662 if (IS_ERR(filename)) {
1663 if (PTR_ERR(filename) == -ENAMETOOLONG) {
Alexey Dobriyan86a2bb52018-06-14 15:27:24 -07001664 kvfree(data);
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001665 size = size * 5 / 4;
1666 goto alloc;
1667 }
1668 continue;
1669 }
1670
Miklos Szeredi9bf39ab2015-06-19 10:29:13 +02001671 /* file_path() fills at the end, move name down */
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001672 /* n = strlen(filename) + 1: */
1673 n = (name_curpos + remaining) - filename;
1674 remaining = filename - name_curpos;
1675 memmove(name_curpos, filename, n);
1676 name_curpos += n;
1677
1678 *start_end_ofs++ = vma->vm_start;
1679 *start_end_ofs++ = vma->vm_end;
1680 *start_end_ofs++ = vma->vm_pgoff;
1681 count++;
1682 }
1683
1684 /* Now we know exact count of files, can store it */
1685 data[0] = count;
1686 data[1] = PAGE_SIZE;
1687 /*
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001688 * Count usually is less than mm->map_count,
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001689 * we need to move filenames down.
1690 */
Alexey Dobriyan03c6d722020-01-30 22:16:58 -08001691 n = mm->map_count - count;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001692 if (n != 0) {
1693 unsigned shift_bytes = n * 3 * sizeof(data[0]);
1694 memmove(name_base - shift_bytes, name_base,
1695 name_curpos - name_base);
1696 name_curpos -= shift_bytes;
1697 }
1698
1699 size = name_curpos - (char *)data;
1700 fill_note(note, "CORE", NT_FILE, size, data);
Dan Aloni72023652013-09-30 13:45:02 -07001701 return 0;
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001702}
1703
Roland McGrath4206d3a2008-01-30 13:31:45 +01001704#ifdef CORE_DUMP_USE_REGSET
1705#include <linux/regset.h>
1706
/*
 * Per-thread state collected for the core dump (regset variant).
 * Instances form a singly linked list headed by elf_note_info.thread.
 */
struct elf_thread_core_info {
	struct elf_thread_core_info *next;	/* next thread, NULL at the end */
	struct task_struct *task;		/* the thread being described */
	struct elf_prstatus prstatus;		/* payload of notes[0] (NT_PRSTATUS) */
	struct memelfnote notes[];		/* sized from elf_note_info.thread_notes */
};
1713
/*
 * Everything gathered for the note segment of a core dump (regset
 * variant): the per-thread list plus the process-wide notes.
 */
struct elf_note_info {
	struct elf_thread_core_info *thread;	/* list of threads, dumping task first */
	struct memelfnote psinfo;		/* NT_PRPSINFO */
	struct memelfnote signote;		/* NT_SIGINFO */
	struct memelfnote auxv;			/* NT_AUXV */
	struct memelfnote files;		/* NT_FILE; data is NULL when absent */
	user_siginfo_t csigdata;		/* storage backing signote */
	size_t size;				/* running total of notesize() for all notes */
	int thread_notes;			/* number of regsets with a core_note_type */
};
1724
Roland McGrathd31472b2008-03-04 14:28:30 -08001725/*
1726 * When a regset has a writeback hook, we call it on each thread before
1727 * dumping user memory. On register window machines, this makes sure the
1728 * user memory backing the register data is up to date before we read it.
1729 */
1730static void do_thread_regset_writeback(struct task_struct *task,
1731 const struct user_regset *regset)
1732{
1733 if (regset->writeback)
1734 regset->writeback(task, regset, 1);
1735}
1736
/*
 * Fallback used when nothing earlier has defined PRSTATUS_SIZE: the
 * NT_PRSTATUS payload is a whole struct elf_prstatus.
 */
#ifndef PRSTATUS_SIZE
#define PRSTATUS_SIZE sizeof(struct elf_prstatus)
#endif

/*
 * Fallback used when nothing earlier has defined SET_PR_FPVALID: mark
 * the prstatus pointed to by S as having valid FP register state.
 */
#ifndef SET_PR_FPVALID
#define SET_PR_FPVALID(S) ((S)->pr_fpvalid = 1)
#endif
1744
Roland McGrath4206d3a2008-01-30 13:31:45 +01001745static int fill_thread_core_info(struct elf_thread_core_info *t,
1746 const struct user_regset_view *view,
1747 long signr, size_t *total)
1748{
1749 unsigned int i;
1750
1751 /*
1752 * NT_PRSTATUS is the one special case, because the regset data
1753 * goes into the pr_reg field inside the note contents, rather
1754 * than being the whole note contents. We fill the reset in here.
1755 * We assume that regset 0 is NT_PRSTATUS.
1756 */
Al Virof2485a22020-06-13 00:08:44 -04001757 fill_prstatus(&t->prstatus.common, t->task, signr);
Al Viro8a00dd02020-06-22 20:14:02 -04001758 regset_get(t->task, &view->regsets[0],
Al Virob4e9c952020-06-01 19:42:40 -04001759 sizeof(t->prstatus.pr_reg), &t->prstatus.pr_reg);
Roland McGrath4206d3a2008-01-30 13:31:45 +01001760
1761 fill_note(&t->notes[0], "CORE", NT_PRSTATUS,
Al Viro8a00dd02020-06-22 20:14:02 -04001762 PRSTATUS_SIZE, &t->prstatus);
Roland McGrath4206d3a2008-01-30 13:31:45 +01001763 *total += notesize(&t->notes[0]);
1764
Roland McGrathd31472b2008-03-04 14:28:30 -08001765 do_thread_regset_writeback(t->task, &view->regsets[0]);
1766
Roland McGrath4206d3a2008-01-30 13:31:45 +01001767 /*
1768 * Each other regset might generate a note too. For each regset
1769 * that has no core_note_type or is inactive, we leave t->notes[i]
1770 * all zero and we'll know to skip writing it later.
1771 */
1772 for (i = 1; i < view->n; ++i) {
1773 const struct user_regset *regset = &view->regsets[i];
Al Virob4e9c952020-06-01 19:42:40 -04001774 int note_type = regset->core_note_type;
1775 bool is_fpreg = note_type == NT_PRFPREG;
1776 void *data;
1777 int ret;
1778
Roland McGrathd31472b2008-03-04 14:28:30 -08001779 do_thread_regset_writeback(t->task, regset);
Al Virob4e9c952020-06-01 19:42:40 -04001780 if (!note_type) // not for coredumps
1781 continue;
1782 if (regset->active && regset->active(t->task, regset) <= 0)
1783 continue;
1784
1785 ret = regset_get_alloc(t->task, regset, ~0U, &data);
1786 if (ret < 0)
1787 continue;
1788
1789 if (is_fpreg)
Al Viro8a00dd02020-06-22 20:14:02 -04001790 SET_PR_FPVALID(&t->prstatus);
Al Virob4e9c952020-06-01 19:42:40 -04001791
1792 fill_note(&t->notes[i], is_fpreg ? "CORE" : "LINUX",
1793 note_type, ret, data);
1794
1795 *total += notesize(&t->notes[i]);
Roland McGrath4206d3a2008-01-30 13:31:45 +01001796 }
1797
1798 return 1;
1799}
1800
1801static int fill_note_info(struct elfhdr *elf, int phdrs,
1802 struct elf_note_info *info,
Eric W. Biedermanae7795b2018-09-25 11:27:20 +02001803 const kernel_siginfo_t *siginfo, struct pt_regs *regs)
Roland McGrath4206d3a2008-01-30 13:31:45 +01001804{
1805 struct task_struct *dump_task = current;
1806 const struct user_regset_view *view = task_user_regset_view(dump_task);
1807 struct elf_thread_core_info *t;
1808 struct elf_prpsinfo *psinfo;
Oleg Nesterov83914442008-07-25 01:47:45 -07001809 struct core_thread *ct;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001810 unsigned int i;
1811
1812 info->size = 0;
1813 info->thread = NULL;
1814
1815 psinfo = kmalloc(sizeof(*psinfo), GFP_KERNEL);
Alan Cox6899e922012-12-17 16:02:09 -08001816 if (psinfo == NULL) {
1817 info->psinfo.data = NULL; /* So we don't free this wrongly */
Roland McGrath4206d3a2008-01-30 13:31:45 +01001818 return 0;
Alan Cox6899e922012-12-17 16:02:09 -08001819 }
Roland McGrath4206d3a2008-01-30 13:31:45 +01001820
Amerigo Wange2dbe122009-07-01 01:06:26 -04001821 fill_note(&info->psinfo, "CORE", NT_PRPSINFO, sizeof(*psinfo), psinfo);
1822
Roland McGrath4206d3a2008-01-30 13:31:45 +01001823 /*
1824 * Figure out how many notes we're going to need for each thread.
1825 */
1826 info->thread_notes = 0;
1827 for (i = 0; i < view->n; ++i)
1828 if (view->regsets[i].core_note_type != 0)
1829 ++info->thread_notes;
1830
1831 /*
1832 * Sanity check. We rely on regset 0 being in NT_PRSTATUS,
1833 * since it is our one special case.
1834 */
1835 if (unlikely(info->thread_notes == 0) ||
1836 unlikely(view->regsets[0].core_note_type != NT_PRSTATUS)) {
1837 WARN_ON(1);
1838 return 0;
1839 }
1840
1841 /*
1842 * Initialize the ELF file header.
1843 */
1844 fill_elf_header(elf, phdrs,
Zhang Yanfeid3330cf2013-02-21 16:44:20 -08001845 view->e_machine, view->e_flags);
Roland McGrath4206d3a2008-01-30 13:31:45 +01001846
1847 /*
1848 * Allocate a structure for each thread.
1849 */
Eric W. Biederman0258b5f2021-09-22 11:24:02 -05001850 for (ct = &dump_task->signal->core_state->dumper; ct; ct = ct->next) {
Oleg Nesterov83914442008-07-25 01:47:45 -07001851 t = kzalloc(offsetof(struct elf_thread_core_info,
1852 notes[info->thread_notes]),
1853 GFP_KERNEL);
1854 if (unlikely(!t))
1855 return 0;
Oleg Nesterov24d52882008-07-25 01:47:40 -07001856
Oleg Nesterov83914442008-07-25 01:47:45 -07001857 t->task = ct->task;
1858 if (ct->task == dump_task || !info->thread) {
1859 t->next = info->thread;
1860 info->thread = t;
1861 } else {
1862 /*
1863 * Make sure to keep the original task at
1864 * the head of the list.
1865 */
1866 t->next = info->thread->next;
1867 info->thread->next = t;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001868 }
Oleg Nesterov83914442008-07-25 01:47:45 -07001869 }
Roland McGrath4206d3a2008-01-30 13:31:45 +01001870
1871 /*
1872 * Now fill in each thread's information.
1873 */
1874 for (t = info->thread; t != NULL; t = t->next)
Denys Vlasenko5ab1c302012-10-04 17:15:29 -07001875 if (!fill_thread_core_info(t, view, siginfo->si_signo, &info->size))
Roland McGrath4206d3a2008-01-30 13:31:45 +01001876 return 0;
1877
1878 /*
1879 * Fill in the two process-wide notes.
1880 */
1881 fill_psinfo(psinfo, dump_task->group_leader, dump_task->mm);
1882 info->size += notesize(&info->psinfo);
1883
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001884 fill_siginfo_note(&info->signote, &info->csigdata, siginfo);
1885 info->size += notesize(&info->signote);
1886
Roland McGrath4206d3a2008-01-30 13:31:45 +01001887 fill_auxv_note(&info->auxv, current->mm);
1888 info->size += notesize(&info->auxv);
1889
Dan Aloni72023652013-09-30 13:45:02 -07001890 if (fill_files_note(&info->files) == 0)
1891 info->size += notesize(&info->files);
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001892
Roland McGrath4206d3a2008-01-30 13:31:45 +01001893 return 1;
1894}
1895
/*
 * Total size of all notes, as accumulated in info->size while the notes
 * were being filled in.
 */
static size_t get_note_info_size(struct elf_note_info *info)
{
	return info->size;
}
1900
1901/*
1902 * Write all the notes for each thread. When writing the first thread, the
1903 * process-wide notes are interleaved after the first thread-specific note.
1904 */
1905static int write_note_info(struct elf_note_info *info,
Al Viroecc8c772013-10-05 15:32:35 -04001906 struct coredump_params *cprm)
Roland McGrath4206d3a2008-01-30 13:31:45 +01001907{
Fabian Frederickb219e252014-06-04 16:12:14 -07001908 bool first = true;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001909 struct elf_thread_core_info *t = info->thread;
1910
1911 do {
1912 int i;
1913
Al Viroecc8c772013-10-05 15:32:35 -04001914 if (!writenote(&t->notes[0], cprm))
Roland McGrath4206d3a2008-01-30 13:31:45 +01001915 return 0;
1916
Al Viroecc8c772013-10-05 15:32:35 -04001917 if (first && !writenote(&info->psinfo, cprm))
Roland McGrath4206d3a2008-01-30 13:31:45 +01001918 return 0;
Al Viroecc8c772013-10-05 15:32:35 -04001919 if (first && !writenote(&info->signote, cprm))
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07001920 return 0;
Al Viroecc8c772013-10-05 15:32:35 -04001921 if (first && !writenote(&info->auxv, cprm))
Roland McGrath4206d3a2008-01-30 13:31:45 +01001922 return 0;
Dan Aloni72023652013-09-30 13:45:02 -07001923 if (first && info->files.data &&
Al Viroecc8c772013-10-05 15:32:35 -04001924 !writenote(&info->files, cprm))
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07001925 return 0;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001926
1927 for (i = 1; i < info->thread_notes; ++i)
1928 if (t->notes[i].data &&
Al Viroecc8c772013-10-05 15:32:35 -04001929 !writenote(&t->notes[i], cprm))
Roland McGrath4206d3a2008-01-30 13:31:45 +01001930 return 0;
1931
Fabian Frederickb219e252014-06-04 16:12:14 -07001932 first = false;
Roland McGrath4206d3a2008-01-30 13:31:45 +01001933 t = t->next;
1934 } while (t);
1935
1936 return 1;
1937}
1938
1939static void free_note_info(struct elf_note_info *info)
1940{
1941 struct elf_thread_core_info *threads = info->thread;
1942 while (threads) {
1943 unsigned int i;
1944 struct elf_thread_core_info *t = threads;
1945 threads = t->next;
1946 WARN_ON(t->notes[0].data && t->notes[0].data != &t->prstatus);
1947 for (i = 1; i < info->thread_notes; ++i)
1948 kfree(t->notes[i].data);
1949 kfree(t);
1950 }
1951 kfree(info->psinfo.data);
Alexey Dobriyan86a2bb52018-06-14 15:27:24 -07001952 kvfree(info->files.data);
Roland McGrath4206d3a2008-01-30 13:31:45 +01001953}
1954
1955#else
1956
/*
 * Here is the structure in which status of each thread is captured.
 * Instances are linked into elf_note_info.thread_list.
 */
struct elf_thread_status
{
	struct list_head list;		/* entry in elf_note_info.thread_list */
	struct elf_prstatus prstatus;	/* NT_PRSTATUS */
	elf_fpregset_t fpu;		/* NT_PRFPREG */
	struct task_struct *thread;	/* the thread being described */
	struct memelfnote notes[3];	/* notes referring to the fields above */
	int num_notes;			/* how many entries of notes[] are in use */
};
1967
1968/*
1969 * In order to add the specific thread information for the elf file format,
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001970 * we need to keep a linked list of every threads pr_status and then create
1971 * a single section for them in the final core file.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001972 */
1973static int elf_dump_thread_status(long signr, struct elf_thread_status *t)
1974{
1975 int sz = 0;
1976 struct task_struct *p = t->thread;
1977 t->num_notes = 0;
1978
Al Virof2485a22020-06-13 00:08:44 -04001979 fill_prstatus(&t->prstatus.common, p, signr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001980 elf_core_copy_task_regs(p, &t->prstatus.pr_reg);
1981
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001982 fill_note(&t->notes[0], "CORE", NT_PRSTATUS, sizeof(t->prstatus),
1983 &(t->prstatus));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001984 t->num_notes++;
1985 sz += notesize(&t->notes[0]);
1986
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07001987 if ((t->prstatus.pr_fpvalid = elf_core_copy_task_fpregs(p, NULL,
1988 &t->fpu))) {
1989 fill_note(&t->notes[1], "CORE", NT_PRFPREG, sizeof(t->fpu),
1990 &(t->fpu));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001991 t->num_notes++;
1992 sz += notesize(&t->notes[1]);
1993 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001994 return sz;
1995}
1996
/*
 * Everything gathered for the note segment of a core dump (variant used
 * when CORE_DUMP_USE_REGSET is not defined).
 */
struct elf_note_info {
	struct memelfnote *notes;		/* array of process-wide notes */
	struct memelfnote *notes_files;		/* the NT_FILE entry in notes[], if any */
	struct elf_prstatus *prstatus;	/* NT_PRSTATUS */
	struct elf_prpsinfo *psinfo;	/* NT_PRPSINFO */
	struct list_head thread_list;		/* list of struct elf_thread_status */
	elf_fpregset_t *fpu;			/* NT_PRFPREG payload of the current task */
	user_siginfo_t csigdata;		/* storage backing the NT_SIGINFO note */
	int thread_status_size;			/* combined size of the other threads' notes */
	int numnote;				/* number of entries used in notes[] */
};
2008
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002009static int elf_note_info_init(struct elf_note_info *info)
Roland McGrath3aba4812008-01-30 13:31:44 +01002010{
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002011 memset(info, 0, sizeof(*info));
Roland McGrath3aba4812008-01-30 13:31:44 +01002012 INIT_LIST_HEAD(&info->thread_list);
2013
Denys Vlasenko49ae4d42012-10-04 17:15:35 -07002014 /* Allocate space for ELF notes */
Kees Cook6da2ec52018-06-12 13:55:00 -07002015 info->notes = kmalloc_array(8, sizeof(struct memelfnote), GFP_KERNEL);
Roland McGrath3aba4812008-01-30 13:31:44 +01002016 if (!info->notes)
2017 return 0;
2018 info->psinfo = kmalloc(sizeof(*info->psinfo), GFP_KERNEL);
2019 if (!info->psinfo)
Denys Vlasenkof34f9d12012-09-26 11:34:50 +10002020 return 0;
Roland McGrath3aba4812008-01-30 13:31:44 +01002021 info->prstatus = kmalloc(sizeof(*info->prstatus), GFP_KERNEL);
2022 if (!info->prstatus)
Denys Vlasenkof34f9d12012-09-26 11:34:50 +10002023 return 0;
Roland McGrath3aba4812008-01-30 13:31:44 +01002024 info->fpu = kmalloc(sizeof(*info->fpu), GFP_KERNEL);
2025 if (!info->fpu)
Denys Vlasenkof34f9d12012-09-26 11:34:50 +10002026 return 0;
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002027 return 1;
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002028}
Roland McGrath3aba4812008-01-30 13:31:44 +01002029
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002030static int fill_note_info(struct elfhdr *elf, int phdrs,
2031 struct elf_note_info *info,
Eric W. Biedermanae7795b2018-09-25 11:27:20 +02002032 const kernel_siginfo_t *siginfo, struct pt_regs *regs)
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002033{
Al Viroafabada2013-10-14 07:39:56 -04002034 struct core_thread *ct;
2035 struct elf_thread_status *ets;
Amerigo Wang0cf062d2009-09-23 15:57:05 -07002036
2037 if (!elf_note_info_init(info))
2038 return 0;
2039
Eric W. Biederman0258b5f2021-09-22 11:24:02 -05002040 for (ct = current->signal->core_state->dumper.next;
Al Viroafabada2013-10-14 07:39:56 -04002041 ct; ct = ct->next) {
2042 ets = kzalloc(sizeof(*ets), GFP_KERNEL);
2043 if (!ets)
2044 return 0;
Oleg Nesterov24d52882008-07-25 01:47:40 -07002045
Al Viroafabada2013-10-14 07:39:56 -04002046 ets->thread = ct->task;
2047 list_add(&ets->list, &info->thread_list);
2048 }
Oleg Nesterov83914442008-07-25 01:47:45 -07002049
Alexey Dobriyan93f044e2019-03-07 16:28:59 -08002050 list_for_each_entry(ets, &info->thread_list, list) {
Al Viroafabada2013-10-14 07:39:56 -04002051 int sz;
Oleg Nesterov83914442008-07-25 01:47:45 -07002052
Al Viroafabada2013-10-14 07:39:56 -04002053 sz = elf_dump_thread_status(siginfo->si_signo, ets);
2054 info->thread_status_size += sz;
Roland McGrath3aba4812008-01-30 13:31:44 +01002055 }
2056 /* now collect the dump for the current */
2057 memset(info->prstatus, 0, sizeof(*info->prstatus));
Al Virof2485a22020-06-13 00:08:44 -04002058 fill_prstatus(&info->prstatus->common, current, siginfo->si_signo);
Roland McGrath3aba4812008-01-30 13:31:44 +01002059 elf_core_copy_regs(&info->prstatus->pr_reg, regs);
2060
2061 /* Set up header */
Zhang Yanfeid3330cf2013-02-21 16:44:20 -08002062 fill_elf_header(elf, phdrs, ELF_ARCH, ELF_CORE_EFLAGS);
Roland McGrath3aba4812008-01-30 13:31:44 +01002063
2064 /*
2065 * Set up the notes in similar form to SVR4 core dumps made
2066 * with info from their /proc.
2067 */
2068
2069 fill_note(info->notes + 0, "CORE", NT_PRSTATUS,
2070 sizeof(*info->prstatus), info->prstatus);
2071 fill_psinfo(info->psinfo, current->group_leader, current->mm);
2072 fill_note(info->notes + 1, "CORE", NT_PRPSINFO,
2073 sizeof(*info->psinfo), info->psinfo);
2074
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07002075 fill_siginfo_note(info->notes + 2, &info->csigdata, siginfo);
2076 fill_auxv_note(info->notes + 3, current->mm);
Dan Aloni72023652013-09-30 13:45:02 -07002077 info->numnote = 4;
Roland McGrath3aba4812008-01-30 13:31:44 +01002078
Dan Aloni72023652013-09-30 13:45:02 -07002079 if (fill_files_note(info->notes + info->numnote) == 0) {
2080 info->notes_files = info->notes + info->numnote;
2081 info->numnote++;
2082 }
Roland McGrath3aba4812008-01-30 13:31:44 +01002083
2084 /* Try to dump the FPU. */
2085 info->prstatus->pr_fpvalid = elf_core_copy_task_fpregs(current, regs,
2086 info->fpu);
2087 if (info->prstatus->pr_fpvalid)
2088 fill_note(info->notes + info->numnote++,
2089 "CORE", NT_PRFPREG, sizeof(*info->fpu), info->fpu);
Roland McGrath3aba4812008-01-30 13:31:44 +01002090 return 1;
Roland McGrath3aba4812008-01-30 13:31:44 +01002091}
2092
2093static size_t get_note_info_size(struct elf_note_info *info)
2094{
2095 int sz = 0;
2096 int i;
2097
2098 for (i = 0; i < info->numnote; i++)
2099 sz += notesize(info->notes + i);
2100
2101 sz += info->thread_status_size;
2102
2103 return sz;
2104}
2105
2106static int write_note_info(struct elf_note_info *info,
Al Viroecc8c772013-10-05 15:32:35 -04002107 struct coredump_params *cprm)
Roland McGrath3aba4812008-01-30 13:31:44 +01002108{
Alexey Dobriyan93f044e2019-03-07 16:28:59 -08002109 struct elf_thread_status *ets;
Roland McGrath3aba4812008-01-30 13:31:44 +01002110 int i;
Roland McGrath3aba4812008-01-30 13:31:44 +01002111
2112 for (i = 0; i < info->numnote; i++)
Al Viroecc8c772013-10-05 15:32:35 -04002113 if (!writenote(info->notes + i, cprm))
Roland McGrath3aba4812008-01-30 13:31:44 +01002114 return 0;
2115
2116 /* write out the thread status notes section */
Alexey Dobriyan93f044e2019-03-07 16:28:59 -08002117 list_for_each_entry(ets, &info->thread_list, list) {
2118 for (i = 0; i < ets->num_notes; i++)
2119 if (!writenote(&ets->notes[i], cprm))
Roland McGrath3aba4812008-01-30 13:31:44 +01002120 return 0;
2121 }
2122
2123 return 1;
2124}
2125
2126static void free_note_info(struct elf_note_info *info)
2127{
2128 while (!list_empty(&info->thread_list)) {
2129 struct list_head *tmp = info->thread_list.next;
2130 list_del(tmp);
2131 kfree(list_entry(tmp, struct elf_thread_status, list));
2132 }
2133
Dan Aloni72023652013-09-30 13:45:02 -07002134 /* Free data possibly allocated by fill_files_note(): */
2135 if (info->notes_files)
Alexey Dobriyan86a2bb52018-06-14 15:27:24 -07002136 kvfree(info->notes_files->data);
Denys Vlasenko2aa362c2012-10-04 17:15:36 -07002137
Roland McGrath3aba4812008-01-30 13:31:44 +01002138 kfree(info->prstatus);
2139 kfree(info->psinfo);
2140 kfree(info->notes);
2141 kfree(info->fpu);
Roland McGrath3aba4812008-01-30 13:31:44 +01002142}
2143
Roland McGrath4206d3a2008-01-30 13:31:45 +01002144#endif
2145
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002146static void fill_extnum_info(struct elfhdr *elf, struct elf_shdr *shdr4extnum,
2147 elf_addr_t e_shoff, int segs)
2148{
2149 elf->e_shoff = e_shoff;
2150 elf->e_shentsize = sizeof(*shdr4extnum);
2151 elf->e_shnum = 1;
2152 elf->e_shstrndx = SHN_UNDEF;
2153
2154 memset(shdr4extnum, 0, sizeof(*shdr4extnum));
2155
2156 shdr4extnum->sh_type = SHT_NULL;
2157 shdr4extnum->sh_size = elf->e_shnum;
2158 shdr4extnum->sh_link = elf->e_shstrndx;
2159 shdr4extnum->sh_info = segs;
2160}
2161
Linus Torvalds1da177e2005-04-16 15:20:36 -07002162/*
2163 * Actual dumper
2164 *
2165 * This is a two-pass process; first we find the offsets of the bits,
2166 * and then they are actually written out. If we run out of core limit
2167 * we just truncate.
2168 */
Masami Hiramatsuf6151df2009-12-17 15:27:16 -08002169static int elf_core_dump(struct coredump_params *cprm)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002170{
Linus Torvalds1da177e2005-04-16 15:20:36 -07002171 int has_dumped = 0;
Jann Horna07279c2020-10-15 20:12:54 -07002172 int vma_count, segs, i;
2173 size_t vma_data_size;
Alexey Dobriyan225a3f52020-01-30 22:17:04 -08002174 struct elfhdr elf;
Al Virocdc3d562013-10-05 22:24:29 -04002175 loff_t offset = 0, dataoff;
Dan Aloni72023652013-09-30 13:45:02 -07002176 struct elf_note_info info = { };
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002177 struct elf_phdr *phdr4note = NULL;
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002178 struct elf_shdr *shdr4extnum = NULL;
2179 Elf_Half e_phnum;
2180 elf_addr_t e_shoff;
Jann Horna07279c2020-10-15 20:12:54 -07002181 struct core_vma_metadata *vma_meta;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002182
Jann Horna07279c2020-10-15 20:12:54 -07002183 if (dump_vma_snapshot(cprm, &vma_count, &vma_meta, &vma_data_size))
2184 return 0;
2185
KAMEZAWA Hiroyuki341c87b2009-06-30 11:41:23 -07002186 /*
2187 * The number of segs are recored into ELF header as 16bit value.
2188 * Please check DEFAULT_MAX_MAP_COUNT definition when you modify here.
2189 */
Jann Horna07279c2020-10-15 20:12:54 -07002190 segs = vma_count + elf_core_extra_phdrs();
Roland McGrathf47aef52007-01-26 00:56:49 -08002191
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002192 /* for notes section */
2193 segs++;
2194
2195 /* If segs > PN_XNUM(0xffff), then e_phnum overflows. To avoid
2196 * this, kernel supports extended numbering. Have a look at
2197 * include/linux/elf.h for further information. */
2198 e_phnum = segs > PN_XNUM ? PN_XNUM : segs;
2199
Roland McGrath3aba4812008-01-30 13:31:44 +01002200 /*
2201 * Collect all the non-memory information about the process for the
2202 * notes. This also sets up the file header.
2203 */
Alexey Dobriyan225a3f52020-01-30 22:17:04 -08002204 if (!fill_note_info(&elf, e_phnum, &info, cprm->siginfo, cprm->regs))
Christoph Hellwigd2530b42020-05-05 12:12:55 +02002205 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002206
2207 has_dumped = 1;
Oleg Nesterov079148b2013-04-30 15:28:16 -07002208
Alexey Dobriyan225a3f52020-01-30 22:17:04 -08002209 offset += sizeof(elf); /* Elf header */
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002210 offset += segs * sizeof(struct elf_phdr); /* Program headers */
Linus Torvalds1da177e2005-04-16 15:20:36 -07002211
2212 /* Write notes phdr entry */
2213 {
Roland McGrath3aba4812008-01-30 13:31:44 +01002214 size_t sz = get_note_info_size(&info);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002215
Eric W. Biedermanc39ab6d2020-11-25 15:51:32 -06002216 /* For cell spufs */
Michael Ellermane5501492007-09-19 14:38:12 +10002217 sz += elf_coredump_extra_notes_size();
Dwayne Grant McConnellbf1ab972006-11-23 00:46:37 +01002218
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002219 phdr4note = kmalloc(sizeof(*phdr4note), GFP_KERNEL);
2220 if (!phdr4note)
Daisuke HATAYAMA088e7af2010-03-05 13:44:06 -08002221 goto end_coredump;
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002222
2223 fill_elf_note_phdr(phdr4note, sz, offset);
2224 offset += sz;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002225 }
2226
Linus Torvalds1da177e2005-04-16 15:20:36 -07002227 dataoff = offset = roundup(offset, ELF_EXEC_PAGESIZE);
2228
Jungseung Lee52f5592e2014-12-10 15:52:16 -08002229 offset += vma_data_size;
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002230 offset += elf_core_extra_data_size();
2231 e_shoff = offset;
2232
2233 if (e_phnum == PN_XNUM) {
2234 shdr4extnum = kmalloc(sizeof(*shdr4extnum), GFP_KERNEL);
2235 if (!shdr4extnum)
2236 goto end_coredump;
Alexey Dobriyan225a3f52020-01-30 22:17:04 -08002237 fill_extnum_info(&elf, shdr4extnum, e_shoff, segs);
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002238 }
2239
2240 offset = dataoff;
2241
Alexey Dobriyan225a3f52020-01-30 22:17:04 -08002242 if (!dump_emit(cprm, &elf, sizeof(elf)))
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002243 goto end_coredump;
2244
Al Viroecc8c772013-10-05 15:32:35 -04002245 if (!dump_emit(cprm, phdr4note, sizeof(*phdr4note)))
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002246 goto end_coredump;
2247
Linus Torvalds1da177e2005-04-16 15:20:36 -07002248 /* Write program headers for segments dump */
Jann Horna07279c2020-10-15 20:12:54 -07002249 for (i = 0; i < vma_count; i++) {
2250 struct core_vma_metadata *meta = vma_meta + i;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002251 struct elf_phdr phdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002252
2253 phdr.p_type = PT_LOAD;
2254 phdr.p_offset = offset;
Jann Horna07279c2020-10-15 20:12:54 -07002255 phdr.p_vaddr = meta->start;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002256 phdr.p_paddr = 0;
Jann Horna07279c2020-10-15 20:12:54 -07002257 phdr.p_filesz = meta->dump_size;
2258 phdr.p_memsz = meta->end - meta->start;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002259 offset += phdr.p_filesz;
Jann Horna07279c2020-10-15 20:12:54 -07002260 phdr.p_flags = 0;
2261 if (meta->flags & VM_READ)
2262 phdr.p_flags |= PF_R;
2263 if (meta->flags & VM_WRITE)
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07002264 phdr.p_flags |= PF_W;
Jann Horna07279c2020-10-15 20:12:54 -07002265 if (meta->flags & VM_EXEC)
Jesper Juhlf4e5cc22006-06-23 02:05:35 -07002266 phdr.p_flags |= PF_X;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002267 phdr.p_align = ELF_EXEC_PAGESIZE;
2268
Al Viroecc8c772013-10-05 15:32:35 -04002269 if (!dump_emit(cprm, &phdr, sizeof(phdr)))
Daisuke HATAYAMA088e7af2010-03-05 13:44:06 -08002270 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002271 }
2272
Al Viro506f21c2013-10-05 17:22:57 -04002273 if (!elf_core_write_extra_phdrs(cprm, offset))
Daisuke HATAYAMA1fcccba2010-03-05 13:44:07 -08002274 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002275
2276 /* write out the notes section */
Al Viroecc8c772013-10-05 15:32:35 -04002277 if (!write_note_info(&info, cprm))
Roland McGrath3aba4812008-01-30 13:31:44 +01002278 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002279
Eric W. Biedermanc39ab6d2020-11-25 15:51:32 -06002280 /* For cell spufs */
Al Virocdc3d562013-10-05 22:24:29 -04002281 if (elf_coredump_extra_notes_write(cprm))
Michael Ellermane5501492007-09-19 14:38:12 +10002282 goto end_coredump;
Dwayne Grant McConnellbf1ab972006-11-23 00:46:37 +01002283
Andi Kleend025c9d2006-09-30 23:29:28 -07002284 /* Align to page */
Al Virod0f10882020-03-08 09:16:37 -04002285 dump_skip_to(cprm, dataoff);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002286
Jann Horna07279c2020-10-15 20:12:54 -07002287 for (i = 0; i < vma_count; i++) {
2288 struct core_vma_metadata *meta = vma_meta + i;
2289
2290 if (!dump_user_range(cprm, meta->start, meta->dump_size))
Jann Hornafc63a97b2020-10-15 20:12:46 -07002291 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002292 }
2293
Al Viroaa3e7ea2013-10-05 17:50:15 -04002294 if (!elf_core_write_extra_data(cprm))
Daisuke HATAYAMA1fcccba2010-03-05 13:44:07 -08002295 goto end_coredump;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002296
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002297 if (e_phnum == PN_XNUM) {
Al Viro13046ec2013-10-05 18:08:47 -04002298 if (!dump_emit(cprm, shdr4extnum, sizeof(*shdr4extnum)))
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002299 goto end_coredump;
2300 }
2301
Linus Torvalds1da177e2005-04-16 15:20:36 -07002302end_coredump:
Roland McGrath3aba4812008-01-30 13:31:44 +01002303 free_note_info(&info);
Daisuke HATAYAMA8d9032b2010-03-05 13:44:10 -08002304 kfree(shdr4extnum);
Jann Horna07279c2020-10-15 20:12:54 -07002305 kvfree(vma_meta);
Daisuke HATAYAMA93eb2112010-03-05 13:44:09 -08002306 kfree(phdr4note);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002307 return has_dumped;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002308}
2309
Christoph Hellwig698ba7b2009-12-15 16:47:37 -08002310#endif /* CONFIG_ELF_CORE */
Linus Torvalds1da177e2005-04-16 15:20:36 -07002311
/*
 * Init hook: register the ELF binary format handler (elf_format).
 * Always returns 0.
 */
static int __init init_elf_binfmt(void)
{
	register_binfmt(&elf_format);
	return 0;
}
2317
/* Exit hook: undo init_elf_binfmt() by unregistering elf_format. */
static void __exit exit_elf_binfmt(void)
{
	/* Remove the ELF loader. */
	unregister_binfmt(&elf_format);
}
2323
/*
 * Hook the handlers above into the kernel: init_elf_binfmt() is registered
 * through core_initcall(), exit_elf_binfmt() through module_exit().
 */
core_initcall(init_elf_binfmt);
module_exit(exit_elf_binfmt);
MODULE_LICENSE("GPL");