/* SPDX-License-Identifier: GPL-2.0 */
#ifndef _ASM_X86_PROCESSOR_H
#define _ASM_X86_PROCESSOR_H

#include <asm/processor-flags.h>

/* Forward declaration, a strange C thing */
struct task_struct;
struct mm_struct;
struct vm86;

#include <asm/math_emu.h>
#include <asm/segment.h>
#include <asm/types.h>
#include <uapi/asm/sigcontext.h>
#include <asm/current.h>
#include <asm/cpufeatures.h>
#include <asm/page.h>
#include <asm/pgtable_types.h>
#include <asm/percpu.h>
#include <asm/msr.h>
#include <asm/desc_defs.h>
#include <asm/nops.h>
#include <asm/special_insns.h>
#include <asm/fpu/types.h>
#include <asm/unwind_hints.h>

#include <linux/personality.h>
#include <linux/cache.h>
#include <linux/threads.h>
#include <linux/math64.h>
#include <linux/err.h>
#include <linux/irqflags.h>
#include <linux/mem_encrypt.h>

/*
 * We handle most unaligned accesses in hardware. On the other hand,
 * unaligned DMA can be quite expensive on some Nehalem processors.
 *
 * Based on this, we disable IP header alignment in network drivers.
 */
#define NET_IP_ALIGN	0
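
/*
 * Usage sketch (illustrative, not part of this header): network drivers
 * consult NET_IP_ALIGN when reserving skb headroom, so the zero value
 * above makes the usual reservation a no-op on x86:
 *
 *	skb = netdev_alloc_skb(dev, len + NET_IP_ALIGN);
 *	if (skb)
 *		skb_reserve(skb, NET_IP_ALIGN);
 */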

#define HBP_NUM 4
/*
 * Default implementation of macro that returns current
 * instruction pointer ("program counter").
 */
static inline void *current_text_addr(void)
{
	void *pc;

	asm volatile("mov $1f, %0; 1:" : "=r" (pc));

	return pc;
}
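
/*
 * Usage sketch (illustrative): current_text_addr() labels the next
 * instruction and returns its address, e.g. for ad-hoc debug output:
 *
 *	pr_debug("executing near %p\n", current_text_addr());
 */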

/*
 * These alignment constraints are for performance in the vSMP case,
 * but in the task_struct case we must also meet hardware imposed
 * alignment requirements of the FPU state:
 */
#ifdef CONFIG_X86_VSMP
# define ARCH_MIN_TASKALIGN		(1 << INTERNODE_CACHE_SHIFT)
# define ARCH_MIN_MMSTRUCT_ALIGN	(1 << INTERNODE_CACHE_SHIFT)
#else
# define ARCH_MIN_TASKALIGN		__alignof__(union fpregs_state)
# define ARCH_MIN_MMSTRUCT_ALIGN	0
#endif

enum tlb_infos {
	ENTRIES,
	NR_INFO
};

extern u16 __read_mostly tlb_lli_4k[NR_INFO];
extern u16 __read_mostly tlb_lli_2m[NR_INFO];
extern u16 __read_mostly tlb_lli_4m[NR_INFO];
extern u16 __read_mostly tlb_lld_4k[NR_INFO];
extern u16 __read_mostly tlb_lld_2m[NR_INFO];
extern u16 __read_mostly tlb_lld_4m[NR_INFO];
extern u16 __read_mostly tlb_lld_1g[NR_INFO];

/*
 * CPU type and hardware bug flags. Kept separately for each CPU.
 * Members of this structure are referenced in head_32.S, so think twice
 * before touching them. [mj]
 */

struct cpuinfo_x86 {
	__u8			x86;		/* CPU family */
	__u8			x86_vendor;	/* CPU vendor */
	__u8			x86_model;
	__u8			x86_stepping;
#ifdef CONFIG_X86_64
	/* Number of 4K pages in DTLB/ITLB combined (in pages): */
	int			x86_tlbsize;
#endif
	__u8			x86_virt_bits;
	__u8			x86_phys_bits;
	/* CPUID returned core id bits: */
	__u8			x86_coreid_bits;
	__u8			cu_id;
	/* Max extended CPUID function supported: */
	__u32			extended_cpuid_level;
	/* Maximum supported CPUID level, -1=no CPUID: */
	int			cpuid_level;
	__u32			x86_capability[NCAPINTS + NBUGINTS];
	char			x86_vendor_id[16];
	char			x86_model_id[64];
	/* in KB - valid for CPUs which support this call: */
	unsigned int		x86_cache_size;
	int			x86_cache_alignment;	/* In bytes */
	/* Cache QoS architectural values: */
	int			x86_cache_max_rmid;	/* max index */
	int			x86_cache_occ_scale;	/* scale to bytes */
	int			x86_power;
	unsigned long		loops_per_jiffy;
	/* cpuid returned max cores value: */
	u16			x86_max_cores;
	u16			apicid;
	u16			initial_apicid;
	u16			x86_clflush_size;
	/* number of cores as seen by the OS: */
	u16			booted_cores;
	/* Physical processor id: */
	u16			phys_proc_id;
	/* Logical processor id: */
	u16			logical_proc_id;
	/* Core id: */
	u16			cpu_core_id;
	/* Index into per_cpu list: */
	u16			cpu_index;
	u32			microcode;
	unsigned		initialized : 1;
} __randomize_layout;

struct cpuid_regs {
	u32 eax, ebx, ecx, edx;
};

enum cpuid_regs_idx {
	CPUID_EAX	= 0,
	CPUID_EBX,
	CPUID_ECX,
	CPUID_EDX,
};

#define X86_VENDOR_INTEL	0
#define X86_VENDOR_CYRIX	1
#define X86_VENDOR_AMD		2
#define X86_VENDOR_UMC		3
#define X86_VENDOR_CENTAUR	5
#define X86_VENDOR_TRANSMETA	7
#define X86_VENDOR_NSC		8
#define X86_VENDOR_NUM		9

#define X86_VENDOR_UNKNOWN	0xff

/*
 * capabilities of CPUs
 */
extern struct cpuinfo_x86	boot_cpu_data;
extern struct cpuinfo_x86	new_cpu_data;

extern struct x86_hw_tss	doublefault_tss;
extern __u32			cpu_caps_cleared[NCAPINTS + NBUGINTS];
extern __u32			cpu_caps_set[NCAPINTS + NBUGINTS];

#ifdef CONFIG_SMP
DECLARE_PER_CPU_READ_MOSTLY(struct cpuinfo_x86, cpu_info);
#define cpu_data(cpu)		per_cpu(cpu_info, cpu)
#else
#define cpu_info		boot_cpu_data
#define cpu_data(cpu)		boot_cpu_data
#endif

extern const struct seq_operations cpuinfo_op;

#define cache_line_size()	(boot_cpu_data.x86_cache_alignment)

extern void cpu_detect(struct cpuinfo_x86 *c);

extern void early_cpu_init(void);
extern void identify_boot_cpu(void);
extern void identify_secondary_cpu(struct cpuinfo_x86 *);
extern void print_cpu_info(struct cpuinfo_x86 *);
void print_cpu_msr(struct cpuinfo_x86 *);

#ifdef CONFIG_X86_32
extern int have_cpuid_p(void);
#else
static inline int have_cpuid_p(void)
{
	return 1;
}
#endif
static inline void native_cpuid(unsigned int *eax, unsigned int *ebx,
				unsigned int *ecx, unsigned int *edx)
{
	/* ecx is often an input as well as an output. */
	asm volatile("cpuid"
	    : "=a" (*eax),
	      "=b" (*ebx),
	      "=c" (*ecx),
	      "=d" (*edx)
	    : "0" (*eax), "2" (*ecx)
	    : "memory");
}

#define native_cpuid_reg(reg)					\
static inline unsigned int native_cpuid_##reg(unsigned int op)	\
{								\
	unsigned int eax = op, ebx, ecx = 0, edx;		\
								\
	native_cpuid(&eax, &ebx, &ecx, &edx);			\
								\
	return reg;						\
}

/*
 * Native CPUID functions returning a single datum.
 */
native_cpuid_reg(eax)
native_cpuid_reg(ebx)
native_cpuid_reg(ecx)
native_cpuid_reg(edx)

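/*
 * Usage sketch (illustrative): CPUID leaf 0 reports the maximum
 * supported standard leaf in EAX, so the single-datum helpers above can
 * be used as:
 *
 *	unsigned int max_leaf = native_cpuid_eax(0);
 */
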
/*
 * Friendlier CR3 helpers.
 */
static inline unsigned long read_cr3_pa(void)
{
	return __read_cr3() & CR3_ADDR_MASK;
}

static inline unsigned long native_read_cr3_pa(void)
{
	return __native_read_cr3() & CR3_ADDR_MASK;
}
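
/*
 * Usage sketch (illustrative): the physical address that read_cr3_pa()
 * returns can be converted back to the kernel virtual address of the
 * current page-table root through the direct mapping:
 *
 *	pgd_t *pgd = __va(read_cr3_pa());
 */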

static inline void load_cr3(pgd_t *pgdir)
{
	write_cr3(__sme_pa(pgdir));
}

/*
 * Note that while the legacy 'TSS' name comes from 'Task State Segment',
 * on modern x86 CPUs the TSS also holds information important to 64-bit mode,
 * unrelated to the task-switch mechanism:
 */
#ifdef CONFIG_X86_32
/* This is the TSS defined by the hardware. */
struct x86_hw_tss {
	unsigned short		back_link, __blh;
	unsigned long		sp0;
	unsigned short		ss0, __ss0h;
	unsigned long		sp1;

	/*
	 * We don't use ring 1, so ss1 is a convenient scratch space in
	 * the same cacheline as sp0. We use ss1 to cache the value in
	 * MSR_IA32_SYSENTER_CS. When we context switch
	 * MSR_IA32_SYSENTER_CS, we first check if the new value being
	 * written matches ss1, and, if it's not, then we wrmsr the new
	 * value and update ss1.
	 *
	 * The only reason we context switch MSR_IA32_SYSENTER_CS is
	 * that we set it to zero in vm86 tasks to avoid corrupting the
	 * stack if we were to go through the sysenter path from vm86
	 * mode.
	 */
	unsigned short		ss1;	/* MSR_IA32_SYSENTER_CS */

	unsigned short		__ss1h;
	unsigned long		sp2;
	unsigned short		ss2, __ss2h;
	unsigned long		__cr3;
	unsigned long		ip;
	unsigned long		flags;
	unsigned long		ax;
	unsigned long		cx;
	unsigned long		dx;
	unsigned long		bx;
	unsigned long		sp;
	unsigned long		bp;
	unsigned long		si;
	unsigned long		di;
	unsigned short		es, __esh;
	unsigned short		cs, __csh;
	unsigned short		ss, __ssh;
	unsigned short		ds, __dsh;
	unsigned short		fs, __fsh;
	unsigned short		gs, __gsh;
	unsigned short		ldt, __ldth;
	unsigned short		trace;
	unsigned short		io_bitmap_base;

} __attribute__((packed));
#else
struct x86_hw_tss {
	u32			reserved1;
	u64			sp0;

	/*
	 * We store cpu_current_top_of_stack in sp1 so it's always accessible.
	 * Linux does not use ring 1, so sp1 is not otherwise needed.
	 */
	u64			sp1;

	u64			sp2;
	u64			reserved2;
	u64			ist[7];
	u32			reserved3;
	u32			reserved4;
	u16			reserved5;
	u16			io_bitmap_base;

} __attribute__((packed));
#endif

/*
 * IO-bitmap sizes:
 */
#define IO_BITMAP_BITS			65536
#define IO_BITMAP_BYTES			(IO_BITMAP_BITS/8)
#define IO_BITMAP_LONGS			(IO_BITMAP_BYTES/sizeof(long))
#define IO_BITMAP_OFFSET		(offsetof(struct tss_struct, io_bitmap) - offsetof(struct tss_struct, x86_tss))
#define INVALID_IO_BITMAP_OFFSET	0x8000

struct entry_stack {
	unsigned long		words[64];
};

struct entry_stack_page {
	struct entry_stack stack;
} __aligned(PAGE_SIZE);

struct tss_struct {
	/*
	 * The fixed hardware portion. This must not cross a page boundary
	 * at risk of violating the SDM's advice and potentially triggering
	 * errata.
	 */
	struct x86_hw_tss	x86_tss;

	/*
	 * The extra 1 is there because the CPU will access an
	 * additional byte beyond the end of the IO permission
	 * bitmap. The extra byte must be all 1 bits, and must
	 * be within the limit.
	 */
	unsigned long		io_bitmap[IO_BITMAP_LONGS + 1];
} __aligned(PAGE_SIZE);

DECLARE_PER_CPU_PAGE_ALIGNED(struct tss_struct, cpu_tss_rw);

/*
 * sizeof(unsigned long) comes from the extra "long" at the end of the
 * io_bitmap.
 *
 * The -1 is because the segment base+limit should point to the address
 * of the last valid byte.
 */
#define __KERNEL_TSS_LIMIT	\
	(IO_BITMAP_OFFSET + IO_BITMAP_BYTES + sizeof(unsigned long) - 1)

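/*
 * Worked example (illustrative, using the definitions above): with
 * IO_BITMAP_BYTES = 65536/8 = 8192 and an 8-byte "long" on 64-bit, the
 * limit works out to IO_BITMAP_OFFSET + 8192 + 8 - 1.
 */
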
#ifdef CONFIG_X86_32
DECLARE_PER_CPU(unsigned long, cpu_current_top_of_stack);
#else
/* The RO copy can't be accessed with this_cpu_xyz(), so use the RW copy. */
#define cpu_current_top_of_stack cpu_tss_rw.x86_tss.sp1
#endif

/*
 * Save the original ist values for checking stack pointers during debugging
 */
struct orig_ist {
	unsigned long		ist[7];
};

#ifdef CONFIG_X86_64
DECLARE_PER_CPU(struct orig_ist, orig_ist);

union irq_stack_union {
	char irq_stack[IRQ_STACK_SIZE];
	/*
	 * GCC hardcodes the stack canary as %gs:40. Since the
	 * irq_stack is the object at %gs:0, we reserve the bottom
	 * 48 bytes of the irq stack for the canary.
	 */
	struct {
		char gs_base[40];
		unsigned long stack_canary;
	};
};
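
/*
 * Sanity-check sketch (illustrative): the layout above only works if the
 * canary really lands in the %gs:40 slot that GCC hardcodes, which could
 * be asserted at build time with something like:
 *
 *	BUILD_BUG_ON(offsetof(union irq_stack_union, stack_canary) != 40);
 */
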
DECLARE_PER_CPU_FIRST(union irq_stack_union, irq_stack_union) __visible;
DECLARE_INIT_PER_CPU(irq_stack_union);

static inline unsigned long cpu_kernelmode_gs_base(int cpu)
{
	return (unsigned long)per_cpu(irq_stack_union.gs_base, cpu);
}

DECLARE_PER_CPU(char *, irq_stack_ptr);
DECLARE_PER_CPU(unsigned int, irq_count);
extern asmlinkage void ignore_sysret(void);

#if IS_ENABLED(CONFIG_KVM)
/* Save actual FS/GS selectors and bases to current->thread */
void save_fsgs_for_kvm(void);
#endif
#else	/* X86_64 */
#ifdef CONFIG_STACKPROTECTOR
/*
 * Make sure the stack canary segment base is cache-line aligned:
 * "For Intel Atom processors, avoid non zero segment base address
 * that is not aligned to cache line boundary at all cost."
 * (Optim Ref Manual Assembly/Compiler Coding Rule 15.)
 */
struct stack_canary {
	char __pad[20];		/* canary at %gs:20 */
	unsigned long canary;
};
DECLARE_PER_CPU_ALIGNED(struct stack_canary, stack_canary);
#endif
/*
 * per-CPU IRQ handling stacks
 */
struct irq_stack {
	u32			stack[THREAD_SIZE/sizeof(u32)];
} __aligned(THREAD_SIZE);

DECLARE_PER_CPU(struct irq_stack *, hardirq_stack);
DECLARE_PER_CPU(struct irq_stack *, softirq_stack);
#endif	/* X86_64 */

extern unsigned int fpu_kernel_xstate_size;
extern unsigned int fpu_user_xstate_size;

struct perf_event;

typedef struct {
	unsigned long		seg;
} mm_segment_t;

struct thread_struct {
	/* Cached TLS descriptors: */
	struct desc_struct	tls_array[GDT_ENTRY_TLS_ENTRIES];
#ifdef CONFIG_X86_32
	unsigned long		sp0;
#endif
	unsigned long		sp;
#ifdef CONFIG_X86_32
	unsigned long		sysenter_cs;
#else
	unsigned short		es;
	unsigned short		ds;
	unsigned short		fsindex;
	unsigned short		gsindex;
#endif

#ifdef CONFIG_X86_64
	unsigned long		fsbase;
	unsigned long		gsbase;
#else
	/*
	 * XXX: this could presumably be unsigned short. Alternatively,
	 * 32-bit kernels could be taught to use fsindex instead.
	 */
	unsigned long		fs;
	unsigned long		gs;
#endif

	/* Save middle states of ptrace breakpoints */
	struct perf_event	*ptrace_bps[HBP_NUM];
	/* Debug status used for traps, single steps, etc... */
	unsigned long		debugreg6;
	/* Keep track of the exact dr7 value set by the user */
	unsigned long		ptrace_dr7;
	/* Fault info: */
	unsigned long		cr2;
	unsigned long		trap_nr;
	unsigned long		error_code;
#ifdef CONFIG_VM86
	/* Virtual 86 mode info */
	struct vm86		*vm86;
#endif
	/* IO permissions: */
	unsigned long		*io_bitmap_ptr;
	unsigned long		iopl;
	/* Max allowed port in the bitmap, in bytes: */
	unsigned		io_bitmap_max;

	mm_segment_t		addr_limit;

	unsigned int		sig_on_uaccess_err:1;
	unsigned int		uaccess_err:1;	/* uaccess failed */

	/* Floating point and extended processor state */
	struct fpu		fpu;
	/*
	 * WARNING: 'fpu' is dynamically-sized. It *MUST* be at
	 * the end.
	 */
};

/* Whitelist the FPU state from the task_struct for hardened usercopy. */
static inline void arch_thread_struct_whitelist(unsigned long *offset,
						unsigned long *size)
{
	*offset = offsetof(struct thread_struct, fpu.state);
	*size = fpu_kernel_xstate_size;
}

/*
 * Thread-synchronous status.
 *
 * This is different from the flags in that nobody else
 * ever touches our thread-synchronous status, so we don't
 * have to worry about atomic accesses.
 */
#define TS_COMPAT		0x0002	/* 32bit syscall active (64BIT)*/

/*
 * Set IOPL bits in EFLAGS from given mask
 */
static inline void native_set_iopl_mask(unsigned mask)
{
#ifdef CONFIG_X86_32
	unsigned int reg;

	asm volatile ("pushfl;"
		      "popl %0;"
		      "andl %1, %0;"
		      "orl %2, %0;"
		      "pushl %0;"
		      "popfl"
		      : "=&r" (reg)
		      : "i" (~X86_EFLAGS_IOPL), "r" (mask));
#endif
}

static inline void native_load_sp0(unsigned long sp0)
{
	this_cpu_write(cpu_tss_rw.x86_tss.sp0, sp0);
}

static inline void native_swapgs(void)
{
#ifdef CONFIG_X86_64
	asm volatile("swapgs" ::: "memory");
#endif
}

static inline unsigned long current_top_of_stack(void)
{
	/*
	 * We can't read directly from tss.sp0: sp0 on x86_32 is special in
	 * and around vm86 mode and sp0 on x86_64 is special because of the
	 * entry trampoline.
	 */
	return this_cpu_read_stable(cpu_current_top_of_stack);
}

static inline bool on_thread_stack(void)
{
	return (unsigned long)(current_top_of_stack() -
			       current_stack_pointer) < THREAD_SIZE;
}

#ifdef CONFIG_PARAVIRT
#include <asm/paravirt.h>
#else
#define __cpuid			native_cpuid

static inline void load_sp0(unsigned long sp0)
{
	native_load_sp0(sp0);
}

#define set_iopl_mask native_set_iopl_mask
#endif /* CONFIG_PARAVIRT */

/* Free all resources held by a thread. */
extern void release_thread(struct task_struct *);

unsigned long get_wchan(struct task_struct *p);

/*
 * Generic CPUID function
 * clear %ecx since some CPUs (Cyrix MII) do not set or clear %ecx
 * resulting in stale register contents being returned.
 */
static inline void cpuid(unsigned int op,
			 unsigned int *eax, unsigned int *ebx,
			 unsigned int *ecx, unsigned int *edx)
{
	*eax = op;
	*ecx = 0;
	__cpuid(eax, ebx, ecx, edx);
}

/* Some CPUID calls want 'count' to be placed in ecx */
static inline void cpuid_count(unsigned int op, int count,
			       unsigned int *eax, unsigned int *ebx,
			       unsigned int *ecx, unsigned int *edx)
{
	*eax = op;
	*ecx = count;
	__cpuid(eax, ebx, ecx, edx);
}
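
/*
 * Usage sketch (illustrative): leaf 0 returns the 12-byte vendor string
 * in EBX, EDX, ECX order, so it can be collected as:
 *
 *	unsigned int eax, vendor[3];
 *
 *	cpuid(0, &eax, &vendor[0], &vendor[2], &vendor[1]);
 *
 * after which vendor holds e.g. "GenuineIntel" (not NUL-terminated).
 */
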
/*
 * CPUID functions returning a single datum
 */
static inline unsigned int cpuid_eax(unsigned int op)
{
	unsigned int eax, ebx, ecx, edx;

	cpuid(op, &eax, &ebx, &ecx, &edx);

	return eax;
}

static inline unsigned int cpuid_ebx(unsigned int op)
{
	unsigned int eax, ebx, ecx, edx;

	cpuid(op, &eax, &ebx, &ecx, &edx);

	return ebx;
}

static inline unsigned int cpuid_ecx(unsigned int op)
{
	unsigned int eax, ebx, ecx, edx;

	cpuid(op, &eax, &ebx, &ecx, &edx);

	return ecx;
}

static inline unsigned int cpuid_edx(unsigned int op)
{
	unsigned int eax, ebx, ecx, edx;

	cpuid(op, &eax, &ebx, &ecx, &edx);

	return edx;
}

/* REP NOP (PAUSE) is a good thing to insert into busy-wait loops. */
static __always_inline void rep_nop(void)
{
	asm volatile("rep; nop" ::: "memory");
}

static __always_inline void cpu_relax(void)
{
	rep_nop();
}
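
/*
 * Usage sketch (illustrative): cpu_relax() belongs in busy-wait loops,
 * where PAUSE eases pipeline and hyperthread-sibling pressure:
 *
 *	while (!READ_ONCE(flag))
 *		cpu_relax();
 */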

/*
 * This function forces the icache and prefetched instruction stream to
 * catch up with reality in two very specific cases:
 *
 * a) Text was modified using one virtual address and is about to be executed
 *    from the same physical page at a different virtual address.
 *
 * b) Text was modified on a different CPU, may subsequently be
 *    executed on this CPU, and you want to make sure the new version
 *    gets executed. This generally means you're calling this in an IPI.
 *
 * If you're calling this for a different reason, you're probably doing
 * it wrong.
 */
Glauber de Oliveira Costa | 683e025 | 2008-01-30 13:31:27 +0100 | [diff] [blame] | 680 | static inline void sync_core(void) |
| 681 | { |
Andy Lutomirski | c198b12 | 2016-12-09 10:24:08 -0800 | [diff] [blame] | 682 | /* |
| 683 | * There are quite a few ways to do this. IRET-to-self is nice |
| 684 | * because it works on every CPU, at any CPL (so it's compatible |
| 685 | * with paravirtualization), and it never exits to a hypervisor. |
| 686 | * The only down sides are that it's a bit slow (it seems to be |
| 687 | * a bit more than 2x slower than the fastest options) and that |
| 688 | * it unmasks NMIs. The "push %cs" is needed because, in |
| 689 | * paravirtual environments, __KERNEL_CS may not be a valid CS |
| 690 | * value when we do IRET directly. |
| 691 | * |
| 692 | * In case NMI unmasking or performance ever becomes a problem, |
| 693 | * the next best option appears to be MOV-to-CR2 and an |
| 694 | * unconditional jump. That sequence also works on all CPUs, |
Juergen Gross | ecda85e | 2017-08-16 19:31:57 +0200 | [diff] [blame] | 695 | * but it will fault at CPL3 (i.e. Xen PV). |
Andy Lutomirski | c198b12 | 2016-12-09 10:24:08 -0800 | [diff] [blame] | 696 | * |
| 697 | * CPUID is the conventional way, but it's nasty: it doesn't |
| 698 | * exist on some 486-like CPUs, and it usually exits to a |
| 699 | * hypervisor. |
| 700 | * |
| 701 | * Like all of Linux's memory ordering operations, this is a |
| 702 | * compiler barrier as well. |
| 703 | */ |
Andy Lutomirski | 1c52d85 | 2016-12-09 10:24:05 -0800 | [diff] [blame] | 704 | #ifdef CONFIG_X86_32 |
Andy Lutomirski | c198b12 | 2016-12-09 10:24:08 -0800 | [diff] [blame] | 705 | asm volatile ( |
| 706 | "pushfl\n\t" |
| 707 | "pushl %%cs\n\t" |
| 708 | "pushl $1f\n\t" |
| 709 | "iret\n\t" |
| 710 | "1:" |
Josh Poimboeuf | f5caf62 | 2017-09-20 16:24:33 -0500 | [diff] [blame] | 711 | : ASM_CALL_CONSTRAINT : : "memory"); |
H. Peter Anvin | 45c39fb | 2012-11-28 11:50:30 -0800 | [diff] [blame] | 712 | #else |
Andy Lutomirski | c198b12 | 2016-12-09 10:24:08 -0800 | [diff] [blame] | 713 | unsigned int tmp; |
| 714 | |
| 715 | asm volatile ( |
Josh Poimboeuf | 76846bf | 2017-07-11 10:33:45 -0500 | [diff] [blame] | 716 | UNWIND_HINT_SAVE |
Andy Lutomirski | c198b12 | 2016-12-09 10:24:08 -0800 | [diff] [blame] | 717 | "mov %%ss, %0\n\t" |
| 718 | "pushq %q0\n\t" |
| 719 | "pushq %%rsp\n\t" |
| 720 | "addq $8, (%%rsp)\n\t" |
| 721 | "pushfq\n\t" |
| 722 | "mov %%cs, %0\n\t" |
| 723 | "pushq %q0\n\t" |
| 724 | "pushq $1f\n\t" |
| 725 | "iretq\n\t" |
Josh Poimboeuf | 76846bf | 2017-07-11 10:33:45 -0500 | [diff] [blame] | 726 | UNWIND_HINT_RESTORE |
Andy Lutomirski | c198b12 | 2016-12-09 10:24:08 -0800 | [diff] [blame] | 727 | "1:" |
Josh Poimboeuf | f5caf62 | 2017-09-20 16:24:33 -0500 | [diff] [blame] | 728 | : "=&r" (tmp), ASM_CALL_CONSTRAINT : : "cc", "memory"); |
Ben Hutchings | 5367b68 | 2009-09-10 02:53:50 +0100 | [diff] [blame] | 729 | #endif |
Glauber de Oliveira Costa | 683e025 | 2008-01-30 13:31:27 +0100 | [diff] [blame] | 730 | } |
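
/*
 * Usage sketch (illustrative): after cross-modifying kernel text, each
 * CPU that may run the old instruction stream can be made to serialize
 * via an IPI:
 *
 *	static void sync_core_ipi(void *info)
 *	{
 *		sync_core();
 *	}
 *
 *	on_each_cpu(sync_core_ipi, NULL, 1);
 */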

extern void select_idle_routine(const struct cpuinfo_x86 *c);
extern void amd_e400_c1e_apic_setup(void);

extern unsigned long		boot_option_idle_override;

enum idle_boot_override {IDLE_NO_OVERRIDE=0, IDLE_HALT, IDLE_NOMWAIT,
			 IDLE_POLL};

extern void enable_sep_cpu(void);
extern int sysenter_setup(void);

void early_trap_pf_init(void);

/* Defined in head.S */
extern struct desc_ptr		early_gdt_descr;

extern void switch_to_new_gdt(int);
extern void load_direct_gdt(int);
extern void load_fixmap_gdt(int);
extern void load_percpu_segment(int);
extern void cpu_init(void);

static inline unsigned long get_debugctlmsr(void)
{
	unsigned long debugctlmsr = 0;

#ifndef CONFIG_X86_DEBUGCTLMSR
	if (boot_cpu_data.x86 < 6)
		return 0;
#endif
	rdmsrl(MSR_IA32_DEBUGCTLMSR, debugctlmsr);

	return debugctlmsr;
}

static inline void update_debugctlmsr(unsigned long debugctlmsr)
{
#ifndef CONFIG_X86_DEBUGCTLMSR
	if (boot_cpu_data.x86 < 6)
		return;
#endif
	wrmsrl(MSR_IA32_DEBUGCTLMSR, debugctlmsr);
}

extern void set_task_blockstep(struct task_struct *task, bool on);

/* Boot loader type from the setup header: */
extern int			bootloader_type;
extern int			bootloader_version;

extern char			ignore_fpu_irq;

#define HAVE_ARCH_PICK_MMAP_LAYOUT 1
#define ARCH_HAS_PREFETCHW
#define ARCH_HAS_SPINLOCK_PREFETCH

#ifdef CONFIG_X86_32
# define BASE_PREFETCH		""
# define ARCH_HAS_PREFETCH
#else
# define BASE_PREFETCH		"prefetcht0 %P1"
#endif

/*
 * Prefetch instructions for Pentium III (+) and AMD Athlon (+)
 *
 * It's not worth caring about 3dnow prefetches for the K6
 * because they are microcoded there and very slow.
 */
static inline void prefetch(const void *x)
{
	alternative_input(BASE_PREFETCH, "prefetchnta %P1",
			  X86_FEATURE_XMM,
			  "m" (*(const char *)x));
}

/*
 * 3dnow prefetch to get an exclusive cache line.
 * Useful for spinlocks to avoid one state transition in the
 * cache coherency protocol:
 */
static inline void prefetchw(const void *x)
{
	alternative_input(BASE_PREFETCH, "prefetchw %P1",
			  X86_FEATURE_3DNOWPREFETCH,
			  "m" (*(const char *)x));
}

static inline void spin_lock_prefetch(const void *x)
{
	prefetchw(x);
}
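
/*
 * Usage sketch (illustrative): prefetch() is typically issued one node
 * ahead while walking a linked structure, with process() standing in
 * for the per-node work:
 *
 *	for (pos = head->next; pos != head; pos = pos->next) {
 *		prefetch(pos->next);
 *		process(pos);
 *	}
 */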

#define TOP_OF_INIT_STACK ((unsigned long)&init_stack + sizeof(init_stack) - \
			   TOP_OF_KERNEL_STACK_PADDING)

#define task_top_of_stack(task) ((unsigned long)(task_pt_regs(task) + 1))

#define task_pt_regs(task) \
({									\
	unsigned long __ptr = (unsigned long)task_stack_page(task);	\
	__ptr += THREAD_SIZE - TOP_OF_KERNEL_STACK_PADDING;		\
	((struct pt_regs *)__ptr) - 1;					\
})

#ifdef CONFIG_X86_32
/*
 * User space process size: 3GB (default).
 */
#define IA32_PAGE_OFFSET	PAGE_OFFSET
#define TASK_SIZE		PAGE_OFFSET
#define TASK_SIZE_LOW		TASK_SIZE
#define TASK_SIZE_MAX		TASK_SIZE
#define DEFAULT_MAP_WINDOW	TASK_SIZE
#define STACK_TOP		TASK_SIZE
#define STACK_TOP_MAX		STACK_TOP

#define INIT_THREAD  {							  \
	.sp0			= TOP_OF_INIT_STACK,			  \
	.sysenter_cs		= __KERNEL_CS,				  \
	.io_bitmap_ptr		= NULL,					  \
	.addr_limit		= KERNEL_DS,				  \
}

#define KSTK_ESP(task)		(task_pt_regs(task)->sp)

#else
/*
 * User space process size. This is the first address outside the user range.
 * There are a few constraints that determine this:
 *
 * On Intel CPUs, if a SYSCALL instruction is at the highest canonical
 * address, then that syscall will enter the kernel with a
 * non-canonical return address, and SYSRET will explode dangerously.
 * We avoid this particular problem by preventing anything executable
 * from being mapped at the maximum canonical address.
 *
 * On AMD CPUs in the Ryzen family, there's a nasty bug in which the
 * CPUs malfunction if they execute code from the highest canonical page.
 * They'll speculate right off the end of the canonical space, and
 * bad things happen. This is worked around in the same way as the
 * Intel problem.
 *
 * With page table isolation enabled, we map the LDT in ... [stay tuned]
 */
#define TASK_SIZE_MAX	((1UL << __VIRTUAL_MASK_SHIFT) - PAGE_SIZE)

#define DEFAULT_MAP_WINDOW	((1UL << 47) - PAGE_SIZE)

/*
 * This decides where the kernel will search for a free chunk of vm
 * space during mmap's.
 */
#define IA32_PAGE_OFFSET	((current->personality & ADDR_LIMIT_3GB) ? \
					0xc0000000 : 0xFFFFe000)

#define TASK_SIZE_LOW		(test_thread_flag(TIF_ADDR32) ? \
					IA32_PAGE_OFFSET : DEFAULT_MAP_WINDOW)
#define TASK_SIZE		(test_thread_flag(TIF_ADDR32) ? \
					IA32_PAGE_OFFSET : TASK_SIZE_MAX)
#define TASK_SIZE_OF(child)	((test_tsk_thread_flag(child, TIF_ADDR32)) ? \
					IA32_PAGE_OFFSET : TASK_SIZE_MAX)

#define STACK_TOP		TASK_SIZE_LOW
#define STACK_TOP_MAX		TASK_SIZE_MAX

#define INIT_THREAD  {						\
	.addr_limit		= KERNEL_DS,			\
}

extern unsigned long KSTK_ESP(struct task_struct *task);

#endif /* CONFIG_X86_64 */

extern void start_thread(struct pt_regs *regs, unsigned long new_ip,
					       unsigned long new_sp);

/*
 * This decides where the kernel will search for a free chunk of vm
 * space during mmap's.
 */
#define __TASK_UNMAPPED_BASE(task_size)	(PAGE_ALIGN(task_size / 3))
#define TASK_UNMAPPED_BASE		__TASK_UNMAPPED_BASE(TASK_SIZE_LOW)

#define KSTK_EIP(task)		(task_pt_regs(task)->ip)

/* Get/set a process' ability to use the timestamp counter instruction */
#define GET_TSC_CTL(adr)	get_tsc_mode((adr))
#define SET_TSC_CTL(val)	set_tsc_mode((val))

extern int get_tsc_mode(unsigned long adr);
extern int set_tsc_mode(unsigned int val);

DECLARE_PER_CPU(u64, msr_misc_features_shadow);

/* Register/unregister a process' MPX related resource */
#define MPX_ENABLE_MANAGEMENT()		mpx_enable_management()
#define MPX_DISABLE_MANAGEMENT()	mpx_disable_management()

#ifdef CONFIG_X86_INTEL_MPX
extern int mpx_enable_management(void);
extern int mpx_disable_management(void);
#else
static inline int mpx_enable_management(void)
{
	return -EINVAL;
}
static inline int mpx_disable_management(void)
{
	return -EINVAL;
}
#endif /* CONFIG_X86_INTEL_MPX */

#ifdef CONFIG_CPU_SUP_AMD
extern u16 amd_get_nb_id(int cpu);
extern u32 amd_get_nodes_per_socket(void);
#else
static inline u16 amd_get_nb_id(int cpu)		{ return 0; }
static inline u32 amd_get_nodes_per_socket(void)	{ return 0; }
#endif

static inline uint32_t hypervisor_cpuid_base(const char *sig, uint32_t leaves)
{
	uint32_t base, eax, signature[3];

	for (base = 0x40000000; base < 0x40010000; base += 0x100) {
		cpuid(base, &eax, &signature[0], &signature[1], &signature[2]);

		if (!memcmp(sig, signature, 12) &&
		    (leaves == 0 || ((eax - base) >= leaves)))
			return base;
	}

	return 0;
}
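
/*
 * Usage sketch (illustrative): a guest can probe for a specific
 * hypervisor by its CPUID signature; KVM, for example, advertises
 * "KVMKVMKVM\0\0\0":
 *
 *	if (hypervisor_cpuid_base("KVMKVMKVM\0\0\0", 0))
 *		pr_info("running as a KVM guest\n");
 */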

extern unsigned long arch_align_stack(unsigned long sp);
extern void free_init_pages(char *what, unsigned long begin, unsigned long end);

void default_idle(void);
#ifdef CONFIG_XEN
bool xen_set_default_idle(void);
#else
#define xen_set_default_idle 0
#endif

void stop_this_cpu(void *dummy);
void df_debug(struct pt_regs *regs, long error_code);
void microcode_check(void);
#endif /* _ASM_X86_PROCESSOR_H */