Greg Kroah-Hartman | b244131 | 2017-11-01 15:07:57 +0100 | [diff] [blame] | 1 | // SPDX-License-Identifier: GPL-2.0 |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 2 | /* |
| 3 | * Xen SMP support |
| 4 | * |
| 5 | * This file implements the Xen versions of smp_ops. SMP under Xen is |
| 6 | * very straightforward. Bringing a CPU up is simply a matter of |
| 7 | * loading its initial context and setting it running. |
| 8 | * |
| 9 | * IPIs are handled through the Xen event mechanism. |
| 10 | * |
| 11 | * Because virtual CPUs can be scheduled onto any real CPU, there's no |
| 12 | * useful topology information for the kernel to make use of. As a |
| 13 | * result, all CPUs are treated as if they're single-core and |
| 14 | * single-threaded. |
| 15 | */ |
| 16 | #include <linux/sched.h> |
Andy Lutomirski | f16b3da | 2017-11-02 00:59:12 -0700 | [diff] [blame] | 17 | #include <linux/sched/task_stack.h> |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 18 | #include <linux/err.h> |
| 19 | #include <linux/slab.h> |
| 20 | #include <linux/smp.h> |
| 21 | #include <linux/irq_work.h> |
| 22 | #include <linux/tick.h> |
| 23 | #include <linux/nmi.h> |
Juergen Gross | c185dde | 2017-07-05 16:05:20 +0200 | [diff] [blame] | 24 | #include <linux/cpuhotplug.h> |
Christophe Leroy | 977e4be | 2018-10-20 09:26:49 +0200 | [diff] [blame] | 25 | #include <linux/stackprotector.h> |
Mike Rapoport | 65fddcf | 2020-06-08 21:32:42 -0700 | [diff] [blame] | 26 | #include <linux/pgtable.h> |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 27 | |
| 28 | #include <asm/paravirt.h> |
Thomas Gleixner | 2f6474e | 2020-05-21 22:05:26 +0200 | [diff] [blame] | 29 | #include <asm/idtentry.h> |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 30 | #include <asm/desc.h> |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 31 | #include <asm/cpu.h> |
| 32 | |
| 33 | #include <xen/interface/xen.h> |
| 34 | #include <xen/interface/vcpu.h> |
| 35 | #include <xen/interface/xenpmu.h> |
| 36 | |
Juergen Gross | 74899d9 | 2018-06-21 10:43:31 +0200 | [diff] [blame] | 37 | #include <asm/spec-ctrl.h> |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 38 | #include <asm/xen/interface.h> |
| 39 | #include <asm/xen/hypercall.h> |
| 40 | |
| 41 | #include <xen/xen.h> |
| 42 | #include <xen/page.h> |
| 43 | #include <xen/events.h> |
| 44 | |
| 45 | #include <xen/hvc-console.h> |
| 46 | #include "xen-ops.h" |
| 47 | #include "mmu.h" |
| 48 | #include "smp.h" |
| 49 | #include "pmu.h" |
| 50 | |
| 51 | cpumask_var_t xen_cpu_initialized_map; |
| 52 | |
| 53 | static DEFINE_PER_CPU(struct xen_common_irq, xen_irq_work) = { .irq = -1 }; |
| 54 | static DEFINE_PER_CPU(struct xen_common_irq, xen_pmu_irq) = { .irq = -1 }; |
| 55 | |
| 56 | static irqreturn_t xen_irq_work_interrupt(int irq, void *dev_id); |
Miroslav Benes | c3881eb | 2020-03-26 10:26:03 +0100 | [diff] [blame] | 57 | void asm_cpu_bringup_and_idle(void); |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 58 | |
| 59 | static void cpu_bringup(void) |
| 60 | { |
| 61 | int cpu; |
| 62 | |
Thomas Gleixner | 7652ac9 | 2019-07-10 21:42:46 +0200 | [diff] [blame] | 63 | cr4_init(); |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 64 | cpu_init(); |
| 65 | touch_softlockup_watchdog(); |
| 66 | preempt_disable(); |
| 67 | |
| 68 | /* PVH runs in ring 0 and allows us to do native syscalls. Yay! */ |
| 69 | if (!xen_feature(XENFEAT_supervisor_mode_kernel)) { |
| 70 | xen_enable_sysenter(); |
| 71 | xen_enable_syscall(); |
| 72 | } |
| 73 | cpu = smp_processor_id(); |
| 74 | smp_store_cpu_info(cpu); |
| 75 | cpu_data(cpu).x86_max_cores = 1; |
| 76 | set_cpu_sibling_map(cpu); |
| 77 | |
Juergen Gross | 74899d9 | 2018-06-21 10:43:31 +0200 | [diff] [blame] | 78 | speculative_store_bypass_ht_init(); |
| 79 | |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 80 | xen_setup_cpu_clockevents(); |
| 81 | |
| 82 | notify_cpu_starting(cpu); |
| 83 | |
| 84 | set_cpu_online(cpu, true); |
| 85 | |
| 86 | cpu_set_state_online(cpu); /* Implies full memory barrier. */ |
| 87 | |
| 88 | /* We can take interrupts now: we're officially "up". */ |
| 89 | local_irq_enable(); |
| 90 | } |
| 91 | |
| 92 | asmlinkage __visible void cpu_bringup_and_idle(void) |
| 93 | { |
| 94 | cpu_bringup(); |
| 95 | cpu_startup_entry(CPUHP_AP_ONLINE_IDLE); |
| 96 | } |
| 97 | |
| 98 | void xen_smp_intr_free_pv(unsigned int cpu) |
| 99 | { |
| 100 | if (per_cpu(xen_irq_work, cpu).irq >= 0) { |
| 101 | unbind_from_irqhandler(per_cpu(xen_irq_work, cpu).irq, NULL); |
| 102 | per_cpu(xen_irq_work, cpu).irq = -1; |
| 103 | kfree(per_cpu(xen_irq_work, cpu).name); |
| 104 | per_cpu(xen_irq_work, cpu).name = NULL; |
| 105 | } |
| 106 | |
| 107 | if (per_cpu(xen_pmu_irq, cpu).irq >= 0) { |
| 108 | unbind_from_irqhandler(per_cpu(xen_pmu_irq, cpu).irq, NULL); |
| 109 | per_cpu(xen_pmu_irq, cpu).irq = -1; |
| 110 | kfree(per_cpu(xen_pmu_irq, cpu).name); |
| 111 | per_cpu(xen_pmu_irq, cpu).name = NULL; |
| 112 | } |
| 113 | } |
| 114 | |
| 115 | int xen_smp_intr_init_pv(unsigned int cpu) |
| 116 | { |
| 117 | int rc; |
| 118 | char *callfunc_name, *pmu_name; |
| 119 | |
| 120 | callfunc_name = kasprintf(GFP_KERNEL, "irqwork%d", cpu); |
| 121 | rc = bind_ipi_to_irqhandler(XEN_IRQ_WORK_VECTOR, |
| 122 | cpu, |
| 123 | xen_irq_work_interrupt, |
| 124 | IRQF_PERCPU|IRQF_NOBALANCING, |
| 125 | callfunc_name, |
| 126 | NULL); |
| 127 | if (rc < 0) |
| 128 | goto fail; |
| 129 | per_cpu(xen_irq_work, cpu).irq = rc; |
| 130 | per_cpu(xen_irq_work, cpu).name = callfunc_name; |
| 131 | |
| 132 | if (is_xen_pmu(cpu)) { |
| 133 | pmu_name = kasprintf(GFP_KERNEL, "pmu%d", cpu); |
| 134 | rc = bind_virq_to_irqhandler(VIRQ_XENPMU, cpu, |
| 135 | xen_pmu_irq_handler, |
| 136 | IRQF_PERCPU|IRQF_NOBALANCING, |
| 137 | pmu_name, NULL); |
| 138 | if (rc < 0) |
| 139 | goto fail; |
| 140 | per_cpu(xen_pmu_irq, cpu).irq = rc; |
| 141 | per_cpu(xen_pmu_irq, cpu).name = pmu_name; |
| 142 | } |
| 143 | |
| 144 | return 0; |
| 145 | |
| 146 | fail: |
| 147 | xen_smp_intr_free_pv(cpu); |
| 148 | return rc; |
| 149 | } |
| 150 | |
| 151 | static void __init xen_fill_possible_map(void) |
| 152 | { |
| 153 | int i, rc; |
| 154 | |
| 155 | if (xen_initial_domain()) |
| 156 | return; |
| 157 | |
| 158 | for (i = 0; i < nr_cpu_ids; i++) { |
| 159 | rc = HYPERVISOR_vcpu_op(VCPUOP_is_up, i, NULL); |
| 160 | if (rc >= 0) { |
| 161 | num_processors++; |
| 162 | set_cpu_possible(i, true); |
| 163 | } |
| 164 | } |
| 165 | } |
| 166 | |
| 167 | static void __init xen_filter_cpu_maps(void) |
| 168 | { |
| 169 | int i, rc; |
| 170 | unsigned int subtract = 0; |
| 171 | |
| 172 | if (!xen_initial_domain()) |
| 173 | return; |
| 174 | |
| 175 | num_processors = 0; |
| 176 | disabled_cpus = 0; |
| 177 | for (i = 0; i < nr_cpu_ids; i++) { |
| 178 | rc = HYPERVISOR_vcpu_op(VCPUOP_is_up, i, NULL); |
| 179 | if (rc >= 0) { |
| 180 | num_processors++; |
| 181 | set_cpu_possible(i, true); |
| 182 | } else { |
| 183 | set_cpu_possible(i, false); |
| 184 | set_cpu_present(i, false); |
| 185 | subtract++; |
| 186 | } |
| 187 | } |
| 188 | #ifdef CONFIG_HOTPLUG_CPU |
| 189 | /* This is akin to using 'nr_cpus' on the Linux command line. |
| 190 | * Which is OK as when we use 'dom0_max_vcpus=X' we can only |
| 191 | * have up to X, while nr_cpu_ids is greater than X. This |
| 192 | * normally is not a problem, except when CPU hotplugging |
| 193 | * is involved and then there might be more than X CPUs |
| 194 | * in the guest - which will not work as there is no |
| 195 | * hypercall to expand the max number of VCPUs an already |
| 196 | * running guest has. So cap it up to X. */ |
| 197 | if (subtract) |
| 198 | nr_cpu_ids = nr_cpu_ids - subtract; |
| 199 | #endif |
| 200 | |
| 201 | } |
| 202 | |
| 203 | static void __init xen_pv_smp_prepare_boot_cpu(void) |
| 204 | { |
| 205 | BUG_ON(smp_processor_id() != 0); |
| 206 | native_smp_prepare_boot_cpu(); |
| 207 | |
| 208 | if (!xen_feature(XENFEAT_writable_page_tables)) |
| 209 | /* We've switched to the "real" per-cpu gdt, so make |
| 210 | * sure the old memory can be recycled. */ |
| 211 | make_lowmem_page_readwrite(xen_initial_gdt); |
| 212 | |
| 213 | #ifdef CONFIG_X86_32 |
| 214 | /* |
| 215 | * Xen starts us with XEN_FLAT_RING1_DS, but linux code |
| 216 | * expects __USER_DS |
| 217 | */ |
| 218 | loadsegment(ds, __USER_DS); |
| 219 | loadsegment(es, __USER_DS); |
| 220 | #endif |
| 221 | |
| 222 | xen_filter_cpu_maps(); |
| 223 | xen_setup_vcpu_info_placement(); |
| 224 | |
| 225 | /* |
| 226 | * The alternative logic (which patches the unlock/lock) runs before |
| 227 | * the smp bootup up code is activated. Hence we need to set this up |
| 228 | * the core kernel is being patched. Otherwise we will have only |
| 229 | * modules patched but not core code. |
| 230 | */ |
| 231 | xen_init_spinlocks(); |
| 232 | } |
| 233 | |
Vitaly Kuznetsov | 8cb6de3 | 2017-03-14 18:35:56 +0100 | [diff] [blame] | 234 | static void __init xen_pv_smp_prepare_cpus(unsigned int max_cpus) |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 235 | { |
| 236 | unsigned cpu; |
| 237 | unsigned int i; |
| 238 | |
| 239 | if (skip_ioapic_setup) { |
| 240 | char *m = (max_cpus == 0) ? |
| 241 | "The nosmp parameter is incompatible with Xen; " \ |
| 242 | "use Xen dom0_max_vcpus=1 parameter" : |
| 243 | "The noapic parameter is incompatible with Xen"; |
| 244 | |
| 245 | xen_raw_printk(m); |
| 246 | panic(m); |
| 247 | } |
| 248 | xen_init_lock_cpu(0); |
| 249 | |
| 250 | smp_store_boot_cpu_info(); |
| 251 | cpu_data(0).x86_max_cores = 1; |
| 252 | |
| 253 | for_each_possible_cpu(i) { |
| 254 | zalloc_cpumask_var(&per_cpu(cpu_sibling_map, i), GFP_KERNEL); |
| 255 | zalloc_cpumask_var(&per_cpu(cpu_core_map, i), GFP_KERNEL); |
Len Brown | 2e4c54d | 2019-05-13 13:58:56 -0400 | [diff] [blame] | 256 | zalloc_cpumask_var(&per_cpu(cpu_die_map, i), GFP_KERNEL); |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 257 | zalloc_cpumask_var(&per_cpu(cpu_llc_shared_map, i), GFP_KERNEL); |
| 258 | } |
| 259 | set_cpu_sibling_map(0); |
| 260 | |
Juergen Gross | 74899d9 | 2018-06-21 10:43:31 +0200 | [diff] [blame] | 261 | speculative_store_bypass_ht_init(); |
| 262 | |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 263 | xen_pmu_init(0); |
| 264 | |
Boris Ostrovsky | f31b969 | 2017-04-26 09:42:48 -0400 | [diff] [blame] | 265 | if (xen_smp_intr_init(0) || xen_smp_intr_init_pv(0)) |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 266 | BUG(); |
| 267 | |
| 268 | if (!alloc_cpumask_var(&xen_cpu_initialized_map, GFP_KERNEL)) |
| 269 | panic("could not allocate xen_cpu_initialized_map\n"); |
| 270 | |
| 271 | cpumask_copy(xen_cpu_initialized_map, cpumask_of(0)); |
| 272 | |
| 273 | /* Restrict the possible_map according to max_cpus. */ |
| 274 | while ((num_possible_cpus() > 1) && (num_possible_cpus() > max_cpus)) { |
| 275 | for (cpu = nr_cpu_ids - 1; !cpu_possible(cpu); cpu--) |
| 276 | continue; |
| 277 | set_cpu_possible(cpu, false); |
| 278 | } |
| 279 | |
| 280 | for_each_possible_cpu(cpu) |
| 281 | set_cpu_present(cpu, true); |
| 282 | } |
| 283 | |
| 284 | static int |
| 285 | cpu_initialize_context(unsigned int cpu, struct task_struct *idle) |
| 286 | { |
| 287 | struct vcpu_guest_context *ctxt; |
| 288 | struct desc_struct *gdt; |
| 289 | unsigned long gdt_mfn; |
| 290 | |
| 291 | /* used to tell cpu_init() that it can proceed with initialization */ |
| 292 | cpumask_set_cpu(cpu, cpu_callout_mask); |
| 293 | if (cpumask_test_and_set_cpu(cpu, xen_cpu_initialized_map)) |
| 294 | return 0; |
| 295 | |
| 296 | ctxt = kzalloc(sizeof(*ctxt), GFP_KERNEL); |
| 297 | if (ctxt == NULL) |
| 298 | return -ENOMEM; |
| 299 | |
| 300 | gdt = get_cpu_gdt_rw(cpu); |
| 301 | |
| 302 | #ifdef CONFIG_X86_32 |
| 303 | ctxt->user_regs.fs = __KERNEL_PERCPU; |
| 304 | ctxt->user_regs.gs = __KERNEL_STACK_CANARY; |
| 305 | #endif |
| 306 | memset(&ctxt->fpu_ctxt, 0, sizeof(ctxt->fpu_ctxt)); |
| 307 | |
Andy Lutomirski | f16b3da | 2017-11-02 00:59:12 -0700 | [diff] [blame] | 308 | /* |
| 309 | * Bring up the CPU in cpu_bringup_and_idle() with the stack |
| 310 | * pointing just below where pt_regs would be if it were a normal |
| 311 | * kernel entry. |
| 312 | */ |
Miroslav Benes | c3881eb | 2020-03-26 10:26:03 +0100 | [diff] [blame] | 313 | ctxt->user_regs.eip = (unsigned long)asm_cpu_bringup_and_idle; |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 314 | ctxt->flags = VGCF_IN_KERNEL; |
| 315 | ctxt->user_regs.eflags = 0x1000; /* IOPL_RING1 */ |
| 316 | ctxt->user_regs.ds = __USER_DS; |
| 317 | ctxt->user_regs.es = __USER_DS; |
| 318 | ctxt->user_regs.ss = __KERNEL_DS; |
Andy Lutomirski | f16b3da | 2017-11-02 00:59:12 -0700 | [diff] [blame] | 319 | ctxt->user_regs.cs = __KERNEL_CS; |
| 320 | ctxt->user_regs.esp = (unsigned long)task_pt_regs(idle); |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 321 | |
| 322 | xen_copy_trap_info(ctxt->trap_ctxt); |
| 323 | |
| 324 | ctxt->ldt_ents = 0; |
| 325 | |
| 326 | BUG_ON((unsigned long)gdt & ~PAGE_MASK); |
| 327 | |
| 328 | gdt_mfn = arbitrary_virt_to_mfn(gdt); |
| 329 | make_lowmem_page_readonly(gdt); |
| 330 | make_lowmem_page_readonly(mfn_to_virt(gdt_mfn)); |
| 331 | |
| 332 | ctxt->gdt_frames[0] = gdt_mfn; |
| 333 | ctxt->gdt_ents = GDT_ENTRIES; |
| 334 | |
Andy Lutomirski | f16b3da | 2017-11-02 00:59:12 -0700 | [diff] [blame] | 335 | /* |
| 336 | * Set SS:SP that Xen will use when entering guest kernel mode |
| 337 | * from guest user mode. Subsequent calls to load_sp0() can |
| 338 | * change this value. |
| 339 | */ |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 340 | ctxt->kernel_ss = __KERNEL_DS; |
Andy Lutomirski | f16b3da | 2017-11-02 00:59:12 -0700 | [diff] [blame] | 341 | ctxt->kernel_sp = task_top_of_stack(idle); |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 342 | |
| 343 | #ifdef CONFIG_X86_32 |
| 344 | ctxt->event_callback_cs = __KERNEL_CS; |
| 345 | ctxt->failsafe_callback_cs = __KERNEL_CS; |
| 346 | #else |
| 347 | ctxt->gs_base_kernel = per_cpu_offset(cpu); |
| 348 | #endif |
| 349 | ctxt->event_callback_eip = |
Thomas Gleixner | 2f6474e | 2020-05-21 22:05:26 +0200 | [diff] [blame] | 350 | (unsigned long)xen_asm_exc_xen_hypervisor_callback; |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 351 | ctxt->failsafe_callback_eip = |
| 352 | (unsigned long)xen_failsafe_callback; |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 353 | per_cpu(xen_cr3, cpu) = __pa(swapper_pg_dir); |
| 354 | |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 355 | ctxt->ctrlreg[3] = xen_pfn_to_cr3(virt_to_gfn(swapper_pg_dir)); |
| 356 | if (HYPERVISOR_vcpu_op(VCPUOP_initialise, xen_vcpu_nr(cpu), ctxt)) |
| 357 | BUG(); |
| 358 | |
| 359 | kfree(ctxt); |
| 360 | return 0; |
| 361 | } |
| 362 | |
Vitaly Kuznetsov | 8cb6de3 | 2017-03-14 18:35:56 +0100 | [diff] [blame] | 363 | static int xen_pv_cpu_up(unsigned int cpu, struct task_struct *idle) |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 364 | { |
| 365 | int rc; |
| 366 | |
Thomas Gleixner | 66c7ceb | 2019-04-14 18:00:04 +0200 | [diff] [blame] | 367 | rc = common_cpu_up(cpu, idle); |
| 368 | if (rc) |
| 369 | return rc; |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 370 | |
| 371 | xen_setup_runstate_info(cpu); |
| 372 | |
| 373 | /* |
| 374 | * PV VCPUs are always successfully taken down (see 'while' loop |
| 375 | * in xen_cpu_die()), so -EBUSY is an error. |
| 376 | */ |
| 377 | rc = cpu_check_up_prepare(cpu); |
| 378 | if (rc) |
| 379 | return rc; |
| 380 | |
| 381 | /* make sure interrupts start blocked */ |
| 382 | per_cpu(xen_vcpu, cpu)->evtchn_upcall_mask = 1; |
| 383 | |
| 384 | rc = cpu_initialize_context(cpu, idle); |
| 385 | if (rc) |
| 386 | return rc; |
| 387 | |
| 388 | xen_pmu_init(cpu); |
| 389 | |
| 390 | rc = HYPERVISOR_vcpu_op(VCPUOP_up, xen_vcpu_nr(cpu), NULL); |
| 391 | BUG_ON(rc); |
| 392 | |
| 393 | while (cpu_report_state(cpu) != CPU_ONLINE) |
| 394 | HYPERVISOR_sched_op(SCHEDOP_yield, NULL); |
| 395 | |
| 396 | return 0; |
| 397 | } |
| 398 | |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 399 | #ifdef CONFIG_HOTPLUG_CPU |
Vitaly Kuznetsov | 8cb6de3 | 2017-03-14 18:35:56 +0100 | [diff] [blame] | 400 | static int xen_pv_cpu_disable(void) |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 401 | { |
| 402 | unsigned int cpu = smp_processor_id(); |
| 403 | if (cpu == 0) |
| 404 | return -EBUSY; |
| 405 | |
| 406 | cpu_disable_common(); |
| 407 | |
| 408 | load_cr3(swapper_pg_dir); |
| 409 | return 0; |
| 410 | } |
| 411 | |
| 412 | static void xen_pv_cpu_die(unsigned int cpu) |
| 413 | { |
| 414 | while (HYPERVISOR_vcpu_op(VCPUOP_is_up, |
| 415 | xen_vcpu_nr(cpu), NULL)) { |
| 416 | __set_current_state(TASK_UNINTERRUPTIBLE); |
| 417 | schedule_timeout(HZ/10); |
| 418 | } |
| 419 | |
| 420 | if (common_cpu_die(cpu) == 0) { |
| 421 | xen_smp_intr_free(cpu); |
| 422 | xen_uninit_lock_cpu(cpu); |
| 423 | xen_teardown_timer(cpu); |
| 424 | xen_pmu_finish(cpu); |
| 425 | } |
| 426 | } |
| 427 | |
Vitaly Kuznetsov | 8cb6de3 | 2017-03-14 18:35:56 +0100 | [diff] [blame] | 428 | static void xen_pv_play_dead(void) /* used only with HOTPLUG_CPU */ |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 429 | { |
| 430 | play_dead_common(); |
| 431 | HYPERVISOR_vcpu_op(VCPUOP_down, xen_vcpu_nr(smp_processor_id()), NULL); |
| 432 | cpu_bringup(); |
| 433 | /* |
| 434 | * commit 4b0c0f294 (tick: Cleanup NOHZ per cpu data on cpu down) |
| 435 | * clears certain data that the cpu_idle loop (which called us |
| 436 | * and that we return from) expects. The only way to get that |
| 437 | * data back is to call: |
| 438 | */ |
| 439 | tick_nohz_idle_enter(); |
Rafael J. Wysocki | 0e77676 | 2018-04-05 18:58:27 +0200 | [diff] [blame] | 440 | tick_nohz_idle_stop_tick_protected(); |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 441 | |
Juergen Gross | c185dde | 2017-07-05 16:05:20 +0200 | [diff] [blame] | 442 | cpuhp_online_idle(CPUHP_AP_ONLINE_IDLE); |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 443 | } |
| 444 | |
| 445 | #else /* !CONFIG_HOTPLUG_CPU */ |
Vitaly Kuznetsov | 8cb6de3 | 2017-03-14 18:35:56 +0100 | [diff] [blame] | 446 | static int xen_pv_cpu_disable(void) |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 447 | { |
| 448 | return -ENOSYS; |
| 449 | } |
| 450 | |
| 451 | static void xen_pv_cpu_die(unsigned int cpu) |
| 452 | { |
| 453 | BUG(); |
| 454 | } |
| 455 | |
Vitaly Kuznetsov | 8cb6de3 | 2017-03-14 18:35:56 +0100 | [diff] [blame] | 456 | static void xen_pv_play_dead(void) |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 457 | { |
| 458 | BUG(); |
| 459 | } |
| 460 | |
| 461 | #endif |
| 462 | static void stop_self(void *v) |
| 463 | { |
| 464 | int cpu = smp_processor_id(); |
| 465 | |
| 466 | /* make sure we're not pinning something down */ |
| 467 | load_cr3(swapper_pg_dir); |
| 468 | /* should set up a minimal gdt */ |
| 469 | |
| 470 | set_cpu_online(cpu, false); |
| 471 | |
| 472 | HYPERVISOR_vcpu_op(VCPUOP_down, xen_vcpu_nr(cpu), NULL); |
| 473 | BUG(); |
| 474 | } |
| 475 | |
Vitaly Kuznetsov | 8cb6de3 | 2017-03-14 18:35:56 +0100 | [diff] [blame] | 476 | static void xen_pv_stop_other_cpus(int wait) |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 477 | { |
| 478 | smp_call_function(stop_self, NULL, wait); |
| 479 | } |
| 480 | |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 481 | static irqreturn_t xen_irq_work_interrupt(int irq, void *dev_id) |
| 482 | { |
| 483 | irq_enter(); |
| 484 | irq_work_run(); |
| 485 | inc_irq_stat(apic_irq_work_irqs); |
| 486 | irq_exit(); |
| 487 | |
| 488 | return IRQ_HANDLED; |
| 489 | } |
| 490 | |
| 491 | static const struct smp_ops xen_smp_ops __initconst = { |
| 492 | .smp_prepare_boot_cpu = xen_pv_smp_prepare_boot_cpu, |
Vitaly Kuznetsov | 8cb6de3 | 2017-03-14 18:35:56 +0100 | [diff] [blame] | 493 | .smp_prepare_cpus = xen_pv_smp_prepare_cpus, |
Ankur Arora | ae03900 | 2017-06-02 17:06:02 -0700 | [diff] [blame] | 494 | .smp_cpus_done = xen_smp_cpus_done, |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 495 | |
Vitaly Kuznetsov | 8cb6de3 | 2017-03-14 18:35:56 +0100 | [diff] [blame] | 496 | .cpu_up = xen_pv_cpu_up, |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 497 | .cpu_die = xen_pv_cpu_die, |
Vitaly Kuznetsov | 8cb6de3 | 2017-03-14 18:35:56 +0100 | [diff] [blame] | 498 | .cpu_disable = xen_pv_cpu_disable, |
| 499 | .play_dead = xen_pv_play_dead, |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 500 | |
Vitaly Kuznetsov | 8cb6de3 | 2017-03-14 18:35:56 +0100 | [diff] [blame] | 501 | .stop_other_cpus = xen_pv_stop_other_cpus, |
Vitaly Kuznetsov | 83b9679 | 2017-03-14 18:35:46 +0100 | [diff] [blame] | 502 | .smp_send_reschedule = xen_smp_send_reschedule, |
| 503 | |
| 504 | .send_call_func_ipi = xen_smp_send_call_function_ipi, |
| 505 | .send_call_func_single_ipi = xen_smp_send_call_function_single_ipi, |
| 506 | }; |
| 507 | |
| 508 | void __init xen_smp_init(void) |
| 509 | { |
| 510 | smp_ops = xen_smp_ops; |
| 511 | xen_fill_possible_map(); |
| 512 | } |