blob: 40270d7bc597fea3abbbbcd896b72c8f22e4e7cb [file] [log] [blame]
Thomas Gleixner20c8ccb2019-06-04 10:11:32 +02001// SPDX-License-Identifier: GPL-2.0-only
Eddie Dong97222cc2007-09-12 10:58:04 +03002
3/*
4 * Local APIC virtualization
5 *
6 * Copyright (C) 2006 Qumranet, Inc.
7 * Copyright (C) 2007 Novell
8 * Copyright (C) 2007 Intel
Nicolas Kaiser9611c182010-10-06 14:23:22 +02009 * Copyright 2009 Red Hat, Inc. and/or its affiliates.
Eddie Dong97222cc2007-09-12 10:58:04 +030010 *
11 * Authors:
12 * Dor Laor <dor.laor@qumranet.com>
13 * Gregory Haskins <ghaskins@novell.com>
14 * Yaozu (Eddie) Dong <eddie.dong@intel.com>
15 *
16 * Based on Xen 3.1 code, Copyright (c) 2004, Intel Corporation.
Eddie Dong97222cc2007-09-12 10:58:04 +030017 */
18
Avi Kivityedf88412007-12-16 11:02:48 +020019#include <linux/kvm_host.h>
Eddie Dong97222cc2007-09-12 10:58:04 +030020#include <linux/kvm.h>
21#include <linux/mm.h>
22#include <linux/highmem.h>
23#include <linux/smp.h>
24#include <linux/hrtimer.h>
25#include <linux/io.h>
Paul Gortmaker1767e932016-07-13 20:19:00 -040026#include <linux/export.h>
Roman Zippel6f6d6a12008-05-01 04:34:28 -070027#include <linux/math64.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090028#include <linux/slab.h>
Eddie Dong97222cc2007-09-12 10:58:04 +030029#include <asm/processor.h>
30#include <asm/msr.h>
31#include <asm/page.h>
32#include <asm/current.h>
33#include <asm/apicdef.h>
Marcelo Tosattid0659d92014-12-16 09:08:15 -050034#include <asm/delay.h>
Arun Sharma600634972011-07-26 16:09:06 -070035#include <linux/atomic.h>
Gleb Natapovc5cc4212012-08-05 15:58:30 +030036#include <linux/jump_label.h>
Marcelo Tosatti5fdbf972008-06-27 14:58:02 -030037#include "kvm_cache_regs.h"
Eddie Dong97222cc2007-09-12 10:58:04 +030038#include "irq.h"
彭浩(Richard)88197e62020-05-21 05:57:49 +000039#include "ioapic.h"
Marcelo Tosatti229456f2009-06-17 09:22:14 -030040#include "trace.h"
Gleb Natapovfc61b802009-07-05 17:39:35 +030041#include "x86.h"
Avi Kivity00b27a32011-11-23 16:30:32 +020042#include "cpuid.h"
Andrey Smetanin5c9194122015-11-10 15:36:34 +030043#include "hyperv.h"
Eddie Dong97222cc2007-09-12 10:58:04 +030044
Marcelo Tosattib682b812009-02-10 20:41:41 -020045#ifndef CONFIG_X86_64
46#define mod_64(x, y) ((x) - (y) * div64_u64(x, y))
47#else
48#define mod_64(x, y) ((x) % (y))
49#endif
50
Eddie Dong97222cc2007-09-12 10:58:04 +030051#define PRId64 "d"
52#define PRIx64 "llx"
53#define PRIu64 "u"
54#define PRIo64 "o"
55
Eddie Dong97222cc2007-09-12 10:58:04 +030056/* 14 is the version for Xeon and Pentium 8.4.8*/
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -050057#define APIC_VERSION (0x14UL | ((KVM_APIC_LVT_NUM - 1) << 16))
Eddie Dong97222cc2007-09-12 10:58:04 +030058#define LAPIC_MMIO_LENGTH (1 << 12)
59/* followed define is not in apicdef.h */
Eddie Dong97222cc2007-09-12 10:58:04 +030060#define MAX_APIC_VECTOR 256
Takuya Yoshikawaecba9a52012-09-05 19:30:01 +090061#define APIC_VECTORS_PER_REG 32
Eddie Dong97222cc2007-09-12 10:58:04 +030062
Wanpeng Lid0f5a862019-09-17 16:16:26 +080063static bool lapic_timer_advance_dynamic __read_mostly;
Wanpeng Lia0f00372019-09-26 08:54:03 +080064#define LAPIC_TIMER_ADVANCE_ADJUST_MIN 100 /* clock cycles */
65#define LAPIC_TIMER_ADVANCE_ADJUST_MAX 10000 /* clock cycles */
66#define LAPIC_TIMER_ADVANCE_NS_INIT 1000
67#define LAPIC_TIMER_ADVANCE_NS_MAX 5000
Wanpeng Li3b8a5df2018-10-09 09:02:08 +080068/* step-by-step approximation to mitigate fluctuation */
69#define LAPIC_TIMER_ADVANCE_ADJUST_STEP 8
70
Michael S. Tsirkina0c9a8222012-04-11 18:49:55 +030071static inline int apic_test_vector(int vec, void *bitmap)
72{
73 return test_bit(VEC_POS(vec), (bitmap) + REG_POS(vec));
74}
75
Yang Zhang10606912013-04-11 19:21:38 +080076bool kvm_apic_pending_eoi(struct kvm_vcpu *vcpu, int vector)
77{
78 struct kvm_lapic *apic = vcpu->arch.apic;
79
80 return apic_test_vector(vector, apic->regs + APIC_ISR) ||
81 apic_test_vector(vector, apic->regs + APIC_IRR);
82}
83
Michael S. Tsirkin8680b942012-06-24 19:24:26 +030084static inline int __apic_test_and_set_vector(int vec, void *bitmap)
85{
86 return __test_and_set_bit(VEC_POS(vec), (bitmap) + REG_POS(vec));
87}
88
89static inline int __apic_test_and_clear_vector(int vec, void *bitmap)
90{
91 return __test_and_clear_bit(VEC_POS(vec), (bitmap) + REG_POS(vec));
92}
93
Cun Li6e4e3b42021-01-11 23:24:35 +080094__read_mostly DEFINE_STATIC_KEY_DEFERRED_FALSE(apic_hw_disabled, HZ);
95__read_mostly DEFINE_STATIC_KEY_DEFERRED_FALSE(apic_sw_disabled, HZ);
Gleb Natapovf8c1ea12012-08-05 15:58:31 +030096
Eddie Dong97222cc2007-09-12 10:58:04 +030097static inline int apic_enabled(struct kvm_lapic *apic)
98{
Gleb Natapovc48f1492012-08-05 15:58:33 +030099 return kvm_apic_sw_enabled(apic) && kvm_apic_hw_enabled(apic);
Gleb Natapov54e98182012-08-05 15:58:32 +0300100}
101
Eddie Dong97222cc2007-09-12 10:58:04 +0300102#define LVT_MASK \
103 (APIC_LVT_MASKED | APIC_SEND_PENDING | APIC_VECTOR_MASK)
104
105#define LINT_MASK \
106 (LVT_MASK | APIC_MODE_MASK | APIC_INPUT_POLARITY | \
107 APIC_LVT_REMOTE_IRR | APIC_LVT_LEVEL_TRIGGER)
108
Radim Krčmář6e500432016-12-15 18:06:46 +0100109static inline u32 kvm_x2apic_id(struct kvm_lapic *apic)
110{
111 return apic->vcpu->vcpu_id;
112}
113
Paolo Bonzini199a8b82020-05-05 06:45:35 -0400114static bool kvm_can_post_timer_interrupt(struct kvm_vcpu *vcpu)
Wanpeng Li0c5f81d2019-07-06 09:26:51 +0800115{
116 return pi_inject_timer && kvm_vcpu_apicv_active(vcpu);
117}
Paolo Bonzini199a8b82020-05-05 06:45:35 -0400118
119bool kvm_can_use_hv_timer(struct kvm_vcpu *vcpu)
120{
121 return kvm_x86_ops.set_hv_timer
122 && !(kvm_mwait_in_guest(vcpu->kvm) ||
123 kvm_can_post_timer_interrupt(vcpu));
124}
125EXPORT_SYMBOL_GPL(kvm_can_use_hv_timer);
Wanpeng Li0c5f81d2019-07-06 09:26:51 +0800126
127static bool kvm_use_posted_timer_interrupt(struct kvm_vcpu *vcpu)
128{
129 return kvm_can_post_timer_interrupt(vcpu) && vcpu->mode == IN_GUEST_MODE;
130}
131
Radim Krčmáře45115b2016-07-12 22:09:19 +0200132static inline bool kvm_apic_map_get_logical_dest(struct kvm_apic_map *map,
133 u32 dest_id, struct kvm_lapic ***cluster, u16 *mask) {
134 switch (map->mode) {
135 case KVM_APIC_MODE_X2APIC: {
136 u32 offset = (dest_id >> 16) * 16;
Radim Krčmář0ca52e72016-07-12 22:09:20 +0200137 u32 max_apic_id = map->max_apic_id;
Radim Krčmář3548a252015-02-12 19:41:33 +0100138
Radim Krčmáře45115b2016-07-12 22:09:19 +0200139 if (offset <= max_apic_id) {
140 u8 cluster_size = min(max_apic_id - offset + 1, 16U);
Radim Krčmář3b5a5ff2015-02-12 19:41:34 +0100141
Paolo Bonzini1d487e92019-04-11 11:16:47 +0200142 offset = array_index_nospec(offset, map->max_apic_id + 1);
Radim Krčmáře45115b2016-07-12 22:09:19 +0200143 *cluster = &map->phys_map[offset];
144 *mask = dest_id & (0xffff >> (16 - cluster_size));
145 } else {
146 *mask = 0;
147 }
Radim Krčmář3b5a5ff2015-02-12 19:41:34 +0100148
Radim Krčmáře45115b2016-07-12 22:09:19 +0200149 return true;
150 }
151 case KVM_APIC_MODE_XAPIC_FLAT:
152 *cluster = map->xapic_flat_map;
153 *mask = dest_id & 0xff;
154 return true;
155 case KVM_APIC_MODE_XAPIC_CLUSTER:
Radim Krčmář444fdad2016-11-22 20:20:14 +0100156 *cluster = map->xapic_cluster_map[(dest_id >> 4) & 0xf];
Radim Krčmáře45115b2016-07-12 22:09:19 +0200157 *mask = dest_id & 0xf;
158 return true;
159 default:
160 /* Not optimized. */
161 return false;
162 }
Eddie Dong97222cc2007-09-12 10:58:04 +0300163}
164
Radim Krčmářaf1bae52016-07-12 22:09:30 +0200165static void kvm_apic_map_free(struct rcu_head *rcu)
Radim Krčmář3b5a5ff2015-02-12 19:41:34 +0100166{
Radim Krčmářaf1bae52016-07-12 22:09:30 +0200167 struct kvm_apic_map *map = container_of(rcu, struct kvm_apic_map, rcu);
Radim Krčmář3b5a5ff2015-02-12 19:41:34 +0100168
Radim Krčmářaf1bae52016-07-12 22:09:30 +0200169 kvfree(map);
Radim Krčmář3b5a5ff2015-02-12 19:41:34 +0100170}
171
Paolo Bonzini44d52712020-06-22 16:37:42 +0200172/*
173 * CLEAN -> DIRTY and UPDATE_IN_PROGRESS -> DIRTY changes happen without a lock.
174 *
175 * DIRTY -> UPDATE_IN_PROGRESS and UPDATE_IN_PROGRESS -> CLEAN happen with
176 * apic_map_lock_held.
177 */
178enum {
179 CLEAN,
180 UPDATE_IN_PROGRESS,
181 DIRTY
182};
183
Wanpeng Li4abaffc2020-02-26 10:41:02 +0800184void kvm_recalculate_apic_map(struct kvm *kvm)
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300185{
186 struct kvm_apic_map *new, *old = NULL;
187 struct kvm_vcpu *vcpu;
Marc Zyngier46808a42021-11-16 16:04:02 +0000188 unsigned long i;
Radim Krčmář6e500432016-12-15 18:06:46 +0100189 u32 max_id = 255; /* enough space for any xAPIC ID */
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300190
Paolo Bonzini44d52712020-06-22 16:37:42 +0200191 /* Read kvm->arch.apic_map_dirty before kvm->arch.apic_map. */
192 if (atomic_read_acquire(&kvm->arch.apic_map_dirty) == CLEAN)
Wanpeng Li4abaffc2020-02-26 10:41:02 +0800193 return;
Wanpeng Li4abaffc2020-02-26 10:41:02 +0800194
Sean Christophersonc2f79a62021-07-13 09:32:49 -0700195 WARN_ONCE(!irqchip_in_kernel(kvm),
196 "Dirty APIC map without an in-kernel local APIC");
197
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300198 mutex_lock(&kvm->arch.apic_map_lock);
Paolo Bonzini44d52712020-06-22 16:37:42 +0200199 /*
200 * Read kvm->arch.apic_map_dirty before kvm->arch.apic_map
201 * (if clean) or the APIC registers (if dirty).
202 */
203 if (atomic_cmpxchg_acquire(&kvm->arch.apic_map_dirty,
204 DIRTY, UPDATE_IN_PROGRESS) == CLEAN) {
Wanpeng Li4abaffc2020-02-26 10:41:02 +0800205 /* Someone else has updated the map. */
206 mutex_unlock(&kvm->arch.apic_map_lock);
207 return;
208 }
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300209
Radim Krčmář0ca52e72016-07-12 22:09:20 +0200210 kvm_for_each_vcpu(i, vcpu, kvm)
211 if (kvm_apic_present(vcpu))
Radim Krčmář6e500432016-12-15 18:06:46 +0100212 max_id = max(max_id, kvm_x2apic_id(vcpu->arch.apic));
Radim Krčmář0ca52e72016-07-12 22:09:20 +0200213
Michal Hockoa7c3e902017-05-08 15:57:09 -0700214 new = kvzalloc(sizeof(struct kvm_apic_map) +
Ben Gardon254272c2019-02-11 11:02:50 -0800215 sizeof(struct kvm_lapic *) * ((u64)max_id + 1),
216 GFP_KERNEL_ACCOUNT);
Radim Krčmář0ca52e72016-07-12 22:09:20 +0200217
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300218 if (!new)
219 goto out;
220
Radim Krčmář0ca52e72016-07-12 22:09:20 +0200221 new->max_apic_id = max_id;
222
Nadav Amit173beed2014-11-02 11:54:54 +0200223 kvm_for_each_vcpu(i, vcpu, kvm) {
224 struct kvm_lapic *apic = vcpu->arch.apic;
Radim Krčmáře45115b2016-07-12 22:09:19 +0200225 struct kvm_lapic **cluster;
226 u16 mask;
Radim Krčmář5bd5db32016-12-15 18:06:48 +0100227 u32 ldr;
228 u8 xapic_id;
229 u32 x2apic_id;
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300230
Radim Krčmářdf04d1d2015-01-29 22:33:35 +0100231 if (!kvm_apic_present(vcpu))
232 continue;
233
Radim Krčmář5bd5db32016-12-15 18:06:48 +0100234 xapic_id = kvm_xapic_id(apic);
235 x2apic_id = kvm_x2apic_id(apic);
236
237 /* Hotplug hack: see kvm_apic_match_physical_addr(), ... */
238 if ((apic_x2apic_mode(apic) || x2apic_id > 0xff) &&
239 x2apic_id <= new->max_apic_id)
240 new->phys_map[x2apic_id] = apic;
241 /*
242 * ... xAPIC ID of VCPUs with APIC ID > 0xff will wrap-around,
243 * prevent them from masking VCPUs with APIC ID <= 0xff.
244 */
245 if (!apic_x2apic_mode(apic) && !new->phys_map[xapic_id])
246 new->phys_map[xapic_id] = apic;
Radim Krčmář3548a252015-02-12 19:41:33 +0100247
Radim Krcmarb14c8762019-08-13 23:37:37 -0400248 if (!kvm_apic_sw_enabled(apic))
249 continue;
250
Radim Krčmář6e500432016-12-15 18:06:46 +0100251 ldr = kvm_lapic_get_reg(apic, APIC_LDR);
252
Radim Krčmář3b5a5ff2015-02-12 19:41:34 +0100253 if (apic_x2apic_mode(apic)) {
254 new->mode |= KVM_APIC_MODE_X2APIC;
255 } else if (ldr) {
256 ldr = GET_APIC_LOGICAL_ID(ldr);
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -0500257 if (kvm_lapic_get_reg(apic, APIC_DFR) == APIC_DFR_FLAT)
Radim Krčmář3b5a5ff2015-02-12 19:41:34 +0100258 new->mode |= KVM_APIC_MODE_XAPIC_FLAT;
259 else
260 new->mode |= KVM_APIC_MODE_XAPIC_CLUSTER;
261 }
262
Radim Krčmáře45115b2016-07-12 22:09:19 +0200263 if (!kvm_apic_map_get_logical_dest(new, ldr, &cluster, &mask))
Radim Krčmář3548a252015-02-12 19:41:33 +0100264 continue;
265
Radim Krčmáře45115b2016-07-12 22:09:19 +0200266 if (mask)
267 cluster[ffs(mask) - 1] = apic;
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300268 }
269out:
270 old = rcu_dereference_protected(kvm->arch.apic_map,
271 lockdep_is_held(&kvm->arch.apic_map_lock));
272 rcu_assign_pointer(kvm->arch.apic_map, new);
Wanpeng Li4abaffc2020-02-26 10:41:02 +0800273 /*
Paolo Bonzini44d52712020-06-22 16:37:42 +0200274 * Write kvm->arch.apic_map before clearing apic->apic_map_dirty.
275 * If another update has come in, leave it DIRTY.
Wanpeng Li4abaffc2020-02-26 10:41:02 +0800276 */
Paolo Bonzini44d52712020-06-22 16:37:42 +0200277 atomic_cmpxchg_release(&kvm->arch.apic_map_dirty,
278 UPDATE_IN_PROGRESS, CLEAN);
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300279 mutex_unlock(&kvm->arch.apic_map_lock);
280
281 if (old)
Radim Krčmářaf1bae52016-07-12 22:09:30 +0200282 call_rcu(&old->rcu, kvm_apic_map_free);
Yang Zhangc7c9c562013-01-25 10:18:51 +0800283
Steve Rutherfordb053b2a2015-07-29 23:32:35 -0700284 kvm_make_scan_ioapic_request(kvm);
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300285}
286
Nadav Amit1e1b6c22014-08-19 00:03:00 +0300287static inline void apic_set_spiv(struct kvm_lapic *apic, u32 val)
288{
Radim Krčmáře4627552014-10-30 15:06:45 +0100289 bool enabled = val & APIC_SPIV_APIC_ENABLED;
Nadav Amit1e1b6c22014-08-19 00:03:00 +0300290
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -0500291 kvm_lapic_set_reg(apic, APIC_SPIV, val);
Radim Krčmáře4627552014-10-30 15:06:45 +0100292
293 if (enabled != apic->sw_enabled) {
294 apic->sw_enabled = enabled;
Peng Haoeb1ff0a2018-12-04 17:42:50 +0800295 if (enabled)
Cun Li6e4e3b42021-01-11 23:24:35 +0800296 static_branch_slow_dec_deferred(&apic_sw_disabled);
Peng Haoeb1ff0a2018-12-04 17:42:50 +0800297 else
Cun Li6e4e3b42021-01-11 23:24:35 +0800298 static_branch_inc(&apic_sw_disabled.key);
Radim Krcmarb14c8762019-08-13 23:37:37 -0400299
Paolo Bonzini44d52712020-06-22 16:37:42 +0200300 atomic_set_release(&apic->vcpu->kvm->arch.apic_map_dirty, DIRTY);
Nadav Amit1e1b6c22014-08-19 00:03:00 +0300301 }
Vitaly Kuznetsov2f15d022021-04-22 11:29:48 +0200302
303 /* Check if there are APF page ready requests pending */
304 if (enabled)
305 kvm_make_request(KVM_REQ_APF_READY, apic->vcpu);
Nadav Amit1e1b6c22014-08-19 00:03:00 +0300306}
307
Radim Krčmářa92e2542016-07-12 22:09:22 +0200308static inline void kvm_apic_set_xapic_id(struct kvm_lapic *apic, u8 id)
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300309{
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -0500310 kvm_lapic_set_reg(apic, APIC_ID, id << 24);
Paolo Bonzini44d52712020-06-22 16:37:42 +0200311 atomic_set_release(&apic->vcpu->kvm->arch.apic_map_dirty, DIRTY);
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300312}
313
314static inline void kvm_apic_set_ldr(struct kvm_lapic *apic, u32 id)
315{
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -0500316 kvm_lapic_set_reg(apic, APIC_LDR, id);
Paolo Bonzini44d52712020-06-22 16:37:42 +0200317 atomic_set_release(&apic->vcpu->kvm->arch.apic_map_dirty, DIRTY);
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300318}
319
Wanpeng Liae6f2492020-08-19 16:55:26 +0800320static inline void kvm_apic_set_dfr(struct kvm_lapic *apic, u32 val)
321{
322 kvm_lapic_set_reg(apic, APIC_DFR, val);
323 atomic_set_release(&apic->vcpu->kvm->arch.apic_map_dirty, DIRTY);
324}
325
Dr. David Alan Gilberte872fa92017-11-17 11:52:49 +0000326static inline u32 kvm_apic_calc_x2apic_ldr(u32 id)
327{
328 return ((id >> 4) << 16) | (1 << (id & 0xf));
329}
330
Radim Krčmářa92e2542016-07-12 22:09:22 +0200331static inline void kvm_apic_set_x2apic_id(struct kvm_lapic *apic, u32 id)
Radim Krčmář257b9a52015-05-22 18:45:11 +0200332{
Dr. David Alan Gilberte872fa92017-11-17 11:52:49 +0000333 u32 ldr = kvm_apic_calc_x2apic_ldr(id);
Radim Krčmář257b9a52015-05-22 18:45:11 +0200334
Radim Krčmář6e500432016-12-15 18:06:46 +0100335 WARN_ON_ONCE(id != apic->vcpu->vcpu_id);
336
Radim Krčmářa92e2542016-07-12 22:09:22 +0200337 kvm_lapic_set_reg(apic, APIC_ID, id);
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -0500338 kvm_lapic_set_reg(apic, APIC_LDR, ldr);
Paolo Bonzini44d52712020-06-22 16:37:42 +0200339 atomic_set_release(&apic->vcpu->kvm->arch.apic_map_dirty, DIRTY);
Radim Krčmář257b9a52015-05-22 18:45:11 +0200340}
341
Eddie Dong97222cc2007-09-12 10:58:04 +0300342static inline int apic_lvt_enabled(struct kvm_lapic *apic, int lvt_type)
343{
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -0500344 return !(kvm_lapic_get_reg(apic, lvt_type) & APIC_LVT_MASKED);
Eddie Dong97222cc2007-09-12 10:58:04 +0300345}
346
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +0800347static inline int apic_lvtt_oneshot(struct kvm_lapic *apic)
348{
Radim Krčmářf30ebc32014-10-30 15:06:47 +0100349 return apic->lapic_timer.timer_mode == APIC_LVT_TIMER_ONESHOT;
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +0800350}
351
Eddie Dong97222cc2007-09-12 10:58:04 +0300352static inline int apic_lvtt_period(struct kvm_lapic *apic)
353{
Radim Krčmářf30ebc32014-10-30 15:06:47 +0100354 return apic->lapic_timer.timer_mode == APIC_LVT_TIMER_PERIODIC;
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +0800355}
356
357static inline int apic_lvtt_tscdeadline(struct kvm_lapic *apic)
358{
Radim Krčmářf30ebc32014-10-30 15:06:47 +0100359 return apic->lapic_timer.timer_mode == APIC_LVT_TIMER_TSCDEADLINE;
Eddie Dong97222cc2007-09-12 10:58:04 +0300360}
361
Jan Kiszkacc6e4622008-10-20 10:20:03 +0200362static inline int apic_lvt_nmi_mode(u32 lvt_val)
363{
364 return (lvt_val & (APIC_MODE_MASK | APIC_LVT_MASKED)) == APIC_DM_NMI;
365}
366
Gleb Natapovfc61b802009-07-05 17:39:35 +0300367void kvm_apic_set_version(struct kvm_vcpu *vcpu)
368{
369 struct kvm_lapic *apic = vcpu->arch.apic;
Gleb Natapovfc61b802009-07-05 17:39:35 +0300370 u32 v = APIC_VERSION;
371
Paolo Bonzinibce87cc2016-01-08 13:48:51 +0100372 if (!lapic_in_kernel(vcpu))
Gleb Natapovfc61b802009-07-05 17:39:35 +0300373 return;
374
Vitaly Kuznetsov0bcc3fb2018-02-09 14:01:33 +0100375 /*
376 * KVM emulates 82093AA datasheet (with in-kernel IOAPIC implementation)
377 * which doesn't have EOI register; Some buggy OSes (e.g. Windows with
378 * Hyper-V role) disable EOI broadcast in lapic not checking for IOAPIC
379 * version first and level-triggered interrupts never get EOIed in
380 * IOAPIC.
381 */
Xiaoyao Li565b7822020-07-08 14:50:53 +0800382 if (guest_cpuid_has(vcpu, X86_FEATURE_X2APIC) &&
Vitaly Kuznetsov0bcc3fb2018-02-09 14:01:33 +0100383 !ioapic_in_kernel(vcpu->kvm))
Gleb Natapovfc61b802009-07-05 17:39:35 +0300384 v |= APIC_LVR_DIRECTED_EOI;
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -0500385 kvm_lapic_set_reg(apic, APIC_LVR, v);
Gleb Natapovfc61b802009-07-05 17:39:35 +0300386}
387
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -0500388static const unsigned int apic_lvt_mask[KVM_APIC_LVT_NUM] = {
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +0800389 LVT_MASK , /* part LVTT mask, timer mode mask added at runtime */
Eddie Dong97222cc2007-09-12 10:58:04 +0300390 LVT_MASK | APIC_MODE_MASK, /* LVTTHMR */
391 LVT_MASK | APIC_MODE_MASK, /* LVTPC */
392 LINT_MASK, LINT_MASK, /* LVT0-1 */
393 LVT_MASK /* LVTERR */
394};
395
396static int find_highest_vector(void *bitmap)
397{
Takuya Yoshikawaecba9a52012-09-05 19:30:01 +0900398 int vec;
399 u32 *reg;
Eddie Dong97222cc2007-09-12 10:58:04 +0300400
Takuya Yoshikawaecba9a52012-09-05 19:30:01 +0900401 for (vec = MAX_APIC_VECTOR - APIC_VECTORS_PER_REG;
402 vec >= 0; vec -= APIC_VECTORS_PER_REG) {
403 reg = bitmap + REG_POS(vec);
404 if (*reg)
Paolo Bonzini810e6de2016-12-19 13:05:46 +0100405 return __fls(*reg) + vec;
Takuya Yoshikawaecba9a52012-09-05 19:30:01 +0900406 }
Eddie Dong97222cc2007-09-12 10:58:04 +0300407
Takuya Yoshikawaecba9a52012-09-05 19:30:01 +0900408 return -1;
Eddie Dong97222cc2007-09-12 10:58:04 +0300409}
410
Michael S. Tsirkin8680b942012-06-24 19:24:26 +0300411static u8 count_vectors(void *bitmap)
412{
Takuya Yoshikawaecba9a52012-09-05 19:30:01 +0900413 int vec;
414 u32 *reg;
Michael S. Tsirkin8680b942012-06-24 19:24:26 +0300415 u8 count = 0;
Takuya Yoshikawaecba9a52012-09-05 19:30:01 +0900416
417 for (vec = 0; vec < MAX_APIC_VECTOR; vec += APIC_VECTORS_PER_REG) {
418 reg = bitmap + REG_POS(vec);
419 count += hweight32(*reg);
420 }
421
Michael S. Tsirkin8680b942012-06-24 19:24:26 +0300422 return count;
423}
424
Liran Alone7387b02017-12-24 18:12:54 +0200425bool __kvm_apic_update_irr(u32 *pir, void *regs, int *max_irr)
Yang Zhanga20ed542013-04-11 19:25:15 +0800426{
Paolo Bonzini810e6de2016-12-19 13:05:46 +0100427 u32 i, vec;
Liran Alone7387b02017-12-24 18:12:54 +0200428 u32 pir_val, irr_val, prev_irr_val;
429 int max_updated_irr;
430
431 max_updated_irr = -1;
432 *max_irr = -1;
Yang Zhanga20ed542013-04-11 19:25:15 +0800433
Paolo Bonzini810e6de2016-12-19 13:05:46 +0100434 for (i = vec = 0; i <= 7; i++, vec += 32) {
Paolo Bonziniad361092016-09-20 16:15:05 +0200435 pir_val = READ_ONCE(pir[i]);
Paolo Bonzini810e6de2016-12-19 13:05:46 +0100436 irr_val = *((u32 *)(regs + APIC_IRR + i * 0x10));
Paolo Bonziniad361092016-09-20 16:15:05 +0200437 if (pir_val) {
Liran Alone7387b02017-12-24 18:12:54 +0200438 prev_irr_val = irr_val;
Paolo Bonzini810e6de2016-12-19 13:05:46 +0100439 irr_val |= xchg(&pir[i], 0);
440 *((u32 *)(regs + APIC_IRR + i * 0x10)) = irr_val;
Liran Alone7387b02017-12-24 18:12:54 +0200441 if (prev_irr_val != irr_val) {
442 max_updated_irr =
443 __fls(irr_val ^ prev_irr_val) + vec;
444 }
Paolo Bonziniad361092016-09-20 16:15:05 +0200445 }
Paolo Bonzini810e6de2016-12-19 13:05:46 +0100446 if (irr_val)
Liran Alone7387b02017-12-24 18:12:54 +0200447 *max_irr = __fls(irr_val) + vec;
Yang Zhanga20ed542013-04-11 19:25:15 +0800448 }
Paolo Bonzini810e6de2016-12-19 13:05:46 +0100449
Liran Alone7387b02017-12-24 18:12:54 +0200450 return ((max_updated_irr != -1) &&
451 (max_updated_irr == *max_irr));
Yang Zhanga20ed542013-04-11 19:25:15 +0800452}
Wincy Van705699a2015-02-03 23:58:17 +0800453EXPORT_SYMBOL_GPL(__kvm_apic_update_irr);
454
Liran Alone7387b02017-12-24 18:12:54 +0200455bool kvm_apic_update_irr(struct kvm_vcpu *vcpu, u32 *pir, int *max_irr)
Wincy Van705699a2015-02-03 23:58:17 +0800456{
457 struct kvm_lapic *apic = vcpu->arch.apic;
458
Liran Alone7387b02017-12-24 18:12:54 +0200459 return __kvm_apic_update_irr(pir, apic->regs, max_irr);
Wincy Van705699a2015-02-03 23:58:17 +0800460}
Yang Zhanga20ed542013-04-11 19:25:15 +0800461EXPORT_SYMBOL_GPL(kvm_apic_update_irr);
462
Gleb Natapov33e4c682009-06-11 11:06:51 +0300463static inline int apic_search_irr(struct kvm_lapic *apic)
Eddie Dong97222cc2007-09-12 10:58:04 +0300464{
Gleb Natapov33e4c682009-06-11 11:06:51 +0300465 return find_highest_vector(apic->regs + APIC_IRR);
Eddie Dong97222cc2007-09-12 10:58:04 +0300466}
467
468static inline int apic_find_highest_irr(struct kvm_lapic *apic)
469{
470 int result;
471
Yang Zhangc7c9c562013-01-25 10:18:51 +0800472 /*
473 * Note that irr_pending is just a hint. It will be always
474 * true with virtual interrupt delivery enabled.
475 */
Gleb Natapov33e4c682009-06-11 11:06:51 +0300476 if (!apic->irr_pending)
477 return -1;
478
479 result = apic_search_irr(apic);
Eddie Dong97222cc2007-09-12 10:58:04 +0300480 ASSERT(result == -1 || result >= 16);
481
482 return result;
483}
484
Gleb Natapov33e4c682009-06-11 11:06:51 +0300485static inline void apic_clear_irr(int vec, struct kvm_lapic *apic)
486{
Wanpeng Li56cc2402014-08-05 12:42:24 +0800487 struct kvm_vcpu *vcpu;
488
489 vcpu = apic->vcpu;
490
Andrey Smetanind62caab2015-11-10 15:36:33 +0300491 if (unlikely(vcpu->arch.apicv_active)) {
Paolo Bonzinib95234c2016-12-19 13:57:33 +0100492 /* need to update RVI */
Wei Yangee171d22019-03-31 19:17:22 -0700493 kvm_lapic_clear_vector(vec, apic->regs + APIC_IRR);
Jason Baronb36464772021-01-14 22:27:56 -0500494 static_call(kvm_x86_hwapic_irr_update)(vcpu,
Paolo Bonzinib95234c2016-12-19 13:57:33 +0100495 apic_find_highest_irr(apic));
Nadav Amitf210f752014-11-16 23:49:07 +0200496 } else {
497 apic->irr_pending = false;
Wei Yangee171d22019-03-31 19:17:22 -0700498 kvm_lapic_clear_vector(vec, apic->regs + APIC_IRR);
Nadav Amitf210f752014-11-16 23:49:07 +0200499 if (apic_search_irr(apic) != -1)
500 apic->irr_pending = true;
Wanpeng Li56cc2402014-08-05 12:42:24 +0800501 }
Gleb Natapov33e4c682009-06-11 11:06:51 +0300502}
503
Sean Christopherson25bb2cf2020-08-12 10:51:29 -0700504void kvm_apic_clear_irr(struct kvm_vcpu *vcpu, int vec)
505{
506 apic_clear_irr(vec, vcpu->arch.apic);
507}
508EXPORT_SYMBOL_GPL(kvm_apic_clear_irr);
509
Michael S. Tsirkin8680b942012-06-24 19:24:26 +0300510static inline void apic_set_isr(int vec, struct kvm_lapic *apic)
511{
Wanpeng Li56cc2402014-08-05 12:42:24 +0800512 struct kvm_vcpu *vcpu;
Paolo Bonzinifc57ac22014-05-14 17:40:58 +0200513
Wanpeng Li56cc2402014-08-05 12:42:24 +0800514 if (__apic_test_and_set_vector(vec, apic->regs + APIC_ISR))
515 return;
516
517 vcpu = apic->vcpu;
518
Michael S. Tsirkin8680b942012-06-24 19:24:26 +0300519 /*
Wanpeng Li56cc2402014-08-05 12:42:24 +0800520 * With APIC virtualization enabled, all caching is disabled
521 * because the processor can modify ISR under the hood. Instead
522 * just set SVI.
Michael S. Tsirkin8680b942012-06-24 19:24:26 +0300523 */
Andrey Smetanind62caab2015-11-10 15:36:33 +0300524 if (unlikely(vcpu->arch.apicv_active))
Jason Baronb36464772021-01-14 22:27:56 -0500525 static_call(kvm_x86_hwapic_isr_update)(vcpu, vec);
Wanpeng Li56cc2402014-08-05 12:42:24 +0800526 else {
527 ++apic->isr_count;
528 BUG_ON(apic->isr_count > MAX_APIC_VECTOR);
529 /*
530 * ISR (in service register) bit is set when injecting an interrupt.
531 * The highest vector is injected. Thus the latest bit set matches
532 * the highest bit in ISR.
533 */
534 apic->highest_isr_cache = vec;
535 }
Michael S. Tsirkin8680b942012-06-24 19:24:26 +0300536}
537
Paolo Bonzinifc57ac22014-05-14 17:40:58 +0200538static inline int apic_find_highest_isr(struct kvm_lapic *apic)
539{
540 int result;
541
542 /*
543 * Note that isr_count is always 1, and highest_isr_cache
544 * is always -1, with APIC virtualization enabled.
545 */
546 if (!apic->isr_count)
547 return -1;
548 if (likely(apic->highest_isr_cache != -1))
549 return apic->highest_isr_cache;
550
551 result = find_highest_vector(apic->regs + APIC_ISR);
552 ASSERT(result == -1 || result >= 16);
553
554 return result;
555}
556
Michael S. Tsirkin8680b942012-06-24 19:24:26 +0300557static inline void apic_clear_isr(int vec, struct kvm_lapic *apic)
558{
Paolo Bonzinifc57ac22014-05-14 17:40:58 +0200559 struct kvm_vcpu *vcpu;
560 if (!__apic_test_and_clear_vector(vec, apic->regs + APIC_ISR))
561 return;
562
563 vcpu = apic->vcpu;
564
565 /*
566 * We do get here for APIC virtualization enabled if the guest
567 * uses the Hyper-V APIC enlightenment. In this case we may need
568 * to trigger a new interrupt delivery by writing the SVI field;
569 * on the other hand isr_count and highest_isr_cache are unused
570 * and must be left alone.
571 */
Andrey Smetanind62caab2015-11-10 15:36:33 +0300572 if (unlikely(vcpu->arch.apicv_active))
Jason Baronb36464772021-01-14 22:27:56 -0500573 static_call(kvm_x86_hwapic_isr_update)(vcpu,
574 apic_find_highest_isr(apic));
Paolo Bonzinifc57ac22014-05-14 17:40:58 +0200575 else {
Michael S. Tsirkin8680b942012-06-24 19:24:26 +0300576 --apic->isr_count;
Paolo Bonzinifc57ac22014-05-14 17:40:58 +0200577 BUG_ON(apic->isr_count < 0);
578 apic->highest_isr_cache = -1;
579 }
Michael S. Tsirkin8680b942012-06-24 19:24:26 +0300580}
581
Yang, Sheng6e5d8652007-09-12 18:03:11 +0800582int kvm_lapic_find_highest_irr(struct kvm_vcpu *vcpu)
583{
Gleb Natapov33e4c682009-06-11 11:06:51 +0300584 /* This may race with setting of irr in __apic_accept_irq() and
585 * value returned may be wrong, but kvm_vcpu_kick() in __apic_accept_irq
586 * will cause vmexit immediately and the value will be recalculated
587 * on the next vmentry.
588 */
Paolo Bonzinif8543d62016-01-08 13:42:24 +0100589 return apic_find_highest_irr(vcpu->arch.apic);
Yang, Sheng6e5d8652007-09-12 18:03:11 +0800590}
Paolo Bonzini76dfafd52016-12-19 17:17:11 +0100591EXPORT_SYMBOL_GPL(kvm_lapic_find_highest_irr);
Yang, Sheng6e5d8652007-09-12 18:03:11 +0800592
Gleb Natapov6da7e3f2009-03-05 16:34:44 +0200593static int __apic_accept_irq(struct kvm_lapic *apic, int delivery_mode,
Yang Zhangb4f22252013-04-11 19:21:37 +0800594 int vector, int level, int trig_mode,
Joerg Roedel9e4aabe2016-02-29 16:04:43 +0100595 struct dest_map *dest_map);
Gleb Natapov6da7e3f2009-03-05 16:34:44 +0200596
Yang Zhangb4f22252013-04-11 19:21:37 +0800597int kvm_apic_set_irq(struct kvm_vcpu *vcpu, struct kvm_lapic_irq *irq,
Joerg Roedel9e4aabe2016-02-29 16:04:43 +0100598 struct dest_map *dest_map)
Eddie Dong97222cc2007-09-12 10:58:04 +0300599{
Zhang Xiantaoad312c72007-12-13 23:50:52 +0800600 struct kvm_lapic *apic = vcpu->arch.apic;
Zhang Xiantao8be54532007-12-02 22:35:57 +0800601
Gleb Natapov58c2dde2009-03-05 16:35:04 +0200602 return __apic_accept_irq(apic, irq->delivery_mode, irq->vector,
Yang Zhangb4f22252013-04-11 19:21:37 +0800603 irq->level, irq->trig_mode, dest_map);
Eddie Dong97222cc2007-09-12 10:58:04 +0300604}
605
Miaohe Lin1a686232019-11-09 17:46:49 +0800606static int __pv_send_ipi(unsigned long *ipi_bitmap, struct kvm_apic_map *map,
607 struct kvm_lapic_irq *irq, u32 min)
608{
609 int i, count = 0;
610 struct kvm_vcpu *vcpu;
611
612 if (min > map->max_apic_id)
613 return 0;
614
615 for_each_set_bit(i, ipi_bitmap,
616 min((u32)BITS_PER_LONG, (map->max_apic_id - min + 1))) {
617 if (map->phys_map[min + i]) {
618 vcpu = map->phys_map[min + i]->vcpu;
619 count += kvm_apic_set_irq(vcpu, irq, NULL);
620 }
621 }
622
623 return count;
624}
625
Wanpeng Li4180bf12018-07-23 14:39:54 +0800626int kvm_pv_send_ipi(struct kvm *kvm, unsigned long ipi_bitmap_low,
Wanpeng Libdf7ffc2018-08-30 10:03:30 +0800627 unsigned long ipi_bitmap_high, u32 min,
Wanpeng Li4180bf12018-07-23 14:39:54 +0800628 unsigned long icr, int op_64_bit)
629{
Wanpeng Li4180bf12018-07-23 14:39:54 +0800630 struct kvm_apic_map *map;
Wanpeng Li4180bf12018-07-23 14:39:54 +0800631 struct kvm_lapic_irq irq = {0};
632 int cluster_size = op_64_bit ? 64 : 32;
Miaohe Lin1a686232019-11-09 17:46:49 +0800633 int count;
634
635 if (icr & (APIC_DEST_MASK | APIC_SHORT_MASK))
636 return -KVM_EINVAL;
Wanpeng Li4180bf12018-07-23 14:39:54 +0800637
638 irq.vector = icr & APIC_VECTOR_MASK;
639 irq.delivery_mode = icr & APIC_MODE_MASK;
640 irq.level = (icr & APIC_INT_ASSERT) != 0;
641 irq.trig_mode = icr & APIC_INT_LEVELTRIG;
642
Wanpeng Li4180bf12018-07-23 14:39:54 +0800643 rcu_read_lock();
644 map = rcu_dereference(kvm->arch.apic_map);
645
Miaohe Lin1a686232019-11-09 17:46:49 +0800646 count = -EOPNOTSUPP;
647 if (likely(map)) {
648 count = __pv_send_ipi(&ipi_bitmap_low, map, &irq, min);
649 min += cluster_size;
650 count += __pv_send_ipi(&ipi_bitmap_high, map, &irq, min);
Wanpeng Li38ab0122018-11-20 09:39:30 +0800651 }
652
Wanpeng Li4180bf12018-07-23 14:39:54 +0800653 rcu_read_unlock();
654 return count;
655}
656
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +0300657static int pv_eoi_put_user(struct kvm_vcpu *vcpu, u8 val)
658{
Paolo Bonzini4e335d92017-05-02 16:20:18 +0200659
660 return kvm_write_guest_cached(vcpu->kvm, &vcpu->arch.pv_eoi.data, &val,
661 sizeof(val));
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +0300662}
663
664static int pv_eoi_get_user(struct kvm_vcpu *vcpu, u8 *val)
665{
Paolo Bonzini4e335d92017-05-02 16:20:18 +0200666
667 return kvm_read_guest_cached(vcpu->kvm, &vcpu->arch.pv_eoi.data, val,
668 sizeof(*val));
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +0300669}
670
671static inline bool pv_eoi_enabled(struct kvm_vcpu *vcpu)
672{
673 return vcpu->arch.pv_eoi.msr_val & KVM_MSR_ENABLED;
674}
675
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +0300676static void pv_eoi_set_pending(struct kvm_vcpu *vcpu)
677{
Li RongQingce5977b2021-11-04 19:56:13 +0800678 if (pv_eoi_put_user(vcpu, KVM_PV_EOI_ENABLED) < 0)
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +0300679 return;
Li RongQingce5977b2021-11-04 19:56:13 +0800680
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +0300681 __set_bit(KVM_APIC_PV_EOI_PENDING, &vcpu->arch.apic_attention);
682}
683
Li RongQing51b12092021-11-04 19:56:14 +0800684static bool pv_eoi_test_and_clr_pending(struct kvm_vcpu *vcpu)
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +0300685{
Li RongQing51b12092021-11-04 19:56:14 +0800686 u8 val;
Li RongQingce5977b2021-11-04 19:56:13 +0800687
Li RongQing51b12092021-11-04 19:56:14 +0800688 if (pv_eoi_get_user(vcpu, &val) < 0)
689 return false;
690
691 val &= KVM_PV_EOI_ENABLED;
692
693 if (val && pv_eoi_put_user(vcpu, KVM_PV_EOI_DISABLED) < 0)
694 return false;
695
696 /*
697 * Clear pending bit in any case: it will be set again on vmentry.
698 * While this might not be ideal from performance point of view,
699 * this makes sure pv eoi is only enabled when we know it's safe.
700 */
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +0300701 __clear_bit(KVM_APIC_PV_EOI_PENDING, &vcpu->arch.apic_attention);
Li RongQing51b12092021-11-04 19:56:14 +0800702
703 return val;
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +0300704}
705
Paolo Bonzinib3c045d2016-12-18 21:47:54 +0100706static int apic_has_interrupt_for_ppr(struct kvm_lapic *apic, u32 ppr)
707{
Paolo Bonzini3d927892016-12-19 13:29:03 +0100708 int highest_irr;
Paolo Bonzini37c4dbf2021-11-22 19:43:10 -0500709 if (kvm_x86_ops.sync_pir_to_irr)
Jason Baronb36464772021-01-14 22:27:56 -0500710 highest_irr = static_call(kvm_x86_sync_pir_to_irr)(apic->vcpu);
Paolo Bonzini76dfafd52016-12-19 17:17:11 +0100711 else
712 highest_irr = apic_find_highest_irr(apic);
Paolo Bonzinib3c045d2016-12-18 21:47:54 +0100713 if (highest_irr == -1 || (highest_irr & 0xF0) <= ppr)
714 return -1;
715 return highest_irr;
716}
717
718static bool __apic_update_ppr(struct kvm_lapic *apic, u32 *new_ppr)
Eddie Dong97222cc2007-09-12 10:58:04 +0300719{
Avi Kivity3842d132010-07-27 12:30:24 +0300720 u32 tpr, isrv, ppr, old_ppr;
Eddie Dong97222cc2007-09-12 10:58:04 +0300721 int isr;
722
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -0500723 old_ppr = kvm_lapic_get_reg(apic, APIC_PROCPRI);
724 tpr = kvm_lapic_get_reg(apic, APIC_TASKPRI);
Eddie Dong97222cc2007-09-12 10:58:04 +0300725 isr = apic_find_highest_isr(apic);
726 isrv = (isr != -1) ? isr : 0;
727
728 if ((tpr & 0xf0) >= (isrv & 0xf0))
729 ppr = tpr & 0xff;
730 else
731 ppr = isrv & 0xf0;
732
Paolo Bonzinib3c045d2016-12-18 21:47:54 +0100733 *new_ppr = ppr;
734 if (old_ppr != ppr)
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -0500735 kvm_lapic_set_reg(apic, APIC_PROCPRI, ppr);
Paolo Bonzinib3c045d2016-12-18 21:47:54 +0100736
737 return ppr < old_ppr;
738}
739
740static void apic_update_ppr(struct kvm_lapic *apic)
741{
742 u32 ppr;
743
Paolo Bonzini26fbbee2016-12-18 13:54:58 +0100744 if (__apic_update_ppr(apic, &ppr) &&
745 apic_has_interrupt_for_ppr(apic, ppr) != -1)
Paolo Bonzinib3c045d2016-12-18 21:47:54 +0100746 kvm_make_request(KVM_REQ_EVENT, apic->vcpu);
Eddie Dong97222cc2007-09-12 10:58:04 +0300747}
748
Paolo Bonzinieb90f342016-12-18 14:02:21 +0100749void kvm_apic_update_ppr(struct kvm_vcpu *vcpu)
750{
751 apic_update_ppr(vcpu->arch.apic);
752}
753EXPORT_SYMBOL_GPL(kvm_apic_update_ppr);
754
Eddie Dong97222cc2007-09-12 10:58:04 +0300755static void apic_set_tpr(struct kvm_lapic *apic, u32 tpr)
756{
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -0500757 kvm_lapic_set_reg(apic, APIC_TASKPRI, tpr);
Eddie Dong97222cc2007-09-12 10:58:04 +0300758 apic_update_ppr(apic);
759}
760
Radim Krčmář03d22492015-02-12 19:41:31 +0100761static bool kvm_apic_broadcast(struct kvm_lapic *apic, u32 mda)
Eddie Dong97222cc2007-09-12 10:58:04 +0300762{
Radim Krčmářb4535b52016-12-15 18:06:47 +0100763 return mda == (apic_x2apic_mode(apic) ?
764 X2APIC_BROADCAST : APIC_BROADCAST);
Eddie Dong97222cc2007-09-12 10:58:04 +0300765}
766
Radim Krčmář03d22492015-02-12 19:41:31 +0100767static bool kvm_apic_match_physical_addr(struct kvm_lapic *apic, u32 mda)
Nadav Amit394457a2014-10-03 00:30:52 +0300768{
Radim Krčmář03d22492015-02-12 19:41:31 +0100769 if (kvm_apic_broadcast(apic, mda))
770 return true;
771
772 if (apic_x2apic_mode(apic))
Radim Krčmář6e500432016-12-15 18:06:46 +0100773 return mda == kvm_x2apic_id(apic);
Radim Krčmář03d22492015-02-12 19:41:31 +0100774
Radim Krčmář5bd5db32016-12-15 18:06:48 +0100775 /*
776 * Hotplug hack: Make LAPIC in xAPIC mode also accept interrupts as if
777 * it were in x2APIC mode. Hotplugged VCPUs start in xAPIC mode and
778 * this allows unique addressing of VCPUs with APIC ID over 0xff.
779 * The 0xff condition is needed because writeable xAPIC ID.
780 */
781 if (kvm_x2apic_id(apic) > 0xff && mda == kvm_x2apic_id(apic))
782 return true;
783
Radim Krčmářb4535b52016-12-15 18:06:47 +0100784 return mda == kvm_xapic_id(apic);
Nadav Amit394457a2014-10-03 00:30:52 +0300785}
786
Radim Krčmář52c233a2015-01-29 22:48:48 +0100787static bool kvm_apic_match_logical_addr(struct kvm_lapic *apic, u32 mda)
Eddie Dong97222cc2007-09-12 10:58:04 +0300788{
Gleb Natapov0105d1a2009-07-05 17:39:36 +0300789 u32 logical_id;
790
Nadav Amit394457a2014-10-03 00:30:52 +0300791 if (kvm_apic_broadcast(apic, mda))
Radim Krčmář9368b562015-01-29 22:48:49 +0100792 return true;
Nadav Amit394457a2014-10-03 00:30:52 +0300793
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -0500794 logical_id = kvm_lapic_get_reg(apic, APIC_LDR);
Eddie Dong97222cc2007-09-12 10:58:04 +0300795
Radim Krčmář9368b562015-01-29 22:48:49 +0100796 if (apic_x2apic_mode(apic))
Radim Krčmář8a395362015-01-29 22:48:51 +0100797 return ((logical_id >> 16) == (mda >> 16))
798 && (logical_id & mda & 0xffff) != 0;
Radim Krčmář9368b562015-01-29 22:48:49 +0100799
800 logical_id = GET_APIC_LOGICAL_ID(logical_id);
Eddie Dong97222cc2007-09-12 10:58:04 +0300801
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -0500802 switch (kvm_lapic_get_reg(apic, APIC_DFR)) {
Eddie Dong97222cc2007-09-12 10:58:04 +0300803 case APIC_DFR_FLAT:
Radim Krčmář9368b562015-01-29 22:48:49 +0100804 return (logical_id & mda) != 0;
Eddie Dong97222cc2007-09-12 10:58:04 +0300805 case APIC_DFR_CLUSTER:
Radim Krčmář9368b562015-01-29 22:48:49 +0100806 return ((logical_id >> 4) == (mda >> 4))
807 && (logical_id & mda & 0xf) != 0;
Eddie Dong97222cc2007-09-12 10:58:04 +0300808 default:
Radim Krčmář9368b562015-01-29 22:48:49 +0100809 return false;
Eddie Dong97222cc2007-09-12 10:58:04 +0300810 }
Eddie Dong97222cc2007-09-12 10:58:04 +0300811}
812
Radim Krčmářc5192652016-07-12 22:09:28 +0200813/* The KVM local APIC implementation has two quirks:
814 *
Radim Krčmářb4535b52016-12-15 18:06:47 +0100815 * - Real hardware delivers interrupts destined to x2APIC ID > 0xff to LAPICs
816 * in xAPIC mode if the "destination & 0xff" matches its xAPIC ID.
817 * KVM doesn't do that aliasing.
Radim Krčmářc5192652016-07-12 22:09:28 +0200818 *
819 * - in-kernel IOAPIC messages have to be delivered directly to
820 * x2APIC, because the kernel does not support interrupt remapping.
821 * In order to support broadcast without interrupt remapping, x2APIC
822 * rewrites the destination of non-IPI messages from APIC_BROADCAST
823 * to X2APIC_BROADCAST.
824 *
825 * The broadcast quirk can be disabled with KVM_CAP_X2APIC_API. This is
826 * important when userspace wants to use x2APIC-format MSIs, because
827 * APIC_BROADCAST (0xff) is a legal route for "cluster 0, CPUs 0-7".
Radim Krčmář03d22492015-02-12 19:41:31 +0100828 */
Radim Krčmářc5192652016-07-12 22:09:28 +0200829static u32 kvm_apic_mda(struct kvm_vcpu *vcpu, unsigned int dest_id,
830 struct kvm_lapic *source, struct kvm_lapic *target)
Radim Krčmář03d22492015-02-12 19:41:31 +0100831{
832 bool ipi = source != NULL;
Radim Krčmář03d22492015-02-12 19:41:31 +0100833
Radim Krčmářc5192652016-07-12 22:09:28 +0200834 if (!vcpu->kvm->arch.x2apic_broadcast_quirk_disabled &&
Radim Krčmářb4535b52016-12-15 18:06:47 +0100835 !ipi && dest_id == APIC_BROADCAST && apic_x2apic_mode(target))
Radim Krčmář03d22492015-02-12 19:41:31 +0100836 return X2APIC_BROADCAST;
837
Radim Krčmářb4535b52016-12-15 18:06:47 +0100838 return dest_id;
Radim Krčmář03d22492015-02-12 19:41:31 +0100839}
840
Radim Krčmář52c233a2015-01-29 22:48:48 +0100841bool kvm_apic_match_dest(struct kvm_vcpu *vcpu, struct kvm_lapic *source,
Peter Xu5c69d5c2019-12-04 20:07:20 +0100842 int shorthand, unsigned int dest, int dest_mode)
Eddie Dong97222cc2007-09-12 10:58:04 +0300843{
Zhang Xiantaoad312c72007-12-13 23:50:52 +0800844 struct kvm_lapic *target = vcpu->arch.apic;
Radim Krčmářc5192652016-07-12 22:09:28 +0200845 u32 mda = kvm_apic_mda(vcpu, dest, source, target);
Eddie Dong97222cc2007-09-12 10:58:04 +0300846
Zachary Amsdenbd371392010-06-14 11:42:15 -1000847 ASSERT(target);
Peter Xu5c69d5c2019-12-04 20:07:20 +0100848 switch (shorthand) {
Eddie Dong97222cc2007-09-12 10:58:04 +0300849 case APIC_DEST_NOSHORT:
Radim Krčmář3697f302015-01-29 22:48:50 +0100850 if (dest_mode == APIC_DEST_PHYSICAL)
Radim Krčmář03d22492015-02-12 19:41:31 +0100851 return kvm_apic_match_physical_addr(target, mda);
Gleb Natapov343f94f2009-03-05 16:34:54 +0200852 else
Radim Krčmář03d22492015-02-12 19:41:31 +0100853 return kvm_apic_match_logical_addr(target, mda);
Eddie Dong97222cc2007-09-12 10:58:04 +0300854 case APIC_DEST_SELF:
Radim Krčmář9368b562015-01-29 22:48:49 +0100855 return target == source;
Eddie Dong97222cc2007-09-12 10:58:04 +0300856 case APIC_DEST_ALLINC:
Radim Krčmář9368b562015-01-29 22:48:49 +0100857 return true;
Eddie Dong97222cc2007-09-12 10:58:04 +0300858 case APIC_DEST_ALLBUT:
Radim Krčmář9368b562015-01-29 22:48:49 +0100859 return target != source;
Eddie Dong97222cc2007-09-12 10:58:04 +0300860 default:
Radim Krčmář9368b562015-01-29 22:48:49 +0100861 return false;
Eddie Dong97222cc2007-09-12 10:58:04 +0300862 }
Eddie Dong97222cc2007-09-12 10:58:04 +0300863}
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -0500864EXPORT_SYMBOL_GPL(kvm_apic_match_dest);
Eddie Dong97222cc2007-09-12 10:58:04 +0300865
Feng Wu520040142016-01-25 16:53:33 +0800866int kvm_vector_to_index(u32 vector, u32 dest_vcpus,
867 const unsigned long *bitmap, u32 bitmap_size)
868{
869 u32 mod;
870 int i, idx = -1;
871
872 mod = vector % dest_vcpus;
873
874 for (i = 0; i <= mod; i++) {
875 idx = find_next_bit(bitmap, bitmap_size, idx + 1);
876 BUG_ON(idx == bitmap_size);
877 }
878
879 return idx;
880}
881
Radim Krčmář4efd8052016-02-12 15:00:15 +0100882static void kvm_apic_disabled_lapic_found(struct kvm *kvm)
883{
884 if (!kvm->arch.disabled_lapic_found) {
885 kvm->arch.disabled_lapic_found = true;
886 printk(KERN_INFO
887 "Disabled LAPIC found during irq injection\n");
888 }
889}
890
Radim Krčmářc5192652016-07-12 22:09:28 +0200891static bool kvm_apic_is_broadcast_dest(struct kvm *kvm, struct kvm_lapic **src,
892 struct kvm_lapic_irq *irq, struct kvm_apic_map *map)
893{
894 if (kvm->arch.x2apic_broadcast_quirk_disabled) {
895 if ((irq->dest_id == APIC_BROADCAST &&
896 map->mode != KVM_APIC_MODE_X2APIC))
897 return true;
898 if (irq->dest_id == X2APIC_BROADCAST)
899 return true;
900 } else {
901 bool x2apic_ipi = src && *src && apic_x2apic_mode(*src);
902 if (irq->dest_id == (x2apic_ipi ?
903 X2APIC_BROADCAST : APIC_BROADCAST))
904 return true;
905 }
906
907 return false;
908}
909
Radim Krčmář64aa47b2016-07-12 22:09:18 +0200910/* Return true if the interrupt can be handled by using *bitmap as index mask
911 * for valid destinations in *dst array.
912 * Return false if kvm_apic_map_get_dest_lapic did nothing useful.
913 * Note: we may have zero kvm_lapic destinations when we return true, which
914 * means that the interrupt should be dropped. In this case, *bitmap would be
915 * zero and *dst undefined.
916 */
917static inline bool kvm_apic_map_get_dest_lapic(struct kvm *kvm,
918 struct kvm_lapic **src, struct kvm_lapic_irq *irq,
919 struct kvm_apic_map *map, struct kvm_lapic ***dst,
920 unsigned long *bitmap)
921{
922 int i, lowest;
Radim Krčmář64aa47b2016-07-12 22:09:18 +0200923
924 if (irq->shorthand == APIC_DEST_SELF && src) {
925 *dst = src;
926 *bitmap = 1;
927 return true;
928 } else if (irq->shorthand)
929 return false;
930
Radim Krčmářc5192652016-07-12 22:09:28 +0200931 if (!map || kvm_apic_is_broadcast_dest(kvm, src, irq, map))
Radim Krčmář64aa47b2016-07-12 22:09:18 +0200932 return false;
933
934 if (irq->dest_mode == APIC_DEST_PHYSICAL) {
Radim Krčmář0ca52e72016-07-12 22:09:20 +0200935 if (irq->dest_id > map->max_apic_id) {
Radim Krčmář64aa47b2016-07-12 22:09:18 +0200936 *bitmap = 0;
937 } else {
Paolo Bonzini1d487e92019-04-11 11:16:47 +0200938 u32 dest_id = array_index_nospec(irq->dest_id, map->max_apic_id + 1);
939 *dst = &map->phys_map[dest_id];
Radim Krčmář64aa47b2016-07-12 22:09:18 +0200940 *bitmap = 1;
941 }
942 return true;
943 }
944
Radim Krčmáře45115b2016-07-12 22:09:19 +0200945 *bitmap = 0;
946 if (!kvm_apic_map_get_logical_dest(map, irq->dest_id, dst,
947 (u16 *)bitmap))
Radim Krčmář64aa47b2016-07-12 22:09:18 +0200948 return false;
949
Radim Krčmář64aa47b2016-07-12 22:09:18 +0200950 if (!kvm_lowest_prio_delivery(irq))
951 return true;
952
953 if (!kvm_vector_hashing_enabled()) {
954 lowest = -1;
955 for_each_set_bit(i, bitmap, 16) {
956 if (!(*dst)[i])
957 continue;
958 if (lowest < 0)
959 lowest = i;
960 else if (kvm_apic_compare_prio((*dst)[i]->vcpu,
961 (*dst)[lowest]->vcpu) < 0)
962 lowest = i;
963 }
964 } else {
965 if (!*bitmap)
966 return true;
967
968 lowest = kvm_vector_to_index(irq->vector, hweight16(*bitmap),
969 bitmap, 16);
970
971 if (!(*dst)[lowest]) {
972 kvm_apic_disabled_lapic_found(kvm);
973 *bitmap = 0;
974 return true;
975 }
976 }
977
978 *bitmap = (lowest >= 0) ? 1 << lowest : 0;
979
980 return true;
981}
982
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300983bool kvm_irq_delivery_to_apic_fast(struct kvm *kvm, struct kvm_lapic *src,
Joerg Roedel9e4aabe2016-02-29 16:04:43 +0100984 struct kvm_lapic_irq *irq, int *r, struct dest_map *dest_map)
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300985{
986 struct kvm_apic_map *map;
Radim Krčmář64aa47b2016-07-12 22:09:18 +0200987 unsigned long bitmap;
988 struct kvm_lapic **dst = NULL;
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300989 int i;
Radim Krčmář64aa47b2016-07-12 22:09:18 +0200990 bool ret;
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300991
992 *r = -1;
993
994 if (irq->shorthand == APIC_DEST_SELF) {
Yang Zhangb4f22252013-04-11 19:21:37 +0800995 *r = kvm_apic_set_irq(src->vcpu, irq, dest_map);
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300996 return true;
997 }
998
Gleb Natapov1e08ec42012-09-13 17:19:24 +0300999 rcu_read_lock();
1000 map = rcu_dereference(kvm->arch.apic_map);
1001
Radim Krčmář64aa47b2016-07-12 22:09:18 +02001002 ret = kvm_apic_map_get_dest_lapic(kvm, &src, irq, map, &dst, &bitmap);
Paolo Bonzini0624fca2018-10-01 16:07:18 +02001003 if (ret) {
1004 *r = 0;
Radim Krčmář64aa47b2016-07-12 22:09:18 +02001005 for_each_set_bit(i, &bitmap, 16) {
1006 if (!dst[i])
1007 continue;
Radim Krčmář64aa47b2016-07-12 22:09:18 +02001008 *r += kvm_apic_set_irq(dst[i]->vcpu, irq, dest_map);
Radim Krčmář3548a252015-02-12 19:41:33 +01001009 }
Paolo Bonzini0624fca2018-10-01 16:07:18 +02001010 }
Radim Krčmář3548a252015-02-12 19:41:33 +01001011
Gleb Natapov1e08ec42012-09-13 17:19:24 +03001012 rcu_read_unlock();
1013 return ret;
1014}
1015
Feng Wu6228a0d2016-01-25 16:53:34 +08001016/*
Miaohe Lin00116792019-12-11 14:26:23 +08001017 * This routine tries to handle interrupts in posted mode, here is how
Feng Wu6228a0d2016-01-25 16:53:34 +08001018 * it deals with different cases:
1019 * - For single-destination interrupts, handle it in posted mode
1020 * - Else if vector hashing is enabled and it is a lowest-priority
1021 * interrupt, handle it in posted mode and use the following mechanism
Miaohe Lin67b0ae42019-12-11 14:26:22 +08001022 * to find the destination vCPU.
Feng Wu6228a0d2016-01-25 16:53:34 +08001023 * 1. For lowest-priority interrupts, store all the possible
1024 * destination vCPUs in an array.
1025 * 2. Use "guest vector % max number of destination vCPUs" to find
1026 * the right destination vCPU in the array for the lowest-priority
1027 * interrupt.
1028 * - Otherwise, use remapped mode to inject the interrupt.
1029 */
Feng Wu8feb4a02015-09-18 22:29:47 +08001030bool kvm_intr_is_single_vcpu_fast(struct kvm *kvm, struct kvm_lapic_irq *irq,
1031 struct kvm_vcpu **dest_vcpu)
1032{
1033 struct kvm_apic_map *map;
Radim Krčmář64aa47b2016-07-12 22:09:18 +02001034 unsigned long bitmap;
1035 struct kvm_lapic **dst = NULL;
Feng Wu8feb4a02015-09-18 22:29:47 +08001036 bool ret = false;
Feng Wu8feb4a02015-09-18 22:29:47 +08001037
1038 if (irq->shorthand)
1039 return false;
1040
1041 rcu_read_lock();
1042 map = rcu_dereference(kvm->arch.apic_map);
1043
Radim Krčmář64aa47b2016-07-12 22:09:18 +02001044 if (kvm_apic_map_get_dest_lapic(kvm, NULL, irq, map, &dst, &bitmap) &&
1045 hweight16(bitmap) == 1) {
1046 unsigned long i = find_first_bit(&bitmap, 16);
Feng Wu8feb4a02015-09-18 22:29:47 +08001047
Radim Krčmář64aa47b2016-07-12 22:09:18 +02001048 if (dst[i]) {
1049 *dest_vcpu = dst[i]->vcpu;
1050 ret = true;
Feng Wu8feb4a02015-09-18 22:29:47 +08001051 }
Feng Wu8feb4a02015-09-18 22:29:47 +08001052 }
1053
Feng Wu8feb4a02015-09-18 22:29:47 +08001054 rcu_read_unlock();
1055 return ret;
1056}
1057
Eddie Dong97222cc2007-09-12 10:58:04 +03001058/*
1059 * Add a pending IRQ into lapic.
1060 * Return 1 if successfully added and 0 if discarded.
1061 */
1062static int __apic_accept_irq(struct kvm_lapic *apic, int delivery_mode,
Yang Zhangb4f22252013-04-11 19:21:37 +08001063 int vector, int level, int trig_mode,
Joerg Roedel9e4aabe2016-02-29 16:04:43 +01001064 struct dest_map *dest_map)
Eddie Dong97222cc2007-09-12 10:58:04 +03001065{
Gleb Natapov6da7e3f2009-03-05 16:34:44 +02001066 int result = 0;
He, Qingc5ec1532007-09-03 17:07:41 +03001067 struct kvm_vcpu *vcpu = apic->vcpu;
Eddie Dong97222cc2007-09-12 10:58:04 +03001068
Paolo Bonzinia183b632014-09-11 11:51:02 +02001069 trace_kvm_apic_accept_irq(vcpu->vcpu_id, delivery_mode,
1070 trig_mode, vector);
Eddie Dong97222cc2007-09-12 10:58:04 +03001071 switch (delivery_mode) {
Eddie Dong97222cc2007-09-12 10:58:04 +03001072 case APIC_DM_LOWEST:
Gleb Natapove1035712009-03-05 16:34:59 +02001073 vcpu->arch.apic_arb_prio++;
Gustavo A. R. Silvadf561f662020-08-23 17:36:59 -05001074 fallthrough;
Gleb Natapove1035712009-03-05 16:34:59 +02001075 case APIC_DM_FIXED:
Paolo Bonzinibdaffe12015-07-29 15:03:06 +02001076 if (unlikely(trig_mode && !level))
1077 break;
1078
Eddie Dong97222cc2007-09-12 10:58:04 +03001079 /* FIXME add logic for vcpu on reset */
1080 if (unlikely(!apic_enabled(apic)))
1081 break;
1082
Jan Kiszka11f5cc02013-07-25 09:58:45 +02001083 result = 1;
1084
Joerg Roedel9daa5002016-02-29 16:04:44 +01001085 if (dest_map) {
Joerg Roedel9e4aabe2016-02-29 16:04:43 +01001086 __set_bit(vcpu->vcpu_id, dest_map->map);
Joerg Roedel9daa5002016-02-29 16:04:44 +01001087 dest_map->vectors[vcpu->vcpu_id] = vector;
1088 }
Avi Kivitya5d36f82009-12-29 12:42:16 +02001089
Paolo Bonzinibdaffe12015-07-29 15:03:06 +02001090 if (apic_test_vector(vector, apic->regs + APIC_TMR) != !!trig_mode) {
1091 if (trig_mode)
Wei Yangee171d22019-03-31 19:17:22 -07001092 kvm_lapic_set_vector(vector,
1093 apic->regs + APIC_TMR);
Paolo Bonzinibdaffe12015-07-29 15:03:06 +02001094 else
Wei Yangee171d22019-03-31 19:17:22 -07001095 kvm_lapic_clear_vector(vector,
1096 apic->regs + APIC_TMR);
Paolo Bonzinibdaffe12015-07-29 15:03:06 +02001097 }
1098
Jason Baronb36464772021-01-14 22:27:56 -05001099 if (static_call(kvm_x86_deliver_posted_interrupt)(vcpu, vector)) {
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05001100 kvm_lapic_set_irr(vector, apic);
Yang Zhang5a717852013-04-11 19:25:16 +08001101 kvm_make_request(KVM_REQ_EVENT, vcpu);
1102 kvm_vcpu_kick(vcpu);
Eddie Dong97222cc2007-09-12 10:58:04 +03001103 }
Eddie Dong97222cc2007-09-12 10:58:04 +03001104 break;
1105
1106 case APIC_DM_REMRD:
Raghavendra K T24d21662013-08-26 14:18:35 +05301107 result = 1;
1108 vcpu->arch.pv.pv_unhalted = 1;
1109 kvm_make_request(KVM_REQ_EVENT, vcpu);
1110 kvm_vcpu_kick(vcpu);
Eddie Dong97222cc2007-09-12 10:58:04 +03001111 break;
1112
1113 case APIC_DM_SMI:
Paolo Bonzini64d60672015-05-07 11:36:11 +02001114 result = 1;
1115 kvm_make_request(KVM_REQ_SMI, vcpu);
1116 kvm_vcpu_kick(vcpu);
Eddie Dong97222cc2007-09-12 10:58:04 +03001117 break;
Sheng Yang3419ffc2008-05-15 09:52:48 +08001118
Eddie Dong97222cc2007-09-12 10:58:04 +03001119 case APIC_DM_NMI:
Gleb Natapov6da7e3f2009-03-05 16:34:44 +02001120 result = 1;
Sheng Yang3419ffc2008-05-15 09:52:48 +08001121 kvm_inject_nmi(vcpu);
Jan Kiszka26df99c2008-09-26 09:30:54 +02001122 kvm_vcpu_kick(vcpu);
Eddie Dong97222cc2007-09-12 10:58:04 +03001123 break;
1124
1125 case APIC_DM_INIT:
Julian Stecklinaa52315e2012-01-16 14:02:20 +01001126 if (!trig_mode || level) {
Gleb Natapov6da7e3f2009-03-05 16:34:44 +02001127 result = 1;
Jan Kiszka66450a22013-03-13 12:42:34 +01001128 /* assumes that there are only KVM_APIC_INIT/SIPI */
1129 apic->pending_events = (1UL << KVM_APIC_INIT);
Avi Kivity3842d132010-07-27 12:30:24 +03001130 kvm_make_request(KVM_REQ_EVENT, vcpu);
He, Qingc5ec1532007-09-03 17:07:41 +03001131 kvm_vcpu_kick(vcpu);
He, Qingc5ec1532007-09-03 17:07:41 +03001132 }
Eddie Dong97222cc2007-09-12 10:58:04 +03001133 break;
1134
1135 case APIC_DM_STARTUP:
Jan Kiszka66450a22013-03-13 12:42:34 +01001136 result = 1;
1137 apic->sipi_vector = vector;
1138 /* make sure sipi_vector is visible for the receiver */
1139 smp_wmb();
1140 set_bit(KVM_APIC_SIPI, &apic->pending_events);
1141 kvm_make_request(KVM_REQ_EVENT, vcpu);
1142 kvm_vcpu_kick(vcpu);
Eddie Dong97222cc2007-09-12 10:58:04 +03001143 break;
1144
Jan Kiszka23930f92008-09-26 09:30:52 +02001145 case APIC_DM_EXTINT:
1146 /*
1147 * Should only be called by kvm_apic_local_deliver() with LVT0,
1148 * before NMI watchdog was enabled. Already handled by
1149 * kvm_apic_accept_pic_intr().
1150 */
1151 break;
1152
Eddie Dong97222cc2007-09-12 10:58:04 +03001153 default:
1154 printk(KERN_ERR "TODO: unsupported delivery mode %x\n",
1155 delivery_mode);
1156 break;
1157 }
1158 return result;
1159}
1160
Nitesh Narayan Lal7ee30bc2019-11-07 07:53:43 -05001161/*
1162 * This routine identifies the destination vcpus mask meant to receive the
1163 * IOAPIC interrupts. It either uses kvm_apic_map_get_dest_lapic() to find
1164 * out the destination vcpus array and set the bitmap or it traverses to
1165 * each available vcpu to identify the same.
1166 */
1167void kvm_bitmap_or_dest_vcpus(struct kvm *kvm, struct kvm_lapic_irq *irq,
1168 unsigned long *vcpu_bitmap)
1169{
1170 struct kvm_lapic **dest_vcpu = NULL;
1171 struct kvm_lapic *src = NULL;
1172 struct kvm_apic_map *map;
1173 struct kvm_vcpu *vcpu;
Marc Zyngier46808a42021-11-16 16:04:02 +00001174 unsigned long bitmap, i;
1175 int vcpu_idx;
Nitesh Narayan Lal7ee30bc2019-11-07 07:53:43 -05001176 bool ret;
1177
1178 rcu_read_lock();
1179 map = rcu_dereference(kvm->arch.apic_map);
1180
1181 ret = kvm_apic_map_get_dest_lapic(kvm, &src, irq, map, &dest_vcpu,
1182 &bitmap);
1183 if (ret) {
1184 for_each_set_bit(i, &bitmap, 16) {
1185 if (!dest_vcpu[i])
1186 continue;
1187 vcpu_idx = dest_vcpu[i]->vcpu->vcpu_idx;
1188 __set_bit(vcpu_idx, vcpu_bitmap);
1189 }
1190 } else {
1191 kvm_for_each_vcpu(i, vcpu, kvm) {
1192 if (!kvm_apic_present(vcpu))
1193 continue;
1194 if (!kvm_apic_match_dest(vcpu, NULL,
Peter Xub4b29632019-12-04 20:07:16 +01001195 irq->shorthand,
Nitesh Narayan Lal7ee30bc2019-11-07 07:53:43 -05001196 irq->dest_id,
1197 irq->dest_mode))
1198 continue;
1199 __set_bit(i, vcpu_bitmap);
1200 }
1201 }
1202 rcu_read_unlock();
1203}
1204
Gleb Natapove1035712009-03-05 16:34:59 +02001205int kvm_apic_compare_prio(struct kvm_vcpu *vcpu1, struct kvm_vcpu *vcpu2)
Eddie Dong97222cc2007-09-12 10:58:04 +03001206{
Gleb Natapove1035712009-03-05 16:34:59 +02001207 return vcpu1->arch.apic_arb_prio - vcpu2->arch.apic_arb_prio;
Zhang Xiantao8be54532007-12-02 22:35:57 +08001208}
1209
Paolo Bonzini3bb345f2015-07-29 10:43:18 +02001210static bool kvm_ioapic_handles_vector(struct kvm_lapic *apic, int vector)
1211{
Andrey Smetanin63086302015-11-10 15:36:32 +03001212 return test_bit(vector, apic->vcpu->arch.ioapic_handled_vectors);
Paolo Bonzini3bb345f2015-07-29 10:43:18 +02001213}
1214
Yang Zhangc7c9c562013-01-25 10:18:51 +08001215static void kvm_ioapic_send_eoi(struct kvm_lapic *apic, int vector)
1216{
Steve Rutherford7543a632015-07-29 23:21:41 -07001217 int trigger_mode;
Paolo Bonzini3bb345f2015-07-29 10:43:18 +02001218
Steve Rutherford7543a632015-07-29 23:21:41 -07001219 /* Eoi the ioapic only if the ioapic doesn't own the vector. */
1220 if (!kvm_ioapic_handles_vector(apic, vector))
1221 return;
1222
1223 /* Request a KVM exit to inform the userspace IOAPIC. */
1224 if (irqchip_split(apic->vcpu->kvm)) {
1225 apic->vcpu->arch.pending_ioapic_eoi = vector;
1226 kvm_make_request(KVM_REQ_IOAPIC_EOI_EXIT, apic->vcpu);
1227 return;
Yang Zhangc7c9c562013-01-25 10:18:51 +08001228 }
Steve Rutherford7543a632015-07-29 23:21:41 -07001229
1230 if (apic_test_vector(vector, apic->regs + APIC_TMR))
1231 trigger_mode = IOAPIC_LEVEL_TRIG;
1232 else
1233 trigger_mode = IOAPIC_EDGE_TRIG;
1234
1235 kvm_ioapic_update_eoi(apic->vcpu, vector, trigger_mode);
Yang Zhangc7c9c562013-01-25 10:18:51 +08001236}
1237
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03001238static int apic_set_eoi(struct kvm_lapic *apic)
Eddie Dong97222cc2007-09-12 10:58:04 +03001239{
1240 int vector = apic_find_highest_isr(apic);
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03001241
1242 trace_kvm_eoi(apic, vector);
1243
Eddie Dong97222cc2007-09-12 10:58:04 +03001244 /*
1245 * Not every write EOI will has corresponding ISR,
1246 * one example is when Kernel check timer on setup_IO_APIC
1247 */
1248 if (vector == -1)
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03001249 return vector;
Eddie Dong97222cc2007-09-12 10:58:04 +03001250
Michael S. Tsirkin8680b942012-06-24 19:24:26 +03001251 apic_clear_isr(vector, apic);
Eddie Dong97222cc2007-09-12 10:58:04 +03001252 apic_update_ppr(apic);
1253
Vitaly Kuznetsovf2bc14b2021-01-26 14:48:12 +01001254 if (to_hv_vcpu(apic->vcpu) &&
1255 test_bit(vector, to_hv_synic(apic->vcpu)->vec_bitmap))
Andrey Smetanin5c9194122015-11-10 15:36:34 +03001256 kvm_hv_synic_send_eoi(apic->vcpu, vector);
1257
Yang Zhangc7c9c562013-01-25 10:18:51 +08001258 kvm_ioapic_send_eoi(apic, vector);
Avi Kivity3842d132010-07-27 12:30:24 +03001259 kvm_make_request(KVM_REQ_EVENT, apic->vcpu);
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03001260 return vector;
Eddie Dong97222cc2007-09-12 10:58:04 +03001261}
1262
Yang Zhangc7c9c562013-01-25 10:18:51 +08001263/*
1264 * this interface assumes a trap-like exit, which has already finished
1265 * desired side effect including vISR and vPPR update.
1266 */
1267void kvm_apic_set_eoi_accelerated(struct kvm_vcpu *vcpu, int vector)
1268{
1269 struct kvm_lapic *apic = vcpu->arch.apic;
1270
1271 trace_kvm_eoi(apic, vector);
1272
1273 kvm_ioapic_send_eoi(apic, vector);
1274 kvm_make_request(KVM_REQ_EVENT, apic->vcpu);
1275}
1276EXPORT_SYMBOL_GPL(kvm_apic_set_eoi_accelerated);
1277
Wanpeng Lid5361672020-03-26 10:20:02 +08001278void kvm_apic_send_ipi(struct kvm_lapic *apic, u32 icr_low, u32 icr_high)
Eddie Dong97222cc2007-09-12 10:58:04 +03001279{
Gleb Natapov58c2dde2009-03-05 16:35:04 +02001280 struct kvm_lapic_irq irq;
Eddie Dong97222cc2007-09-12 10:58:04 +03001281
Gleb Natapov58c2dde2009-03-05 16:35:04 +02001282 irq.vector = icr_low & APIC_VECTOR_MASK;
1283 irq.delivery_mode = icr_low & APIC_MODE_MASK;
1284 irq.dest_mode = icr_low & APIC_DEST_MASK;
Paolo Bonzinib7cb2232015-04-21 14:57:05 +02001285 irq.level = (icr_low & APIC_INT_ASSERT) != 0;
Gleb Natapov58c2dde2009-03-05 16:35:04 +02001286 irq.trig_mode = icr_low & APIC_INT_LEVELTRIG;
1287 irq.shorthand = icr_low & APIC_SHORT_MASK;
James Sullivan93bbf0b2015-03-18 19:26:03 -06001288 irq.msi_redir_hint = false;
Gleb Natapov0105d1a2009-07-05 17:39:36 +03001289 if (apic_x2apic_mode(apic))
1290 irq.dest_id = icr_high;
1291 else
1292 irq.dest_id = GET_APIC_DEST_FIELD(icr_high);
Eddie Dong97222cc2007-09-12 10:58:04 +03001293
Gleb Natapov1000ff82009-07-07 16:00:57 +03001294 trace_kvm_apic_ipi(icr_low, irq.dest_id);
1295
Yang Zhangb4f22252013-04-11 19:21:37 +08001296 kvm_irq_delivery_to_apic(apic->vcpu->kvm, apic, &irq, NULL);
Eddie Dong97222cc2007-09-12 10:58:04 +03001297}
1298
1299static u32 apic_get_tmcct(struct kvm_lapic *apic)
1300{
Wanpeng Li8003c9a2016-10-24 18:23:13 +08001301 ktime_t remaining, now;
Marcelo Tosattib682b812009-02-10 20:41:41 -02001302 s64 ns;
Kevin Pedretti9da8f4e2007-10-21 08:55:50 +02001303 u32 tmcct;
Eddie Dong97222cc2007-09-12 10:58:04 +03001304
1305 ASSERT(apic != NULL);
1306
Kevin Pedretti9da8f4e2007-10-21 08:55:50 +02001307 /* if initial count is 0, current count should also be 0 */
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05001308 if (kvm_lapic_get_reg(apic, APIC_TMICT) == 0 ||
Andy Honigb963a222013-11-19 14:12:18 -08001309 apic->lapic_timer.period == 0)
Kevin Pedretti9da8f4e2007-10-21 08:55:50 +02001310 return 0;
1311
Paolo Bonzini55878592016-10-25 15:23:49 +02001312 now = ktime_get();
Wanpeng Li8003c9a2016-10-24 18:23:13 +08001313 remaining = ktime_sub(apic->lapic_timer.target_expiration, now);
Marcelo Tosattib682b812009-02-10 20:41:41 -02001314 if (ktime_to_ns(remaining) < 0)
Thomas Gleixner8b0e1952016-12-25 12:30:41 +01001315 remaining = 0;
Eddie Dong97222cc2007-09-12 10:58:04 +03001316
Marcelo Tosattid3c7b772009-02-23 10:57:41 -03001317 ns = mod_64(ktime_to_ns(remaining), apic->lapic_timer.period);
1318 tmcct = div64_u64(ns,
1319 (APIC_BUS_CYCLE_NS * apic->divide_count));
Eddie Dong97222cc2007-09-12 10:58:04 +03001320
1321 return tmcct;
1322}
1323
Avi Kivityb209749f2007-10-22 16:50:39 +02001324static void __report_tpr_access(struct kvm_lapic *apic, bool write)
1325{
1326 struct kvm_vcpu *vcpu = apic->vcpu;
1327 struct kvm_run *run = vcpu->run;
1328
Avi Kivitya8eeb042010-05-10 12:34:53 +03001329 kvm_make_request(KVM_REQ_REPORT_TPR_ACCESS, vcpu);
Marcelo Tosatti5fdbf972008-06-27 14:58:02 -03001330 run->tpr_access.rip = kvm_rip_read(vcpu);
Avi Kivityb209749f2007-10-22 16:50:39 +02001331 run->tpr_access.is_write = write;
1332}
1333
1334static inline void report_tpr_access(struct kvm_lapic *apic, bool write)
1335{
1336 if (apic->vcpu->arch.tpr_access_reporting)
1337 __report_tpr_access(apic, write);
1338}
1339
Eddie Dong97222cc2007-09-12 10:58:04 +03001340static u32 __apic_read(struct kvm_lapic *apic, unsigned int offset)
1341{
1342 u32 val = 0;
1343
1344 if (offset >= LAPIC_MMIO_LENGTH)
1345 return 0;
1346
1347 switch (offset) {
1348 case APIC_ARBPRI:
Eddie Dong97222cc2007-09-12 10:58:04 +03001349 break;
1350
1351 case APIC_TMCCT: /* Timer CCR */
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +08001352 if (apic_lvtt_tscdeadline(apic))
1353 return 0;
1354
Eddie Dong97222cc2007-09-12 10:58:04 +03001355 val = apic_get_tmcct(apic);
1356 break;
Avi Kivity4a4541a2012-07-22 17:41:00 +03001357 case APIC_PROCPRI:
1358 apic_update_ppr(apic);
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05001359 val = kvm_lapic_get_reg(apic, offset);
Avi Kivity4a4541a2012-07-22 17:41:00 +03001360 break;
Avi Kivityb209749f2007-10-22 16:50:39 +02001361 case APIC_TASKPRI:
1362 report_tpr_access(apic, false);
Gustavo A. R. Silvadf561f662020-08-23 17:36:59 -05001363 fallthrough;
Eddie Dong97222cc2007-09-12 10:58:04 +03001364 default:
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05001365 val = kvm_lapic_get_reg(apic, offset);
Eddie Dong97222cc2007-09-12 10:58:04 +03001366 break;
1367 }
1368
1369 return val;
1370}
1371
Gregory Haskinsd76685c42009-06-01 12:54:50 -04001372static inline struct kvm_lapic *to_lapic(struct kvm_io_device *dev)
1373{
1374 return container_of(dev, struct kvm_lapic, dev);
1375}
1376
Paolo Bonzini01402cf2019-07-05 14:57:58 +02001377#define APIC_REG_MASK(reg) (1ull << ((reg) >> 4))
1378#define APIC_REGS_MASK(first, count) \
1379 (APIC_REG_MASK(first) * ((1ull << (count)) - 1))
1380
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05001381int kvm_lapic_reg_read(struct kvm_lapic *apic, u32 offset, int len,
Gleb Natapov0105d1a2009-07-05 17:39:36 +03001382 void *data)
Michael S. Tsirkinbda90202009-06-29 22:24:32 +03001383{
Eddie Dong97222cc2007-09-12 10:58:04 +03001384 unsigned char alignment = offset & 0xf;
1385 u32 result;
Guo Chaod5b0b5b2012-06-28 15:22:57 +08001386 /* this bitmask has a bit cleared for each reserved register */
Paolo Bonzini01402cf2019-07-05 14:57:58 +02001387 u64 valid_reg_mask =
1388 APIC_REG_MASK(APIC_ID) |
1389 APIC_REG_MASK(APIC_LVR) |
1390 APIC_REG_MASK(APIC_TASKPRI) |
1391 APIC_REG_MASK(APIC_PROCPRI) |
1392 APIC_REG_MASK(APIC_LDR) |
1393 APIC_REG_MASK(APIC_DFR) |
1394 APIC_REG_MASK(APIC_SPIV) |
1395 APIC_REGS_MASK(APIC_ISR, APIC_ISR_NR) |
1396 APIC_REGS_MASK(APIC_TMR, APIC_ISR_NR) |
1397 APIC_REGS_MASK(APIC_IRR, APIC_ISR_NR) |
1398 APIC_REG_MASK(APIC_ESR) |
1399 APIC_REG_MASK(APIC_ICR) |
1400 APIC_REG_MASK(APIC_ICR2) |
1401 APIC_REG_MASK(APIC_LVTT) |
1402 APIC_REG_MASK(APIC_LVTTHMR) |
1403 APIC_REG_MASK(APIC_LVTPC) |
1404 APIC_REG_MASK(APIC_LVT0) |
1405 APIC_REG_MASK(APIC_LVT1) |
1406 APIC_REG_MASK(APIC_LVTERR) |
1407 APIC_REG_MASK(APIC_TMICT) |
1408 APIC_REG_MASK(APIC_TMCCT) |
1409 APIC_REG_MASK(APIC_TDCR);
Eddie Dong97222cc2007-09-12 10:58:04 +03001410
Paolo Bonzini01402cf2019-07-05 14:57:58 +02001411 /* ARBPRI is not valid on x2APIC */
1412 if (!apic_x2apic_mode(apic))
1413 valid_reg_mask |= APIC_REG_MASK(APIC_ARBPRI);
Gleb Natapov0105d1a2009-07-05 17:39:36 +03001414
Jim Mattson218bf772021-06-02 13:52:24 -07001415 if (alignment + len > 4)
1416 return 1;
1417
Yi Wang0d888002019-07-06 01:08:48 +08001418 if (offset > 0x3f0 || !(valid_reg_mask & APIC_REG_MASK(offset)))
Gleb Natapov0105d1a2009-07-05 17:39:36 +03001419 return 1;
Gleb Natapov0105d1a2009-07-05 17:39:36 +03001420
Eddie Dong97222cc2007-09-12 10:58:04 +03001421 result = __apic_read(apic, offset & ~0xf);
1422
Marcelo Tosatti229456f2009-06-17 09:22:14 -03001423 trace_kvm_apic_read(offset, result);
1424
Eddie Dong97222cc2007-09-12 10:58:04 +03001425 switch (len) {
1426 case 1:
1427 case 2:
1428 case 4:
1429 memcpy(data, (char *)&result + alignment, len);
1430 break;
1431 default:
1432 printk(KERN_ERR "Local APIC read with len = %x, "
1433 "should be 1,2, or 4 instead\n", len);
1434 break;
1435 }
Michael S. Tsirkinbda90202009-06-29 22:24:32 +03001436 return 0;
Eddie Dong97222cc2007-09-12 10:58:04 +03001437}
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05001438EXPORT_SYMBOL_GPL(kvm_lapic_reg_read);
Eddie Dong97222cc2007-09-12 10:58:04 +03001439
Gleb Natapov0105d1a2009-07-05 17:39:36 +03001440static int apic_mmio_in_range(struct kvm_lapic *apic, gpa_t addr)
1441{
Vitaly Kuznetsovd1766202018-08-02 17:08:16 +02001442 return addr >= apic->base_address &&
1443 addr < apic->base_address + LAPIC_MMIO_LENGTH;
Gleb Natapov0105d1a2009-07-05 17:39:36 +03001444}
1445
Nikolay Nikolaeve32edf42015-03-26 14:39:28 +00001446static int apic_mmio_read(struct kvm_vcpu *vcpu, struct kvm_io_device *this,
Gleb Natapov0105d1a2009-07-05 17:39:36 +03001447 gpa_t address, int len, void *data)
1448{
1449 struct kvm_lapic *apic = to_lapic(this);
1450 u32 offset = address - apic->base_address;
1451
1452 if (!apic_mmio_in_range(apic, address))
1453 return -EOPNOTSUPP;
1454
Vitaly Kuznetsovd1766202018-08-02 17:08:16 +02001455 if (!kvm_apic_hw_enabled(apic) || apic_x2apic_mode(apic)) {
1456 if (!kvm_check_has_quirk(vcpu->kvm,
1457 KVM_X86_QUIRK_LAPIC_MMIO_HOLE))
1458 return -EOPNOTSUPP;
1459
1460 memset(data, 0xff, len);
1461 return 0;
1462 }
1463
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05001464 kvm_lapic_reg_read(apic, offset, len, data);
Gleb Natapov0105d1a2009-07-05 17:39:36 +03001465
1466 return 0;
1467}
1468
Eddie Dong97222cc2007-09-12 10:58:04 +03001469static void update_divide_count(struct kvm_lapic *apic)
1470{
1471 u32 tmp1, tmp2, tdcr;
1472
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05001473 tdcr = kvm_lapic_get_reg(apic, APIC_TDCR);
Eddie Dong97222cc2007-09-12 10:58:04 +03001474 tmp1 = tdcr & 0xf;
1475 tmp2 = ((tmp1 & 0x3) | ((tmp1 & 0x8) >> 1)) + 1;
Marcelo Tosattid3c7b772009-02-23 10:57:41 -03001476 apic->divide_count = 0x1 << (tmp2 & 0x7);
Eddie Dong97222cc2007-09-12 10:58:04 +03001477}
1478
Wanpeng Liccbfa1d2017-10-05 18:54:24 -07001479static void limit_periodic_timer_frequency(struct kvm_lapic *apic)
1480{
1481 /*
1482 * Do not allow the guest to program periodic timers with small
1483 * interval, since the hrtimers are not throttled by the host
1484 * scheduler.
1485 */
Wanpeng Lidedf9c52017-10-05 18:54:25 -07001486 if (apic_lvtt_period(apic) && apic->lapic_timer.period) {
Wanpeng Liccbfa1d2017-10-05 18:54:24 -07001487 s64 min_period = min_timer_period_us * 1000LL;
1488
1489 if (apic->lapic_timer.period < min_period) {
1490 pr_info_ratelimited(
1491 "kvm: vcpu %i: requested %lld ns "
1492 "lapic timer period limited to %lld ns\n",
1493 apic->vcpu->vcpu_id,
1494 apic->lapic_timer.period, min_period);
1495 apic->lapic_timer.period = min_period;
1496 }
1497 }
1498}
1499
Wanpeng Li94be4b82020-03-24 14:32:10 +08001500static void cancel_hv_timer(struct kvm_lapic *apic);
1501
Wanpeng Lie898da72021-06-07 00:19:43 -07001502static void cancel_apic_timer(struct kvm_lapic *apic)
1503{
1504 hrtimer_cancel(&apic->lapic_timer.timer);
1505 preempt_disable();
1506 if (apic->lapic_timer.hv_timer_in_use)
1507 cancel_hv_timer(apic);
1508 preempt_enable();
1509}
1510
Radim Krčmářb6ac0692015-06-05 20:57:41 +02001511static void apic_update_lvtt(struct kvm_lapic *apic)
1512{
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05001513 u32 timer_mode = kvm_lapic_get_reg(apic, APIC_LVTT) &
Radim Krčmářb6ac0692015-06-05 20:57:41 +02001514 apic->lapic_timer.timer_mode_mask;
1515
1516 if (apic->lapic_timer.timer_mode != timer_mode) {
Wanpeng Lic69518c2017-10-05 03:53:51 -07001517 if (apic_lvtt_tscdeadline(apic) != (timer_mode ==
Wanpeng Lidedf9c52017-10-05 18:54:25 -07001518 APIC_LVT_TIMER_TSCDEADLINE)) {
Wanpeng Lie898da72021-06-07 00:19:43 -07001519 cancel_apic_timer(apic);
Radim Krčmář44275932017-10-06 19:25:55 +02001520 kvm_lapic_set_reg(apic, APIC_TMICT, 0);
1521 apic->lapic_timer.period = 0;
1522 apic->lapic_timer.tscdeadline = 0;
Wanpeng Lidedf9c52017-10-05 18:54:25 -07001523 }
Radim Krčmářb6ac0692015-06-05 20:57:41 +02001524 apic->lapic_timer.timer_mode = timer_mode;
Wanpeng Lidedf9c52017-10-05 18:54:25 -07001525 limit_periodic_timer_frequency(apic);
Radim Krčmářb6ac0692015-06-05 20:57:41 +02001526 }
1527}
1528
Marcelo Tosattid0659d92014-12-16 09:08:15 -05001529/*
1530 * On APICv, this test will cause a busy wait
1531 * during a higher-priority task.
1532 */
1533
1534static bool lapic_timer_int_injected(struct kvm_vcpu *vcpu)
1535{
1536 struct kvm_lapic *apic = vcpu->arch.apic;
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05001537 u32 reg = kvm_lapic_get_reg(apic, APIC_LVTT);
Marcelo Tosattid0659d92014-12-16 09:08:15 -05001538
1539 if (kvm_apic_hw_enabled(apic)) {
1540 int vec = reg & APIC_VECTOR_MASK;
Marcelo Tosattif9339862015-02-02 15:26:08 -02001541 void *bitmap = apic->regs + APIC_ISR;
Marcelo Tosattid0659d92014-12-16 09:08:15 -05001542
Andrey Smetanind62caab2015-11-10 15:36:33 +03001543 if (vcpu->arch.apicv_active)
Marcelo Tosattif9339862015-02-02 15:26:08 -02001544 bitmap = apic->regs + APIC_IRR;
1545
1546 if (apic_test_vector(vec, bitmap))
1547 return true;
Marcelo Tosattid0659d92014-12-16 09:08:15 -05001548 }
1549 return false;
1550}
1551
Sean Christophersonb6aa57c2019-04-17 10:15:34 -07001552static inline void __wait_lapic_expire(struct kvm_vcpu *vcpu, u64 guest_cycles)
1553{
1554 u64 timer_advance_ns = vcpu->arch.apic->lapic_timer.timer_advance_ns;
1555
1556 /*
1557 * If the guest TSC is running at a different ratio than the host, then
1558 * convert the delay to nanoseconds to achieve an accurate delay. Note
1559 * that __delay() uses delay_tsc whenever the hardware has TSC, thus
1560 * always for VMX enabled hardware.
1561 */
1562 if (vcpu->arch.tsc_scaling_ratio == kvm_default_tsc_scaling_ratio) {
1563 __delay(min(guest_cycles,
1564 nsec_to_cycles(vcpu, timer_advance_ns)));
1565 } else {
1566 u64 delay_ns = guest_cycles * 1000000ULL;
1567 do_div(delay_ns, vcpu->arch.virtual_tsc_khz);
1568 ndelay(min_t(u32, delay_ns, timer_advance_ns));
1569 }
1570}
1571
Wanpeng Li84ea3ac2019-05-20 16:18:05 +08001572static inline void adjust_lapic_timer_advance(struct kvm_vcpu *vcpu,
Wanpeng Liec0671d2019-05-20 16:18:08 +08001573 s64 advance_expire_delta)
Marcelo Tosattid0659d92014-12-16 09:08:15 -05001574{
1575 struct kvm_lapic *apic = vcpu->arch.apic;
Sean Christopherson39497d72019-04-17 10:15:32 -07001576 u32 timer_advance_ns = apic->lapic_timer.timer_advance_ns;
Wanpeng Li84ea3ac2019-05-20 16:18:05 +08001577 u64 ns;
1578
Wanpeng Lid0f5a862019-09-17 16:16:26 +08001579 /* Do not adjust for tiny fluctuations or large random spikes. */
1580 if (abs(advance_expire_delta) > LAPIC_TIMER_ADVANCE_ADJUST_MAX ||
1581 abs(advance_expire_delta) < LAPIC_TIMER_ADVANCE_ADJUST_MIN)
1582 return;
1583
Wanpeng Li84ea3ac2019-05-20 16:18:05 +08001584 /* too early */
Wanpeng Liec0671d2019-05-20 16:18:08 +08001585 if (advance_expire_delta < 0) {
1586 ns = -advance_expire_delta * 1000000ULL;
Wanpeng Li84ea3ac2019-05-20 16:18:05 +08001587 do_div(ns, vcpu->arch.virtual_tsc_khz);
Wanpeng Lid0f5a862019-09-17 16:16:26 +08001588 timer_advance_ns -= ns/LAPIC_TIMER_ADVANCE_ADJUST_STEP;
Wanpeng Li84ea3ac2019-05-20 16:18:05 +08001589 } else {
1590 /* too late */
Wanpeng Liec0671d2019-05-20 16:18:08 +08001591 ns = advance_expire_delta * 1000000ULL;
Wanpeng Li84ea3ac2019-05-20 16:18:05 +08001592 do_div(ns, vcpu->arch.virtual_tsc_khz);
Wanpeng Lid0f5a862019-09-17 16:16:26 +08001593 timer_advance_ns += ns/LAPIC_TIMER_ADVANCE_ADJUST_STEP;
Wanpeng Li84ea3ac2019-05-20 16:18:05 +08001594 }
1595
Wanpeng Lia0f00372019-09-26 08:54:03 +08001596 if (unlikely(timer_advance_ns > LAPIC_TIMER_ADVANCE_NS_MAX))
1597 timer_advance_ns = LAPIC_TIMER_ADVANCE_NS_INIT;
Wanpeng Li84ea3ac2019-05-20 16:18:05 +08001598 apic->lapic_timer.timer_advance_ns = timer_advance_ns;
1599}
1600
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08001601static void __kvm_wait_lapic_expire(struct kvm_vcpu *vcpu)
Wanpeng Li84ea3ac2019-05-20 16:18:05 +08001602{
1603 struct kvm_lapic *apic = vcpu->arch.apic;
1604 u64 guest_tsc, tsc_deadline;
Marcelo Tosattid0659d92014-12-16 09:08:15 -05001605
Marcelo Tosattid0659d92014-12-16 09:08:15 -05001606 tsc_deadline = apic->lapic_timer.expired_tscdeadline;
1607 apic->lapic_timer.expired_tscdeadline = 0;
Haozhong Zhang4ba76532015-10-20 15:39:07 +08001608 guest_tsc = kvm_read_l1_tsc(vcpu, rdtsc());
Wanpeng Liec0671d2019-05-20 16:18:08 +08001609 apic->lapic_timer.advance_expire_delta = guest_tsc - tsc_deadline;
Marcelo Tosattid0659d92014-12-16 09:08:15 -05001610
Wanpeng Li9805cf02021-05-18 05:00:35 -07001611 if (lapic_timer_advance_dynamic) {
1612 adjust_lapic_timer_advance(vcpu, apic->lapic_timer.advance_expire_delta);
1613 /*
1614 * If the timer fired early, reread the TSC to account for the
1615 * overhead of the above adjustment to avoid waiting longer
1616 * than is necessary.
1617 */
1618 if (guest_tsc < tsc_deadline)
1619 guest_tsc = kvm_read_l1_tsc(vcpu, rdtsc());
1620 }
1621
Marcelo Tosattid0659d92014-12-16 09:08:15 -05001622 if (guest_tsc < tsc_deadline)
Sean Christophersonb6aa57c2019-04-17 10:15:34 -07001623 __wait_lapic_expire(vcpu, tsc_deadline - guest_tsc);
Radim Krčmář5d87db72014-10-10 19:15:08 +02001624}
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08001625
1626void kvm_wait_lapic_expire(struct kvm_vcpu *vcpu)
1627{
Wanpeng Li010fd372020-09-10 17:50:41 +08001628 if (lapic_in_kernel(vcpu) &&
1629 vcpu->arch.apic->lapic_timer.expired_tscdeadline &&
1630 vcpu->arch.apic->lapic_timer.timer_advance_ns &&
1631 lapic_timer_int_injected(vcpu))
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08001632 __kvm_wait_lapic_expire(vcpu);
1633}
Wanpeng Lib6c4bc62019-05-20 16:18:09 +08001634EXPORT_SYMBOL_GPL(kvm_wait_lapic_expire);
Radim Krčmář5d87db72014-10-10 19:15:08 +02001635
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08001636static void kvm_apic_inject_pending_timer_irqs(struct kvm_lapic *apic)
1637{
1638 struct kvm_timer *ktimer = &apic->lapic_timer;
1639
1640 kvm_apic_local_deliver(apic, APIC_LVTT);
Haiwei Li17ac43a2020-01-16 16:50:21 +08001641 if (apic_lvtt_tscdeadline(apic)) {
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08001642 ktimer->tscdeadline = 0;
Haiwei Li17ac43a2020-01-16 16:50:21 +08001643 } else if (apic_lvtt_oneshot(apic)) {
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08001644 ktimer->tscdeadline = 0;
1645 ktimer->target_expiration = 0;
1646 }
1647}
1648
Wanpeng Liae95f562020-04-28 14:23:28 +08001649static void apic_timer_expired(struct kvm_lapic *apic, bool from_timer_fn)
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08001650{
1651 struct kvm_vcpu *vcpu = apic->vcpu;
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08001652 struct kvm_timer *ktimer = &apic->lapic_timer;
1653
1654 if (atomic_read(&apic->lapic_timer.pending))
1655 return;
1656
1657 if (apic_lvtt_tscdeadline(apic) || ktimer->hv_timer_in_use)
1658 ktimer->expired_tscdeadline = ktimer->tscdeadline;
1659
Wanpeng Liae95f562020-04-28 14:23:28 +08001660 if (!from_timer_fn && vcpu->arch.apicv_active) {
1661 WARN_ON(kvm_get_running_vcpu() != vcpu);
1662 kvm_apic_inject_pending_timer_irqs(apic);
1663 return;
1664 }
1665
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08001666 if (kvm_use_posted_timer_interrupt(apic->vcpu)) {
Sean Christophersonbeda4302021-03-04 18:18:08 -08001667 /*
1668 * Ensure the guest's timer has truly expired before posting an
1669 * interrupt. Open code the relevant checks to avoid querying
1670 * lapic_timer_int_injected(), which will be false since the
1671 * interrupt isn't yet injected. Waiting until after injecting
1672 * is not an option since that won't help a posted interrupt.
1673 */
1674 if (vcpu->arch.apic->lapic_timer.expired_tscdeadline &&
1675 vcpu->arch.apic->lapic_timer.timer_advance_ns)
1676 __kvm_wait_lapic_expire(vcpu);
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08001677 kvm_apic_inject_pending_timer_irqs(apic);
1678 return;
1679 }
1680
1681 atomic_inc(&apic->lapic_timer.pending);
Marcelo Tosatti084071d2021-05-25 10:41:17 -03001682 kvm_make_request(KVM_REQ_UNBLOCK, vcpu);
Wanpeng Li68ca76632020-09-10 17:50:40 +08001683 if (from_timer_fn)
1684 kvm_vcpu_kick(vcpu);
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08001685}
1686
Yunhong Jiang53f9eed2016-06-13 14:20:00 -07001687static void start_sw_tscdeadline(struct kvm_lapic *apic)
1688{
Sean Christopherson39497d72019-04-17 10:15:32 -07001689 struct kvm_timer *ktimer = &apic->lapic_timer;
1690 u64 guest_tsc, tscdeadline = ktimer->tscdeadline;
Yunhong Jiang53f9eed2016-06-13 14:20:00 -07001691 u64 ns = 0;
1692 ktime_t expire;
1693 struct kvm_vcpu *vcpu = apic->vcpu;
1694 unsigned long this_tsc_khz = vcpu->arch.virtual_tsc_khz;
1695 unsigned long flags;
1696 ktime_t now;
1697
1698 if (unlikely(!tscdeadline || !this_tsc_khz))
1699 return;
1700
1701 local_irq_save(flags);
1702
Paolo Bonzini55878592016-10-25 15:23:49 +02001703 now = ktime_get();
Yunhong Jiang53f9eed2016-06-13 14:20:00 -07001704 guest_tsc = kvm_read_l1_tsc(vcpu, rdtsc());
Liran Alonc09d65d2019-04-16 20:36:34 +03001705
1706 ns = (tscdeadline - guest_tsc) * 1000000ULL;
1707 do_div(ns, this_tsc_khz);
1708
1709 if (likely(tscdeadline > guest_tsc) &&
Sean Christopherson39497d72019-04-17 10:15:32 -07001710 likely(ns > apic->lapic_timer.timer_advance_ns)) {
Yunhong Jiang53f9eed2016-06-13 14:20:00 -07001711 expire = ktime_add_ns(now, ns);
Sean Christopherson39497d72019-04-17 10:15:32 -07001712 expire = ktime_sub_ns(expire, ktimer->timer_advance_ns);
Sebastian Andrzej Siewior2c0d2782019-07-26 20:30:55 +02001713 hrtimer_start(&ktimer->timer, expire, HRTIMER_MODE_ABS_HARD);
Yunhong Jiang53f9eed2016-06-13 14:20:00 -07001714 } else
Wanpeng Liae95f562020-04-28 14:23:28 +08001715 apic_timer_expired(apic, false);
Yunhong Jiang53f9eed2016-06-13 14:20:00 -07001716
1717 local_irq_restore(flags);
1718}
1719
Peter Shier24647e02018-10-10 15:56:53 -07001720static inline u64 tmict_to_ns(struct kvm_lapic *apic, u32 tmict)
1721{
1722 return (u64)tmict * APIC_BUS_CYCLE_NS * (u64)apic->divide_count;
1723}
1724
Wanpeng Lic301b902017-10-06 07:38:32 -07001725static void update_target_expiration(struct kvm_lapic *apic, uint32_t old_divisor)
1726{
1727 ktime_t now, remaining;
1728 u64 ns_remaining_old, ns_remaining_new;
1729
Peter Shier24647e02018-10-10 15:56:53 -07001730 apic->lapic_timer.period =
1731 tmict_to_ns(apic, kvm_lapic_get_reg(apic, APIC_TMICT));
Wanpeng Lic301b902017-10-06 07:38:32 -07001732 limit_periodic_timer_frequency(apic);
1733
1734 now = ktime_get();
1735 remaining = ktime_sub(apic->lapic_timer.target_expiration, now);
1736 if (ktime_to_ns(remaining) < 0)
1737 remaining = 0;
1738
1739 ns_remaining_old = ktime_to_ns(remaining);
1740 ns_remaining_new = mul_u64_u32_div(ns_remaining_old,
1741 apic->divide_count, old_divisor);
1742
1743 apic->lapic_timer.tscdeadline +=
1744 nsec_to_cycles(apic->vcpu, ns_remaining_new) -
1745 nsec_to_cycles(apic->vcpu, ns_remaining_old);
1746 apic->lapic_timer.target_expiration = ktime_add_ns(now, ns_remaining_new);
1747}
1748
Peter Shier24647e02018-10-10 15:56:53 -07001749static bool set_target_expiration(struct kvm_lapic *apic, u32 count_reg)
Wanpeng Li8003c9a2016-10-24 18:23:13 +08001750{
1751 ktime_t now;
1752 u64 tscl = rdtsc();
Peter Shier24647e02018-10-10 15:56:53 -07001753 s64 deadline;
Wanpeng Li8003c9a2016-10-24 18:23:13 +08001754
Paolo Bonzini55878592016-10-25 15:23:49 +02001755 now = ktime_get();
Peter Shier24647e02018-10-10 15:56:53 -07001756 apic->lapic_timer.period =
1757 tmict_to_ns(apic, kvm_lapic_get_reg(apic, APIC_TMICT));
Wanpeng Li8003c9a2016-10-24 18:23:13 +08001758
Radim Krčmář5d74a692017-10-06 19:25:54 +02001759 if (!apic->lapic_timer.period) {
1760 apic->lapic_timer.tscdeadline = 0;
Wanpeng Li8003c9a2016-10-24 18:23:13 +08001761 return false;
Wanpeng Li7d7f7da2016-10-24 18:23:09 +08001762 }
1763
Wanpeng Liccbfa1d2017-10-05 18:54:24 -07001764 limit_periodic_timer_frequency(apic);
Peter Shier24647e02018-10-10 15:56:53 -07001765 deadline = apic->lapic_timer.period;
1766
1767 if (apic_lvtt_period(apic) || apic_lvtt_oneshot(apic)) {
1768 if (unlikely(count_reg != APIC_TMICT)) {
1769 deadline = tmict_to_ns(apic,
1770 kvm_lapic_get_reg(apic, count_reg));
1771 if (unlikely(deadline <= 0))
1772 deadline = apic->lapic_timer.period;
1773 else if (unlikely(deadline > apic->lapic_timer.period)) {
1774 pr_info_ratelimited(
1775 "kvm: vcpu %i: requested lapic timer restore with "
1776 "starting count register %#x=%u (%lld ns) > initial count (%lld ns). "
1777 "Using initial count to start timer.\n",
1778 apic->vcpu->vcpu_id,
1779 count_reg,
1780 kvm_lapic_get_reg(apic, count_reg),
1781 deadline, apic->lapic_timer.period);
1782 kvm_lapic_set_reg(apic, count_reg, 0);
1783 deadline = apic->lapic_timer.period;
1784 }
1785 }
1786 }
Wanpeng Li7d7f7da2016-10-24 18:23:09 +08001787
Wanpeng Li8003c9a2016-10-24 18:23:13 +08001788 apic->lapic_timer.tscdeadline = kvm_read_l1_tsc(apic->vcpu, tscl) +
Peter Shier24647e02018-10-10 15:56:53 -07001789 nsec_to_cycles(apic->vcpu, deadline);
1790 apic->lapic_timer.target_expiration = ktime_add_ns(now, deadline);
Wanpeng Li8003c9a2016-10-24 18:23:13 +08001791
1792 return true;
1793}
1794
1795static void advance_periodic_target_expiration(struct kvm_lapic *apic)
1796{
David Vrabeld8f2f492018-05-18 16:55:46 +01001797 ktime_t now = ktime_get();
1798 u64 tscl = rdtsc();
1799 ktime_t delta;
1800
1801 /*
1802 * Synchronize both deadlines to the same time source or
1803 * differences in the periods (caused by differences in the
1804 * underlying clocks or numerical approximation errors) will
1805 * cause the two to drift apart over time as the errors
1806 * accumulate.
1807 */
Wanpeng Li8003c9a2016-10-24 18:23:13 +08001808 apic->lapic_timer.target_expiration =
1809 ktime_add_ns(apic->lapic_timer.target_expiration,
1810 apic->lapic_timer.period);
David Vrabeld8f2f492018-05-18 16:55:46 +01001811 delta = ktime_sub(apic->lapic_timer.target_expiration, now);
1812 apic->lapic_timer.tscdeadline = kvm_read_l1_tsc(apic->vcpu, tscl) +
1813 nsec_to_cycles(apic->vcpu, delta);
Wanpeng Li7d7f7da2016-10-24 18:23:09 +08001814}
1815
Anthoine Bourgeoisecf08da2018-04-29 22:05:58 +00001816static void start_sw_period(struct kvm_lapic *apic)
1817{
1818 if (!apic->lapic_timer.period)
1819 return;
1820
1821 if (ktime_after(ktime_get(),
1822 apic->lapic_timer.target_expiration)) {
Wanpeng Liae95f562020-04-28 14:23:28 +08001823 apic_timer_expired(apic, false);
Anthoine Bourgeoisecf08da2018-04-29 22:05:58 +00001824
1825 if (apic_lvtt_oneshot(apic))
1826 return;
1827
1828 advance_periodic_target_expiration(apic);
1829 }
1830
1831 hrtimer_start(&apic->lapic_timer.timer,
1832 apic->lapic_timer.target_expiration,
He Zheedec6e02020-03-20 15:06:07 +08001833 HRTIMER_MODE_ABS_HARD);
Anthoine Bourgeoisecf08da2018-04-29 22:05:58 +00001834}
1835
Yunhong Jiangce7a0582016-06-13 14:20:01 -07001836bool kvm_lapic_hv_timer_in_use(struct kvm_vcpu *vcpu)
1837{
Wanpeng Li91005302016-08-03 12:04:12 +08001838 if (!lapic_in_kernel(vcpu))
1839 return false;
1840
Yunhong Jiangce7a0582016-06-13 14:20:01 -07001841 return vcpu->arch.apic->lapic_timer.hv_timer_in_use;
1842}
1843EXPORT_SYMBOL_GPL(kvm_lapic_hv_timer_in_use);
1844
Wanpeng Li7e810a32016-10-24 18:23:12 +08001845static void cancel_hv_timer(struct kvm_lapic *apic)
Wanpeng Libd97ad02016-06-30 08:52:49 +08001846{
Wanpeng Li1d518c62017-07-25 00:43:15 -07001847 WARN_ON(preemptible());
Paolo Bonzinia749e242017-06-29 17:14:50 +02001848 WARN_ON(!apic->lapic_timer.hv_timer_in_use);
Jason Baronb36464772021-01-14 22:27:56 -05001849 static_call(kvm_x86_cancel_hv_timer)(apic->vcpu);
Wanpeng Libd97ad02016-06-30 08:52:49 +08001850 apic->lapic_timer.hv_timer_in_use = false;
1851}
1852
Paolo Bonzinia749e242017-06-29 17:14:50 +02001853static bool start_hv_timer(struct kvm_lapic *apic)
Paolo Bonzini35ee9e42017-06-29 17:14:50 +02001854{
1855 struct kvm_timer *ktimer = &apic->lapic_timer;
Sean Christophersonf9927982019-04-16 13:32:46 -07001856 struct kvm_vcpu *vcpu = apic->vcpu;
1857 bool expired;
Paolo Bonzini35ee9e42017-06-29 17:14:50 +02001858
Wanpeng Li1d518c62017-07-25 00:43:15 -07001859 WARN_ON(preemptible());
Paolo Bonzini199a8b82020-05-05 06:45:35 -04001860 if (!kvm_can_use_hv_timer(vcpu))
Paolo Bonzinia749e242017-06-29 17:14:50 +02001861 return false;
1862
Radim Krčmář86bbc1e2017-10-06 19:25:53 +02001863 if (!ktimer->tscdeadline)
1864 return false;
1865
Jason Baronb36464772021-01-14 22:27:56 -05001866 if (static_call(kvm_x86_set_hv_timer)(vcpu, ktimer->tscdeadline, &expired))
Paolo Bonzini35ee9e42017-06-29 17:14:50 +02001867 return false;
1868
1869 ktimer->hv_timer_in_use = true;
1870 hrtimer_cancel(&ktimer->timer);
1871
1872 /*
Sean Christophersonf1ba5cf2019-04-16 13:32:45 -07001873 * To simplify handling the periodic timer, leave the hv timer running
1874 * even if the deadline timer has expired, i.e. rely on the resulting
1875 * VM-Exit to recompute the periodic timer's target expiration.
Paolo Bonzini35ee9e42017-06-29 17:14:50 +02001876 */
Sean Christophersonf1ba5cf2019-04-16 13:32:45 -07001877 if (!apic_lvtt_period(apic)) {
1878 /*
1879 * Cancel the hv timer if the sw timer fired while the hv timer
1880 * was being programmed, or if the hv timer itself expired.
1881 */
1882 if (atomic_read(&ktimer->pending)) {
1883 cancel_hv_timer(apic);
Sean Christophersonf9927982019-04-16 13:32:46 -07001884 } else if (expired) {
Wanpeng Liae95f562020-04-28 14:23:28 +08001885 apic_timer_expired(apic, false);
Sean Christophersonf1ba5cf2019-04-16 13:32:45 -07001886 cancel_hv_timer(apic);
1887 }
Wanpeng Lic8533542017-06-29 06:28:09 -07001888 }
Paolo Bonzinia749e242017-06-29 17:14:50 +02001889
Sean Christophersonf9927982019-04-16 13:32:46 -07001890 trace_kvm_hv_timer_state(vcpu->vcpu_id, ktimer->hv_timer_in_use);
Sean Christophersonf1ba5cf2019-04-16 13:32:45 -07001891
Paolo Bonzini35ee9e42017-06-29 17:14:50 +02001892 return true;
1893}
1894
Paolo Bonzinia749e242017-06-29 17:14:50 +02001895static void start_sw_timer(struct kvm_lapic *apic)
Wanpeng Li196f20c2016-06-28 14:54:19 +08001896{
Paolo Bonzinia749e242017-06-29 17:14:50 +02001897 struct kvm_timer *ktimer = &apic->lapic_timer;
Wanpeng Li1d518c62017-07-25 00:43:15 -07001898
1899 WARN_ON(preemptible());
Paolo Bonzinia749e242017-06-29 17:14:50 +02001900 if (apic->lapic_timer.hv_timer_in_use)
1901 cancel_hv_timer(apic);
1902 if (!apic_lvtt_period(apic) && atomic_read(&ktimer->pending))
1903 return;
Paolo Bonzini35ee9e42017-06-29 17:14:50 +02001904
Paolo Bonzinia749e242017-06-29 17:14:50 +02001905 if (apic_lvtt_period(apic) || apic_lvtt_oneshot(apic))
1906 start_sw_period(apic);
1907 else if (apic_lvtt_tscdeadline(apic))
1908 start_sw_tscdeadline(apic);
1909 trace_kvm_hv_timer_state(apic->vcpu->vcpu_id, false);
1910}
1911
1912static void restart_apic_timer(struct kvm_lapic *apic)
1913{
Wanpeng Li1d518c62017-07-25 00:43:15 -07001914 preempt_disable();
Sean Christopherson4ca88b32019-04-16 13:32:47 -07001915
1916 if (!apic_lvtt_period(apic) && atomic_read(&apic->lapic_timer.pending))
1917 goto out;
1918
Paolo Bonzinia749e242017-06-29 17:14:50 +02001919 if (!start_hv_timer(apic))
1920 start_sw_timer(apic);
Sean Christopherson4ca88b32019-04-16 13:32:47 -07001921out:
Wanpeng Li1d518c62017-07-25 00:43:15 -07001922 preempt_enable();
Wanpeng Li196f20c2016-06-28 14:54:19 +08001923}
1924
Eddie Dong97222cc2007-09-12 10:58:04 +03001925void kvm_lapic_expired_hv_timer(struct kvm_vcpu *vcpu)
1926{
1927 struct kvm_lapic *apic = vcpu->arch.apic;
1928
Wanpeng Li1d518c62017-07-25 00:43:15 -07001929 preempt_disable();
1930 /* If the preempt notifier has already run, it also called apic_timer_expired */
1931 if (!apic->lapic_timer.hv_timer_in_use)
1932 goto out;
Sean Christophersond92a5d12021-10-08 19:12:12 -07001933 WARN_ON(kvm_vcpu_is_blocking(vcpu));
Wanpeng Liae95f562020-04-28 14:23:28 +08001934 apic_timer_expired(apic, false);
Wanpeng Lid981dd12021-04-28 19:08:02 +08001935 cancel_hv_timer(apic);
Wanpeng Li8003c9a2016-10-24 18:23:13 +08001936
1937 if (apic_lvtt_period(apic) && apic->lapic_timer.period) {
1938 advance_periodic_target_expiration(apic);
Paolo Bonzinia749e242017-06-29 17:14:50 +02001939 restart_apic_timer(apic);
Wanpeng Li8003c9a2016-10-24 18:23:13 +08001940 }
Wanpeng Li1d518c62017-07-25 00:43:15 -07001941out:
1942 preempt_enable();
Eddie Dong97222cc2007-09-12 10:58:04 +03001943}
1944EXPORT_SYMBOL_GPL(kvm_lapic_expired_hv_timer);
1945
Yunhong Jiangce7a0582016-06-13 14:20:01 -07001946void kvm_lapic_switch_to_hv_timer(struct kvm_vcpu *vcpu)
1947{
Paolo Bonzinia749e242017-06-29 17:14:50 +02001948 restart_apic_timer(vcpu->arch.apic);
Yunhong Jiangce7a0582016-06-13 14:20:01 -07001949}
1950EXPORT_SYMBOL_GPL(kvm_lapic_switch_to_hv_timer);
1951
1952void kvm_lapic_switch_to_sw_timer(struct kvm_vcpu *vcpu)
1953{
1954 struct kvm_lapic *apic = vcpu->arch.apic;
1955
Wanpeng Li1d518c62017-07-25 00:43:15 -07001956 preempt_disable();
Yunhong Jiangce7a0582016-06-13 14:20:01 -07001957 /* Possibly the TSC deadline timer is not enabled yet */
Paolo Bonzinia749e242017-06-29 17:14:50 +02001958 if (apic->lapic_timer.hv_timer_in_use)
1959 start_sw_timer(apic);
Wanpeng Li1d518c62017-07-25 00:43:15 -07001960 preempt_enable();
Yunhong Jiangce7a0582016-06-13 14:20:01 -07001961}
1962EXPORT_SYMBOL_GPL(kvm_lapic_switch_to_sw_timer);
1963
Paolo Bonzinia749e242017-06-29 17:14:50 +02001964void kvm_lapic_restart_hv_timer(struct kvm_vcpu *vcpu)
1965{
1966 struct kvm_lapic *apic = vcpu->arch.apic;
1967
1968 WARN_ON(!apic->lapic_timer.hv_timer_in_use);
1969 restart_apic_timer(apic);
1970}
1971
Peter Shier24647e02018-10-10 15:56:53 -07001972static void __start_apic_timer(struct kvm_lapic *apic, u32 count_reg)
Eddie Dong97222cc2007-09-12 10:58:04 +03001973{
Marcelo Tosattid3c7b772009-02-23 10:57:41 -03001974 atomic_set(&apic->lapic_timer.pending, 0);
Avi Kivity0b975a32008-02-24 14:37:50 +02001975
Paolo Bonzinia749e242017-06-29 17:14:50 +02001976 if ((apic_lvtt_period(apic) || apic_lvtt_oneshot(apic))
Peter Shier24647e02018-10-10 15:56:53 -07001977 && !set_target_expiration(apic, count_reg))
Paolo Bonzinia749e242017-06-29 17:14:50 +02001978 return;
1979
1980 restart_apic_timer(apic);
Eddie Dong97222cc2007-09-12 10:58:04 +03001981}
1982
Peter Shier24647e02018-10-10 15:56:53 -07001983static void start_apic_timer(struct kvm_lapic *apic)
1984{
1985 __start_apic_timer(apic, APIC_TMICT);
1986}
1987
Jan Kiszkacc6e4622008-10-20 10:20:03 +02001988static void apic_manage_nmi_watchdog(struct kvm_lapic *apic, u32 lvt0_val)
1989{
Radim Krčmář59fd1322015-06-30 22:19:16 +02001990 bool lvt0_in_nmi_mode = apic_lvt_nmi_mode(lvt0_val);
Jan Kiszkacc6e4622008-10-20 10:20:03 +02001991
Radim Krčmář59fd1322015-06-30 22:19:16 +02001992 if (apic->lvt0_in_nmi_mode != lvt0_in_nmi_mode) {
1993 apic->lvt0_in_nmi_mode = lvt0_in_nmi_mode;
1994 if (lvt0_in_nmi_mode) {
Radim Krčmář42720132015-07-01 15:31:49 +02001995 atomic_inc(&apic->vcpu->kvm->arch.vapics_in_nmi_mode);
Radim Krčmář59fd1322015-06-30 22:19:16 +02001996 } else
1997 atomic_dec(&apic->vcpu->kvm->arch.vapics_in_nmi_mode);
1998 }
Jan Kiszkacc6e4622008-10-20 10:20:03 +02001999}
2000
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002001int kvm_lapic_reg_write(struct kvm_lapic *apic, u32 reg, u32 val)
Eddie Dong97222cc2007-09-12 10:58:04 +03002002{
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002003 int ret = 0;
Eddie Dong97222cc2007-09-12 10:58:04 +03002004
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002005 trace_kvm_apic_write(reg, val);
Eddie Dong97222cc2007-09-12 10:58:04 +03002006
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002007 switch (reg) {
Eddie Dong97222cc2007-09-12 10:58:04 +03002008 case APIC_ID: /* Local APIC ID */
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002009 if (!apic_x2apic_mode(apic))
Radim Krčmářa92e2542016-07-12 22:09:22 +02002010 kvm_apic_set_xapic_id(apic, val >> 24);
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002011 else
2012 ret = 1;
Eddie Dong97222cc2007-09-12 10:58:04 +03002013 break;
2014
2015 case APIC_TASKPRI:
Avi Kivityb209749f2007-10-22 16:50:39 +02002016 report_tpr_access(apic, true);
Eddie Dong97222cc2007-09-12 10:58:04 +03002017 apic_set_tpr(apic, val & 0xff);
2018 break;
2019
2020 case APIC_EOI:
2021 apic_set_eoi(apic);
2022 break;
2023
2024 case APIC_LDR:
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002025 if (!apic_x2apic_mode(apic))
Gleb Natapov1e08ec42012-09-13 17:19:24 +03002026 kvm_apic_set_ldr(apic, val & APIC_LDR_MASK);
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002027 else
2028 ret = 1;
Eddie Dong97222cc2007-09-12 10:58:04 +03002029 break;
2030
2031 case APIC_DFR:
Wanpeng Liae6f2492020-08-19 16:55:26 +08002032 if (!apic_x2apic_mode(apic))
2033 kvm_apic_set_dfr(apic, val | 0x0FFFFFFF);
2034 else
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002035 ret = 1;
Eddie Dong97222cc2007-09-12 10:58:04 +03002036 break;
2037
Gleb Natapovfc61b802009-07-05 17:39:35 +03002038 case APIC_SPIV: {
2039 u32 mask = 0x3ff;
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05002040 if (kvm_lapic_get_reg(apic, APIC_LVR) & APIC_LVR_DIRECTED_EOI)
Gleb Natapovfc61b802009-07-05 17:39:35 +03002041 mask |= APIC_SPIV_DIRECTED_EOI;
Gleb Natapovf8c1ea12012-08-05 15:58:31 +03002042 apic_set_spiv(apic, val & mask);
Eddie Dong97222cc2007-09-12 10:58:04 +03002043 if (!(val & APIC_SPIV_APIC_ENABLED)) {
2044 int i;
2045 u32 lvt_val;
2046
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002047 for (i = 0; i < KVM_APIC_LVT_NUM; i++) {
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05002048 lvt_val = kvm_lapic_get_reg(apic,
Eddie Dong97222cc2007-09-12 10:58:04 +03002049 APIC_LVTT + 0x10 * i);
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002050 kvm_lapic_set_reg(apic, APIC_LVTT + 0x10 * i,
Eddie Dong97222cc2007-09-12 10:58:04 +03002051 lvt_val | APIC_LVT_MASKED);
2052 }
Radim Krčmářb6ac0692015-06-05 20:57:41 +02002053 apic_update_lvtt(apic);
Marcelo Tosattid3c7b772009-02-23 10:57:41 -03002054 atomic_set(&apic->lapic_timer.pending, 0);
Eddie Dong97222cc2007-09-12 10:58:04 +03002055
2056 }
2057 break;
Gleb Natapovfc61b802009-07-05 17:39:35 +03002058 }
Eddie Dong97222cc2007-09-12 10:58:04 +03002059 case APIC_ICR:
2060 /* No delay here, so we always clear the pending bit */
Wanpeng Li2b0911d2019-09-05 14:26:27 +08002061 val &= ~(1 << 12);
Wanpeng Lid5361672020-03-26 10:20:02 +08002062 kvm_apic_send_ipi(apic, val, kvm_lapic_get_reg(apic, APIC_ICR2));
Wanpeng Li2b0911d2019-09-05 14:26:27 +08002063 kvm_lapic_set_reg(apic, APIC_ICR, val);
Eddie Dong97222cc2007-09-12 10:58:04 +03002064 break;
2065
2066 case APIC_ICR2:
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002067 if (!apic_x2apic_mode(apic))
2068 val &= 0xff000000;
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002069 kvm_lapic_set_reg(apic, APIC_ICR2, val);
Eddie Dong97222cc2007-09-12 10:58:04 +03002070 break;
2071
Jan Kiszka23930f92008-09-26 09:30:52 +02002072 case APIC_LVT0:
Jan Kiszkacc6e4622008-10-20 10:20:03 +02002073 apic_manage_nmi_watchdog(apic, val);
Gustavo A. R. Silvadf561f662020-08-23 17:36:59 -05002074 fallthrough;
Eddie Dong97222cc2007-09-12 10:58:04 +03002075 case APIC_LVTTHMR:
2076 case APIC_LVTPC:
Eddie Dong97222cc2007-09-12 10:58:04 +03002077 case APIC_LVT1:
Marios Pomonis4bf79cb2019-12-11 12:47:46 -08002078 case APIC_LVTERR: {
Eddie Dong97222cc2007-09-12 10:58:04 +03002079 /* TODO: Check vector */
Marios Pomonis4bf79cb2019-12-11 12:47:46 -08002080 size_t size;
2081 u32 index;
2082
Gleb Natapovc48f1492012-08-05 15:58:33 +03002083 if (!kvm_apic_sw_enabled(apic))
Eddie Dong97222cc2007-09-12 10:58:04 +03002084 val |= APIC_LVT_MASKED;
Marios Pomonis4bf79cb2019-12-11 12:47:46 -08002085 size = ARRAY_SIZE(apic_lvt_mask);
2086 index = array_index_nospec(
2087 (reg - APIC_LVTT) >> 4, size);
2088 val &= apic_lvt_mask[index];
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002089 kvm_lapic_set_reg(apic, reg, val);
Eddie Dong97222cc2007-09-12 10:58:04 +03002090 break;
Marios Pomonis4bf79cb2019-12-11 12:47:46 -08002091 }
Eddie Dong97222cc2007-09-12 10:58:04 +03002092
Radim Krčmářb6ac0692015-06-05 20:57:41 +02002093 case APIC_LVTT:
Gleb Natapovc48f1492012-08-05 15:58:33 +03002094 if (!kvm_apic_sw_enabled(apic))
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +08002095 val |= APIC_LVT_MASKED;
2096 val &= (apic_lvt_mask[0] | apic->lapic_timer.timer_mode_mask);
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002097 kvm_lapic_set_reg(apic, APIC_LVTT, val);
Radim Krčmářb6ac0692015-06-05 20:57:41 +02002098 apic_update_lvtt(apic);
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +08002099 break;
2100
Eddie Dong97222cc2007-09-12 10:58:04 +03002101 case APIC_TMICT:
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +08002102 if (apic_lvtt_tscdeadline(apic))
2103 break;
2104
Wanpeng Lie898da72021-06-07 00:19:43 -07002105 cancel_apic_timer(apic);
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002106 kvm_lapic_set_reg(apic, APIC_TMICT, val);
Eddie Dong97222cc2007-09-12 10:58:04 +03002107 start_apic_timer(apic);
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002108 break;
Eddie Dong97222cc2007-09-12 10:58:04 +03002109
Wanpeng Lic301b902017-10-06 07:38:32 -07002110 case APIC_TDCR: {
2111 uint32_t old_divisor = apic->divide_count;
2112
Wanpeng Lia445fc42020-07-31 11:12:20 +08002113 kvm_lapic_set_reg(apic, APIC_TDCR, val & 0xb);
Eddie Dong97222cc2007-09-12 10:58:04 +03002114 update_divide_count(apic);
Wanpeng Lic301b902017-10-06 07:38:32 -07002115 if (apic->divide_count != old_divisor &&
2116 apic->lapic_timer.period) {
2117 hrtimer_cancel(&apic->lapic_timer.timer);
2118 update_target_expiration(apic, old_divisor);
2119 restart_apic_timer(apic);
2120 }
Eddie Dong97222cc2007-09-12 10:58:04 +03002121 break;
Wanpeng Lic301b902017-10-06 07:38:32 -07002122 }
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002123 case APIC_ESR:
Yi Wang0d888002019-07-06 01:08:48 +08002124 if (apic_x2apic_mode(apic) && val != 0)
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002125 ret = 1;
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002126 break;
2127
2128 case APIC_SELF_IPI:
2129 if (apic_x2apic_mode(apic)) {
Haiwei Li9c2475f2020-07-21 16:23:54 +08002130 kvm_lapic_reg_write(apic, APIC_ICR,
2131 APIC_DEST_SELF | (val & APIC_VECTOR_MASK));
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002132 } else
2133 ret = 1;
2134 break;
Eddie Dong97222cc2007-09-12 10:58:04 +03002135 default:
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002136 ret = 1;
Eddie Dong97222cc2007-09-12 10:58:04 +03002137 break;
2138 }
Yi Wang0d888002019-07-06 01:08:48 +08002139
Wanpeng Li4abaffc2020-02-26 10:41:02 +08002140 kvm_recalculate_apic_map(apic->vcpu->kvm);
2141
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002142 return ret;
2143}
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002144EXPORT_SYMBOL_GPL(kvm_lapic_reg_write);
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002145
Nikolay Nikolaeve32edf42015-03-26 14:39:28 +00002146static int apic_mmio_write(struct kvm_vcpu *vcpu, struct kvm_io_device *this,
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002147 gpa_t address, int len, const void *data)
2148{
2149 struct kvm_lapic *apic = to_lapic(this);
2150 unsigned int offset = address - apic->base_address;
2151 u32 val;
2152
2153 if (!apic_mmio_in_range(apic, address))
2154 return -EOPNOTSUPP;
2155
Vitaly Kuznetsovd1766202018-08-02 17:08:16 +02002156 if (!kvm_apic_hw_enabled(apic) || apic_x2apic_mode(apic)) {
2157 if (!kvm_check_has_quirk(vcpu->kvm,
2158 KVM_X86_QUIRK_LAPIC_MMIO_HOLE))
2159 return -EOPNOTSUPP;
2160
2161 return 0;
2162 }
2163
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002164 /*
2165 * APIC register must be aligned on 128-bits boundary.
2166 * 32/64/128 bits registers must be accessed thru 32 bits.
2167 * Refer SDM 8.4.1
2168 */
Yi Wang0d888002019-07-06 01:08:48 +08002169 if (len != 4 || (offset & 0xf))
Sheng Yang756975b2009-07-06 11:05:39 +08002170 return 0;
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002171
2172 val = *(u32*)data;
2173
Yi Wang0d888002019-07-06 01:08:48 +08002174 kvm_lapic_reg_write(apic, offset & 0xff0, val);
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002175
Michael S. Tsirkinbda90202009-06-29 22:24:32 +03002176 return 0;
Eddie Dong97222cc2007-09-12 10:58:04 +03002177}
2178
Kevin Tian58fbbf22011-08-30 13:56:17 +03002179void kvm_lapic_set_eoi(struct kvm_vcpu *vcpu)
2180{
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002181 kvm_lapic_reg_write(vcpu->arch.apic, APIC_EOI, 0);
Kevin Tian58fbbf22011-08-30 13:56:17 +03002182}
2183EXPORT_SYMBOL_GPL(kvm_lapic_set_eoi);
2184
Yang Zhang83d4c282013-01-25 10:18:49 +08002185/* emulate APIC access in a trap manner */
2186void kvm_apic_write_nodecode(struct kvm_vcpu *vcpu, u32 offset)
2187{
2188 u32 val = 0;
2189
2190 /* hw has done the conditional check and inst decode */
2191 offset &= 0xff0;
2192
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002193 kvm_lapic_reg_read(vcpu->arch.apic, offset, 4, &val);
Yang Zhang83d4c282013-01-25 10:18:49 +08002194
2195 /* TODO: optimize to just emulate side effect w/o one more write */
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002196 kvm_lapic_reg_write(vcpu->arch.apic, offset, val);
Yang Zhang83d4c282013-01-25 10:18:49 +08002197}
2198EXPORT_SYMBOL_GPL(kvm_apic_write_nodecode);
2199
Rusty Russelld5894442007-10-08 10:48:30 +10002200void kvm_free_lapic(struct kvm_vcpu *vcpu)
Eddie Dong97222cc2007-09-12 10:58:04 +03002201{
Gleb Natapovf8c1ea12012-08-05 15:58:31 +03002202 struct kvm_lapic *apic = vcpu->arch.apic;
2203
Zhang Xiantaoad312c72007-12-13 23:50:52 +08002204 if (!vcpu->arch.apic)
Eddie Dong97222cc2007-09-12 10:58:04 +03002205 return;
2206
Gleb Natapovf8c1ea12012-08-05 15:58:31 +03002207 hrtimer_cancel(&apic->lapic_timer.timer);
Eddie Dong97222cc2007-09-12 10:58:04 +03002208
Gleb Natapovc5cc4212012-08-05 15:58:30 +03002209 if (!(vcpu->arch.apic_base & MSR_IA32_APICBASE_ENABLE))
Cun Li6e4e3b42021-01-11 23:24:35 +08002210 static_branch_slow_dec_deferred(&apic_hw_disabled);
Gleb Natapovc5cc4212012-08-05 15:58:30 +03002211
Radim Krčmáře4627552014-10-30 15:06:45 +01002212 if (!apic->sw_enabled)
Cun Li6e4e3b42021-01-11 23:24:35 +08002213 static_branch_slow_dec_deferred(&apic_sw_disabled);
Eddie Dong97222cc2007-09-12 10:58:04 +03002214
Gleb Natapovf8c1ea12012-08-05 15:58:31 +03002215 if (apic->regs)
2216 free_page((unsigned long)apic->regs);
2217
2218 kfree(apic);
Eddie Dong97222cc2007-09-12 10:58:04 +03002219}
2220
2221/*
2222 *----------------------------------------------------------------------
2223 * LAPIC interface
2224 *----------------------------------------------------------------------
2225 */
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +08002226u64 kvm_get_lapic_tscdeadline_msr(struct kvm_vcpu *vcpu)
2227{
2228 struct kvm_lapic *apic = vcpu->arch.apic;
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +08002229
Wanpeng Lia970e9b2020-09-10 17:50:36 +08002230 if (!kvm_apic_present(vcpu) || !apic_lvtt_tscdeadline(apic))
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +08002231 return 0;
2232
2233 return apic->lapic_timer.tscdeadline;
2234}
2235
2236void kvm_set_lapic_tscdeadline_msr(struct kvm_vcpu *vcpu, u64 data)
2237{
2238 struct kvm_lapic *apic = vcpu->arch.apic;
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +08002239
Wanpeng Li27503832020-09-10 17:50:37 +08002240 if (!kvm_apic_present(vcpu) || !apic_lvtt_tscdeadline(apic))
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +08002241 return;
2242
2243 hrtimer_cancel(&apic->lapic_timer.timer);
2244 apic->lapic_timer.tscdeadline = data;
2245 start_apic_timer(apic);
2246}
2247
Eddie Dong97222cc2007-09-12 10:58:04 +03002248void kvm_lapic_set_tpr(struct kvm_vcpu *vcpu, unsigned long cr8)
2249{
Zhang Xiantaoad312c72007-12-13 23:50:52 +08002250 struct kvm_lapic *apic = vcpu->arch.apic;
Eddie Dong97222cc2007-09-12 10:58:04 +03002251
Avi Kivityb93463a2007-10-25 16:52:32 +02002252 apic_set_tpr(apic, ((cr8 & 0x0f) << 4)
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05002253 | (kvm_lapic_get_reg(apic, APIC_TASKPRI) & 4));
Eddie Dong97222cc2007-09-12 10:58:04 +03002254}
2255
2256u64 kvm_lapic_get_cr8(struct kvm_vcpu *vcpu)
2257{
Eddie Dong97222cc2007-09-12 10:58:04 +03002258 u64 tpr;
2259
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05002260 tpr = (u64) kvm_lapic_get_reg(vcpu->arch.apic, APIC_TASKPRI);
Eddie Dong97222cc2007-09-12 10:58:04 +03002261
2262 return (tpr & 0xf0) >> 4;
2263}
2264
2265void kvm_lapic_set_base(struct kvm_vcpu *vcpu, u64 value)
2266{
Yang Zhang8d146952013-01-25 10:18:50 +08002267 u64 old_value = vcpu->arch.apic_base;
Zhang Xiantaoad312c72007-12-13 23:50:52 +08002268 struct kvm_lapic *apic = vcpu->arch.apic;
Eddie Dong97222cc2007-09-12 10:58:04 +03002269
Jan Kiszkae66d2ae2013-12-29 02:29:30 +01002270 vcpu->arch.apic_base = value;
2271
Jim Mattsonc7dd15b2016-11-09 09:50:11 -08002272 if ((old_value ^ value) & MSR_IA32_APICBASE_ENABLE)
Xiaoyao Liaedbaf42020-07-09 12:34:23 +08002273 kvm_update_cpuid_runtime(vcpu);
Jim Mattsonc7dd15b2016-11-09 09:50:11 -08002274
2275 if (!apic)
2276 return;
2277
Gleb Natapovc5cc4212012-08-05 15:58:30 +03002278 /* update jump label if enable bit changes */
Andrew Jones0dce7cd2014-01-15 13:39:59 +01002279 if ((old_value ^ value) & MSR_IA32_APICBASE_ENABLE) {
Radim Krčmář49bd29b2016-07-12 22:09:23 +02002280 if (value & MSR_IA32_APICBASE_ENABLE) {
2281 kvm_apic_set_xapic_id(apic, vcpu->vcpu_id);
Cun Li6e4e3b42021-01-11 23:24:35 +08002282 static_branch_slow_dec_deferred(&apic_hw_disabled);
Vitaly Kuznetsov2f15d022021-04-22 11:29:48 +02002283 /* Check if there are APF page ready requests pending */
2284 kvm_make_request(KVM_REQ_APF_READY, vcpu);
Wanpeng Li187ca842016-08-03 12:04:13 +08002285 } else {
Cun Li6e4e3b42021-01-11 23:24:35 +08002286 static_branch_inc(&apic_hw_disabled.key);
Paolo Bonzini44d52712020-06-22 16:37:42 +02002287 atomic_set_release(&apic->vcpu->kvm->arch.apic_map_dirty, DIRTY);
Wanpeng Li187ca842016-08-03 12:04:13 +08002288 }
Gleb Natapovc5cc4212012-08-05 15:58:30 +03002289 }
2290
Jim Mattson8d860bb2018-05-09 16:56:05 -04002291 if (((old_value ^ value) & X2APIC_ENABLE) && (value & X2APIC_ENABLE))
2292 kvm_apic_set_x2apic_id(apic, vcpu->vcpu_id);
2293
2294 if ((old_value ^ value) & (MSR_IA32_APICBASE_ENABLE | X2APIC_ENABLE))
Jason Baronb36464772021-01-14 22:27:56 -05002295 static_call(kvm_x86_set_virtual_apic_mode)(vcpu);
Yang Zhang8d146952013-01-25 10:18:50 +08002296
Zhang Xiantaoad312c72007-12-13 23:50:52 +08002297 apic->base_address = apic->vcpu->arch.apic_base &
Eddie Dong97222cc2007-09-12 10:58:04 +03002298 MSR_IA32_APICBASE_BASE;
2299
Nadav Amitdb324fe2014-11-02 11:54:59 +02002300 if ((value & MSR_IA32_APICBASE_ENABLE) &&
2301 apic->base_address != APIC_DEFAULT_PHYS_BASE)
2302 pr_warn_once("APIC base relocation is unsupported by KVM");
Eddie Dong97222cc2007-09-12 10:58:04 +03002303}
2304
Suravee Suthikulpanitb26a6952019-11-14 14:15:04 -06002305void kvm_apic_update_apicv(struct kvm_vcpu *vcpu)
2306{
2307 struct kvm_lapic *apic = vcpu->arch.apic;
2308
2309 if (vcpu->arch.apicv_active) {
2310 /* irr_pending is always true when apicv is activated. */
2311 apic->irr_pending = true;
2312 apic->isr_count = 1;
2313 } else {
2314 apic->irr_pending = (apic_search_irr(apic) != -1);
2315 apic->isr_count = count_vectors(apic->regs + APIC_ISR);
2316 }
2317}
2318EXPORT_SYMBOL_GPL(kvm_apic_update_apicv);
2319
Nadav Amitd28bc9d2015-04-13 14:34:08 +03002320void kvm_lapic_reset(struct kvm_vcpu *vcpu, bool init_event)
Eddie Dong97222cc2007-09-12 10:58:04 +03002321{
Radim Krčmářb7e31be2018-03-01 15:24:25 +01002322 struct kvm_lapic *apic = vcpu->arch.apic;
Sean Christophersonf7d8a192021-10-12 17:35:53 -07002323 u64 msr_val;
Eddie Dong97222cc2007-09-12 10:58:04 +03002324 int i;
2325
Sean Christopherson45477002021-07-13 09:32:56 -07002326 if (!init_event) {
Sean Christophersonf7d8a192021-10-12 17:35:53 -07002327 msr_val = APIC_DEFAULT_PHYS_BASE | MSR_IA32_APICBASE_ENABLE;
Sean Christopherson45477002021-07-13 09:32:56 -07002328 if (kvm_vcpu_is_reset_bsp(vcpu))
Sean Christophersonf7d8a192021-10-12 17:35:53 -07002329 msr_val |= MSR_IA32_APICBASE_BSP;
2330 kvm_lapic_set_base(vcpu, msr_val);
Sean Christopherson45477002021-07-13 09:32:56 -07002331 }
2332
Radim Krčmářb7e31be2018-03-01 15:24:25 +01002333 if (!apic)
2334 return;
Eddie Dong97222cc2007-09-12 10:58:04 +03002335
Eddie Dong97222cc2007-09-12 10:58:04 +03002336 /* Stop the timer in case it's a reset to an active apic */
Marcelo Tosattid3c7b772009-02-23 10:57:41 -03002337 hrtimer_cancel(&apic->lapic_timer.timer);
Eddie Dong97222cc2007-09-12 10:58:04 +03002338
Sean Christophersonf7d8a192021-10-12 17:35:53 -07002339 /* The xAPIC ID is set at RESET even if the APIC was already enabled. */
2340 if (!init_event)
Radim Krčmářa92e2542016-07-12 22:09:22 +02002341 kvm_apic_set_xapic_id(apic, vcpu->vcpu_id);
Gleb Natapovfc61b802009-07-05 17:39:35 +03002342 kvm_apic_set_version(apic->vcpu);
Eddie Dong97222cc2007-09-12 10:58:04 +03002343
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002344 for (i = 0; i < KVM_APIC_LVT_NUM; i++)
2345 kvm_lapic_set_reg(apic, APIC_LVTT + 0x10 * i, APIC_LVT_MASKED);
Radim Krčmářb6ac0692015-06-05 20:57:41 +02002346 apic_update_lvtt(apic);
Jan H. Schönherr52b54192017-05-20 13:24:32 +02002347 if (kvm_vcpu_is_reset_bsp(vcpu) &&
2348 kvm_check_has_quirk(vcpu->kvm, KVM_X86_QUIRK_LINT0_REENABLED))
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002349 kvm_lapic_set_reg(apic, APIC_LVT0,
Nadav Amit90de4a12015-04-13 01:53:41 +03002350 SET_APIC_DELIVERY_MODE(0, APIC_MODE_EXTINT));
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05002351 apic_manage_nmi_watchdog(apic, kvm_lapic_get_reg(apic, APIC_LVT0));
Eddie Dong97222cc2007-09-12 10:58:04 +03002352
Wanpeng Liae6f2492020-08-19 16:55:26 +08002353 kvm_apic_set_dfr(apic, 0xffffffffU);
Gleb Natapovf8c1ea12012-08-05 15:58:31 +03002354 apic_set_spiv(apic, 0xff);
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002355 kvm_lapic_set_reg(apic, APIC_TASKPRI, 0);
Radim Krčmářc028dd62015-05-22 19:22:10 +02002356 if (!apic_x2apic_mode(apic))
2357 kvm_apic_set_ldr(apic, 0);
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002358 kvm_lapic_set_reg(apic, APIC_ESR, 0);
2359 kvm_lapic_set_reg(apic, APIC_ICR, 0);
2360 kvm_lapic_set_reg(apic, APIC_ICR2, 0);
2361 kvm_lapic_set_reg(apic, APIC_TDCR, 0);
2362 kvm_lapic_set_reg(apic, APIC_TMICT, 0);
Eddie Dong97222cc2007-09-12 10:58:04 +03002363 for (i = 0; i < 8; i++) {
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002364 kvm_lapic_set_reg(apic, APIC_IRR + 0x10 * i, 0);
2365 kvm_lapic_set_reg(apic, APIC_ISR + 0x10 * i, 0);
2366 kvm_lapic_set_reg(apic, APIC_TMR + 0x10 * i, 0);
Eddie Dong97222cc2007-09-12 10:58:04 +03002367 }
Suravee Suthikulpanitb26a6952019-11-14 14:15:04 -06002368 kvm_apic_update_apicv(vcpu);
Michael S. Tsirkin8680b942012-06-24 19:24:26 +03002369 apic->highest_isr_cache = -1;
Kevin Pedrettib33ac882007-10-21 08:54:53 +02002370 update_divide_count(apic);
Marcelo Tosattid3c7b772009-02-23 10:57:41 -03002371 atomic_set(&apic->lapic_timer.pending, 0);
Sean Christopherson549240e2021-07-13 09:32:50 -07002372
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002373 vcpu->arch.pv_eoi.msr_val = 0;
Eddie Dong97222cc2007-09-12 10:58:04 +03002374 apic_update_ppr(apic);
Jan H. Schönherr4191db22017-10-25 16:43:27 +02002375 if (vcpu->arch.apicv_active) {
Jason Baronb36464772021-01-14 22:27:56 -05002376 static_call(kvm_x86_apicv_post_state_restore)(vcpu);
2377 static_call(kvm_x86_hwapic_irr_update)(vcpu, -1);
2378 static_call(kvm_x86_hwapic_isr_update)(vcpu, -1);
Jan H. Schönherr4191db22017-10-25 16:43:27 +02002379 }
Eddie Dong97222cc2007-09-12 10:58:04 +03002380
Gleb Natapove1035712009-03-05 16:34:59 +02002381 vcpu->arch.apic_arb_prio = 0;
Gleb Natapov41383772012-04-19 14:06:29 +03002382 vcpu->arch.apic_attention = 0;
Wanpeng Li4abaffc2020-02-26 10:41:02 +08002383
2384 kvm_recalculate_apic_map(vcpu->kvm);
Eddie Dong97222cc2007-09-12 10:58:04 +03002385}
2386
Eddie Dong97222cc2007-09-12 10:58:04 +03002387/*
2388 *----------------------------------------------------------------------
2389 * timer interface
2390 *----------------------------------------------------------------------
2391 */
Eddie Dong1b9778d2007-09-03 16:56:58 +03002392
Avi Kivity2a6eac92012-07-26 18:01:51 +03002393static bool lapic_is_periodic(struct kvm_lapic *apic)
Eddie Dong97222cc2007-09-12 10:58:04 +03002394{
Marcelo Tosattid3c7b772009-02-23 10:57:41 -03002395 return apic_lvtt_period(apic);
Eddie Dong97222cc2007-09-12 10:58:04 +03002396}
2397
Marcelo Tosatti3d808402008-04-11 14:53:26 -03002398int apic_has_pending_timer(struct kvm_vcpu *vcpu)
2399{
Gleb Natapov54e98182012-08-05 15:58:32 +03002400 struct kvm_lapic *apic = vcpu->arch.apic;
Marcelo Tosatti3d808402008-04-11 14:53:26 -03002401
Paolo Bonzini1e3161b42016-01-08 13:41:16 +01002402 if (apic_enabled(apic) && apic_lvt_enabled(apic, APIC_LVTT))
Gleb Natapov54e98182012-08-05 15:58:32 +03002403 return atomic_read(&apic->lapic_timer.pending);
Marcelo Tosatti3d808402008-04-11 14:53:26 -03002404
2405 return 0;
2406}
2407
Avi Kivity89342082011-11-10 14:57:21 +02002408int kvm_apic_local_deliver(struct kvm_lapic *apic, int lvt_type)
Eddie Dong1b9778d2007-09-03 16:56:58 +03002409{
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05002410 u32 reg = kvm_lapic_get_reg(apic, lvt_type);
Jan Kiszka23930f92008-09-26 09:30:52 +02002411 int vector, mode, trig_mode;
Eddie Dong1b9778d2007-09-03 16:56:58 +03002412
Gleb Natapovc48f1492012-08-05 15:58:33 +03002413 if (kvm_apic_hw_enabled(apic) && !(reg & APIC_LVT_MASKED)) {
Jan Kiszka23930f92008-09-26 09:30:52 +02002414 vector = reg & APIC_VECTOR_MASK;
2415 mode = reg & APIC_MODE_MASK;
2416 trig_mode = reg & APIC_LVT_LEVEL_TRIGGER;
Yang Zhangb4f22252013-04-11 19:21:37 +08002417 return __apic_accept_irq(apic, mode, vector, 1, trig_mode,
2418 NULL);
Jan Kiszka23930f92008-09-26 09:30:52 +02002419 }
2420 return 0;
2421}
2422
Jan Kiszka8fdb2352008-10-20 10:20:02 +02002423void kvm_apic_nmi_wd_deliver(struct kvm_vcpu *vcpu)
Jan Kiszka23930f92008-09-26 09:30:52 +02002424{
Jan Kiszka8fdb2352008-10-20 10:20:02 +02002425 struct kvm_lapic *apic = vcpu->arch.apic;
2426
2427 if (apic)
2428 kvm_apic_local_deliver(apic, APIC_LVT0);
Eddie Dong1b9778d2007-09-03 16:56:58 +03002429}
2430
Gregory Haskinsd76685c42009-06-01 12:54:50 -04002431static const struct kvm_io_device_ops apic_mmio_ops = {
2432 .read = apic_mmio_read,
2433 .write = apic_mmio_write,
Gregory Haskinsd76685c42009-06-01 12:54:50 -04002434};
2435
Avi Kivitye9d90d42012-07-26 18:01:50 +03002436static enum hrtimer_restart apic_timer_fn(struct hrtimer *data)
2437{
2438 struct kvm_timer *ktimer = container_of(data, struct kvm_timer, timer);
Avi Kivity2a6eac92012-07-26 18:01:51 +03002439 struct kvm_lapic *apic = container_of(ktimer, struct kvm_lapic, lapic_timer);
Avi Kivitye9d90d42012-07-26 18:01:50 +03002440
Wanpeng Liae95f562020-04-28 14:23:28 +08002441 apic_timer_expired(apic, true);
Avi Kivitye9d90d42012-07-26 18:01:50 +03002442
Avi Kivity2a6eac92012-07-26 18:01:51 +03002443 if (lapic_is_periodic(apic)) {
Wanpeng Li8003c9a2016-10-24 18:23:13 +08002444 advance_periodic_target_expiration(apic);
Avi Kivitye9d90d42012-07-26 18:01:50 +03002445 hrtimer_add_expires_ns(&ktimer->timer, ktimer->period);
2446 return HRTIMER_RESTART;
2447 } else
2448 return HRTIMER_NORESTART;
2449}
2450
Sean Christophersonc3941d92019-04-17 10:15:33 -07002451int kvm_create_lapic(struct kvm_vcpu *vcpu, int timer_advance_ns)
Eddie Dong97222cc2007-09-12 10:58:04 +03002452{
2453 struct kvm_lapic *apic;
2454
2455 ASSERT(vcpu != NULL);
Eddie Dong97222cc2007-09-12 10:58:04 +03002456
Ben Gardon254272c2019-02-11 11:02:50 -08002457 apic = kzalloc(sizeof(*apic), GFP_KERNEL_ACCOUNT);
Eddie Dong97222cc2007-09-12 10:58:04 +03002458 if (!apic)
2459 goto nomem;
2460
Zhang Xiantaoad312c72007-12-13 23:50:52 +08002461 vcpu->arch.apic = apic;
Eddie Dong97222cc2007-09-12 10:58:04 +03002462
Ben Gardon254272c2019-02-11 11:02:50 -08002463 apic->regs = (void *)get_zeroed_page(GFP_KERNEL_ACCOUNT);
Takuya Yoshikawaafc20182011-03-05 12:40:20 +09002464 if (!apic->regs) {
Eddie Dong97222cc2007-09-12 10:58:04 +03002465 printk(KERN_ERR "malloc apic regs error for vcpu %x\n",
2466 vcpu->vcpu_id);
Rusty Russelld5894442007-10-08 10:48:30 +10002467 goto nomem_free_apic;
Eddie Dong97222cc2007-09-12 10:58:04 +03002468 }
Eddie Dong97222cc2007-09-12 10:58:04 +03002469 apic->vcpu = vcpu;
2470
Marcelo Tosattid3c7b772009-02-23 10:57:41 -03002471 hrtimer_init(&apic->lapic_timer.timer, CLOCK_MONOTONIC,
Sebastian Andrzej Siewior2c0d2782019-07-26 20:30:55 +02002472 HRTIMER_MODE_ABS_HARD);
Avi Kivitye9d90d42012-07-26 18:01:50 +03002473 apic->lapic_timer.timer.function = apic_timer_fn;
Sean Christophersonc3941d92019-04-17 10:15:33 -07002474 if (timer_advance_ns == -1) {
Wanpeng Lia0f00372019-09-26 08:54:03 +08002475 apic->lapic_timer.timer_advance_ns = LAPIC_TIMER_ADVANCE_NS_INIT;
Wanpeng Lid0f5a862019-09-17 16:16:26 +08002476 lapic_timer_advance_dynamic = true;
Sean Christophersonc3941d92019-04-17 10:15:33 -07002477 } else {
2478 apic->lapic_timer.timer_advance_ns = timer_advance_ns;
Wanpeng Lid0f5a862019-09-17 16:16:26 +08002479 lapic_timer_advance_dynamic = false;
Sean Christophersonc3941d92019-04-17 10:15:33 -07002480 }
2481
Sean Christophersonf7d8a192021-10-12 17:35:53 -07002482 /*
2483 * Stuff the APIC ENABLE bit in lieu of temporarily incrementing
2484 * apic_hw_disabled; the full RESET value is set by kvm_lapic_reset().
2485 */
2486 vcpu->arch.apic_base = MSR_IA32_APICBASE_ENABLE;
Cun Li6e4e3b42021-01-11 23:24:35 +08002487 static_branch_inc(&apic_sw_disabled.key); /* sw disabled at reset */
Gregory Haskinsd76685c42009-06-01 12:54:50 -04002488 kvm_iodevice_init(&apic->dev, &apic_mmio_ops);
Eddie Dong97222cc2007-09-12 10:58:04 +03002489
2490 return 0;
Rusty Russelld5894442007-10-08 10:48:30 +10002491nomem_free_apic:
2492 kfree(apic);
Saar Amara251fb902019-05-06 11:29:16 +03002493 vcpu->arch.apic = NULL;
Eddie Dong97222cc2007-09-12 10:58:04 +03002494nomem:
Eddie Dong97222cc2007-09-12 10:58:04 +03002495 return -ENOMEM;
2496}
Eddie Dong97222cc2007-09-12 10:58:04 +03002497
2498int kvm_apic_has_interrupt(struct kvm_vcpu *vcpu)
2499{
Zhang Xiantaoad312c72007-12-13 23:50:52 +08002500 struct kvm_lapic *apic = vcpu->arch.apic;
Paolo Bonzinib3c045d2016-12-18 21:47:54 +01002501 u32 ppr;
Eddie Dong97222cc2007-09-12 10:58:04 +03002502
Paolo Bonzini72c3bcd2020-11-27 08:53:52 +01002503 if (!kvm_apic_present(vcpu))
Eddie Dong97222cc2007-09-12 10:58:04 +03002504 return -1;
2505
Paolo Bonzinib3c045d2016-12-18 21:47:54 +01002506 __apic_update_ppr(apic, &ppr);
2507 return apic_has_interrupt_for_ppr(apic, ppr);
Eddie Dong97222cc2007-09-12 10:58:04 +03002508}
Sean Christopherson25bb2cf2020-08-12 10:51:29 -07002509EXPORT_SYMBOL_GPL(kvm_apic_has_interrupt);
Eddie Dong97222cc2007-09-12 10:58:04 +03002510
Qing He40487c62007-09-17 14:47:13 +08002511int kvm_apic_accept_pic_intr(struct kvm_vcpu *vcpu)
2512{
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05002513 u32 lvt0 = kvm_lapic_get_reg(vcpu->arch.apic, APIC_LVT0);
Qing He40487c62007-09-17 14:47:13 +08002514
Gleb Natapovc48f1492012-08-05 15:58:33 +03002515 if (!kvm_apic_hw_enabled(vcpu->arch.apic))
Miaohe Lin3ce4dc12020-01-18 10:50:37 +08002516 return 1;
Chris Lalancettee7dca5c2010-06-16 17:11:12 -04002517 if ((lvt0 & APIC_LVT_MASKED) == 0 &&
2518 GET_APIC_DELIVERY_MODE(lvt0) == APIC_MODE_EXTINT)
Miaohe Lin3ce4dc12020-01-18 10:50:37 +08002519 return 1;
2520 return 0;
Qing He40487c62007-09-17 14:47:13 +08002521}
2522
Eddie Dong1b9778d2007-09-03 16:56:58 +03002523void kvm_inject_apic_timer_irqs(struct kvm_vcpu *vcpu)
2524{
Zhang Xiantaoad312c72007-12-13 23:50:52 +08002525 struct kvm_lapic *apic = vcpu->arch.apic;
Eddie Dong1b9778d2007-09-03 16:56:58 +03002526
Gleb Natapov54e98182012-08-05 15:58:32 +03002527 if (atomic_read(&apic->lapic_timer.pending) > 0) {
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08002528 kvm_apic_inject_pending_timer_irqs(apic);
Jan Kiszkaf1ed0452013-04-28 14:00:41 +02002529 atomic_set(&apic->lapic_timer.pending, 0);
Eddie Dong1b9778d2007-09-03 16:56:58 +03002530 }
2531}
2532
Eddie Dong97222cc2007-09-12 10:58:04 +03002533int kvm_get_apic_interrupt(struct kvm_vcpu *vcpu)
2534{
2535 int vector = kvm_apic_has_interrupt(vcpu);
Zhang Xiantaoad312c72007-12-13 23:50:52 +08002536 struct kvm_lapic *apic = vcpu->arch.apic;
Paolo Bonzini4d82d122016-12-18 21:43:41 +01002537 u32 ppr;
Eddie Dong97222cc2007-09-12 10:58:04 +03002538
2539 if (vector == -1)
2540 return -1;
2541
Wanpeng Li56cc2402014-08-05 12:42:24 +08002542 /*
2543 * We get here even with APIC virtualization enabled, if doing
2544 * nested virtualization and L1 runs with the "acknowledge interrupt
2545 * on exit" mode. Then we cannot inject the interrupt via RVI,
2546 * because the process would deliver it through the IDT.
2547 */
2548
Eddie Dong97222cc2007-09-12 10:58:04 +03002549 apic_clear_irr(vector, apic);
Vitaly Kuznetsovf2bc14b2021-01-26 14:48:12 +01002550 if (to_hv_vcpu(vcpu) && test_bit(vector, to_hv_synic(vcpu)->auto_eoi_bitmap)) {
Paolo Bonzini4d82d122016-12-18 21:43:41 +01002551 /*
2552 * For auto-EOI interrupts, there might be another pending
2553 * interrupt above PPR, so check whether to raise another
2554 * KVM_REQ_EVENT.
2555 */
Andrey Smetanin5c9194122015-11-10 15:36:34 +03002556 apic_update_ppr(apic);
Paolo Bonzini4d82d122016-12-18 21:43:41 +01002557 } else {
2558 /*
2559 * For normal interrupts, PPR has been raised and there cannot
2560 * be a higher-priority pending interrupt---except if there was
2561 * a concurrent interrupt injection, but that would have
2562 * triggered KVM_REQ_EVENT already.
2563 */
2564 apic_set_isr(vector, apic);
2565 __apic_update_ppr(apic, &ppr);
Andrey Smetanin5c9194122015-11-10 15:36:34 +03002566 }
2567
Eddie Dong97222cc2007-09-12 10:58:04 +03002568 return vector;
2569}
Eddie Dong96ad2cc2007-09-06 12:22:56 +03002570
Radim Krčmářa92e2542016-07-12 22:09:22 +02002571static int kvm_apic_state_fixup(struct kvm_vcpu *vcpu,
2572 struct kvm_lapic_state *s, bool set)
2573{
2574 if (apic_x2apic_mode(vcpu->arch.apic)) {
2575 u32 *id = (u32 *)(s->regs + APIC_ID);
Dr. David Alan Gilbert12806ba2017-11-17 11:52:50 +00002576 u32 *ldr = (u32 *)(s->regs + APIC_LDR);
Radim Krčmářa92e2542016-07-12 22:09:22 +02002577
Radim Krčmář371313132016-07-12 22:09:27 +02002578 if (vcpu->kvm->arch.x2apic_format) {
2579 if (*id != vcpu->vcpu_id)
2580 return -EINVAL;
2581 } else {
2582 if (set)
2583 *id >>= 24;
2584 else
2585 *id <<= 24;
2586 }
Dr. David Alan Gilbert12806ba2017-11-17 11:52:50 +00002587
2588 /* In x2APIC mode, the LDR is fixed and based on the id */
2589 if (set)
2590 *ldr = kvm_apic_calc_x2apic_ldr(*id);
Radim Krčmářa92e2542016-07-12 22:09:22 +02002591 }
2592
2593 return 0;
2594}
2595
2596int kvm_apic_get_state(struct kvm_vcpu *vcpu, struct kvm_lapic_state *s)
2597{
2598 memcpy(s->regs, vcpu->arch.apic->regs, sizeof(*s));
Peter Shier24647e02018-10-10 15:56:53 -07002599
2600 /*
2601 * Get calculated timer current count for remaining timer period (if
2602 * any) and store it in the returned register set.
2603 */
2604 __kvm_lapic_set_reg(s->regs, APIC_TMCCT,
2605 __apic_read(vcpu->arch.apic, APIC_TMCCT));
2606
Radim Krčmářa92e2542016-07-12 22:09:22 +02002607 return kvm_apic_state_fixup(vcpu, s, false);
2608}
2609
2610int kvm_apic_set_state(struct kvm_vcpu *vcpu, struct kvm_lapic_state *s)
Eddie Dong96ad2cc2007-09-06 12:22:56 +03002611{
Zhang Xiantaoad312c72007-12-13 23:50:52 +08002612 struct kvm_lapic *apic = vcpu->arch.apic;
Radim Krčmářa92e2542016-07-12 22:09:22 +02002613 int r;
2614
Gleb Natapov5dbc8f32012-08-05 15:58:27 +03002615 kvm_lapic_set_base(vcpu, vcpu->arch.apic_base);
Gleb Natapov64eb0622012-08-08 15:24:36 +03002616 /* set SPIV separately to get count of SW disabled APICs right */
2617 apic_set_spiv(apic, *((u32 *)(s->regs + APIC_SPIV)));
Radim Krčmářa92e2542016-07-12 22:09:22 +02002618
2619 r = kvm_apic_state_fixup(vcpu, s, true);
Wanpeng Li4abaffc2020-02-26 10:41:02 +08002620 if (r) {
2621 kvm_recalculate_apic_map(vcpu->kvm);
Radim Krčmářa92e2542016-07-12 22:09:22 +02002622 return r;
Wanpeng Li4abaffc2020-02-26 10:41:02 +08002623 }
Jordan Borgner0e96f312018-10-28 12:58:28 +00002624 memcpy(vcpu->arch.apic->regs, s->regs, sizeof(*s));
Radim Krčmářa92e2542016-07-12 22:09:22 +02002625
Paolo Bonzini44d52712020-06-22 16:37:42 +02002626 atomic_set_release(&apic->vcpu->kvm->arch.apic_map_dirty, DIRTY);
Wanpeng Li4abaffc2020-02-26 10:41:02 +08002627 kvm_recalculate_apic_map(vcpu->kvm);
Gleb Natapovfc61b802009-07-05 17:39:35 +03002628 kvm_apic_set_version(vcpu);
2629
Eddie Dong96ad2cc2007-09-06 12:22:56 +03002630 apic_update_ppr(apic);
Marcelo Tosattid3c7b772009-02-23 10:57:41 -03002631 hrtimer_cancel(&apic->lapic_timer.timer);
Wanpeng Li35737d22021-03-04 08:35:18 +08002632 apic->lapic_timer.expired_tscdeadline = 0;
Radim Krčmářb6ac0692015-06-05 20:57:41 +02002633 apic_update_lvtt(apic);
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05002634 apic_manage_nmi_watchdog(apic, kvm_lapic_get_reg(apic, APIC_LVT0));
Eddie Dong96ad2cc2007-09-06 12:22:56 +03002635 update_divide_count(apic);
Peter Shier24647e02018-10-10 15:56:53 -07002636 __start_apic_timer(apic, APIC_TMCCT);
Wanpeng Li27358862021-06-09 00:16:40 -07002637 kvm_lapic_set_reg(apic, APIC_TMCCT, 0);
Suravee Suthikulpanitb26a6952019-11-14 14:15:04 -06002638 kvm_apic_update_apicv(vcpu);
Michael S. Tsirkin8680b942012-06-24 19:24:26 +03002639 apic->highest_isr_cache = -1;
Andrey Smetanind62caab2015-11-10 15:36:33 +03002640 if (vcpu->arch.apicv_active) {
Jason Baronb36464772021-01-14 22:27:56 -05002641 static_call(kvm_x86_apicv_post_state_restore)(vcpu);
2642 static_call(kvm_x86_hwapic_irr_update)(vcpu,
Wei Wang4114c272014-11-05 10:53:43 +08002643 apic_find_highest_irr(apic));
Jason Baronb36464772021-01-14 22:27:56 -05002644 static_call(kvm_x86_hwapic_isr_update)(vcpu,
Tiejun Chenb4eef9b2014-12-22 10:32:57 +01002645 apic_find_highest_isr(apic));
Andrey Smetanind62caab2015-11-10 15:36:33 +03002646 }
Avi Kivity3842d132010-07-27 12:30:24 +03002647 kvm_make_request(KVM_REQ_EVENT, vcpu);
Steve Rutherford49df6392015-07-29 23:21:40 -07002648 if (ioapic_in_kernel(vcpu->kvm))
2649 kvm_rtc_eoi_tracking_restore_one(vcpu);
Radim Krčmář0669a512015-10-30 15:48:20 +01002650
2651 vcpu->arch.apic_arb_prio = 0;
Radim Krčmářa92e2542016-07-12 22:09:22 +02002652
2653 return 0;
Eddie Dong96ad2cc2007-09-06 12:22:56 +03002654}
Eddie Donga3d7f852007-09-03 16:15:12 +03002655
Avi Kivity2f52d582008-01-16 12:49:30 +02002656void __kvm_migrate_apic_timer(struct kvm_vcpu *vcpu)
Eddie Donga3d7f852007-09-03 16:15:12 +03002657{
Eddie Donga3d7f852007-09-03 16:15:12 +03002658 struct hrtimer *timer;
2659
Wanpeng Li0c5f81d2019-07-06 09:26:51 +08002660 if (!lapic_in_kernel(vcpu) ||
2661 kvm_can_post_timer_interrupt(vcpu))
Eddie Donga3d7f852007-09-03 16:15:12 +03002662 return;
2663
Gleb Natapov54e98182012-08-05 15:58:32 +03002664 timer = &vcpu->arch.apic->lapic_timer.timer;
Eddie Donga3d7f852007-09-03 16:15:12 +03002665 if (hrtimer_cancel(timer))
Sebastian Andrzej Siewior2c0d2782019-07-26 20:30:55 +02002666 hrtimer_start_expires(timer, HRTIMER_MODE_ABS_HARD);
Eddie Donga3d7f852007-09-03 16:15:12 +03002667}
Avi Kivityb93463a2007-10-25 16:52:32 +02002668
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002669/*
2670 * apic_sync_pv_eoi_from_guest - called on vmexit or cancel interrupt
2671 *
2672 * Detect whether guest triggered PV EOI since the
2673 * last entry. If yes, set EOI on guests's behalf.
2674 * Clear PV EOI in guest memory in any case.
2675 */
2676static void apic_sync_pv_eoi_from_guest(struct kvm_vcpu *vcpu,
2677 struct kvm_lapic *apic)
2678{
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002679 int vector;
2680 /*
2681 * PV EOI state is derived from KVM_APIC_PV_EOI_PENDING in host
2682 * and KVM_PV_EOI_ENABLED in guest memory as follows:
2683 *
2684 * KVM_APIC_PV_EOI_PENDING is unset:
2685 * -> host disabled PV EOI.
2686 * KVM_APIC_PV_EOI_PENDING is set, KVM_PV_EOI_ENABLED is set:
2687 * -> host enabled PV EOI, guest did not execute EOI yet.
2688 * KVM_APIC_PV_EOI_PENDING is set, KVM_PV_EOI_ENABLED is unset:
2689 * -> host enabled PV EOI, guest executed EOI.
2690 */
2691 BUG_ON(!pv_eoi_enabled(vcpu));
Li RongQing51b12092021-11-04 19:56:14 +08002692
2693 if (pv_eoi_test_and_clr_pending(vcpu))
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002694 return;
2695 vector = apic_set_eoi(apic);
2696 trace_kvm_pv_eoi(apic, vector);
2697}
2698
Avi Kivityb93463a2007-10-25 16:52:32 +02002699void kvm_lapic_sync_from_vapic(struct kvm_vcpu *vcpu)
2700{
2701 u32 data;
Avi Kivityb93463a2007-10-25 16:52:32 +02002702
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002703 if (test_bit(KVM_APIC_PV_EOI_PENDING, &vcpu->arch.apic_attention))
2704 apic_sync_pv_eoi_from_guest(vcpu, vcpu->arch.apic);
2705
Gleb Natapov41383772012-04-19 14:06:29 +03002706 if (!test_bit(KVM_APIC_CHECK_VAPIC, &vcpu->arch.apic_attention))
Avi Kivityb93463a2007-10-25 16:52:32 +02002707 return;
2708
Paolo Bonzini4e335d92017-05-02 16:20:18 +02002709 if (kvm_read_guest_cached(vcpu->kvm, &vcpu->arch.apic->vapic_cache, &data,
2710 sizeof(u32)))
Nicholas Krause603242a2015-08-05 10:44:40 -04002711 return;
Avi Kivityb93463a2007-10-25 16:52:32 +02002712
2713 apic_set_tpr(vcpu->arch.apic, data & 0xff);
2714}
2715
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002716/*
2717 * apic_sync_pv_eoi_to_guest - called before vmentry
2718 *
2719 * Detect whether it's safe to enable PV EOI and
2720 * if yes do so.
2721 */
2722static void apic_sync_pv_eoi_to_guest(struct kvm_vcpu *vcpu,
2723 struct kvm_lapic *apic)
2724{
2725 if (!pv_eoi_enabled(vcpu) ||
2726 /* IRR set or many bits in ISR: could be nested. */
2727 apic->irr_pending ||
2728 /* Cache not set: could be safe but we don't bother. */
2729 apic->highest_isr_cache == -1 ||
2730 /* Need EOI to update ioapic. */
Paolo Bonzini3bb345f2015-07-29 10:43:18 +02002731 kvm_ioapic_handles_vector(apic, apic->highest_isr_cache)) {
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002732 /*
2733 * PV EOI was disabled by apic_sync_pv_eoi_from_guest
2734 * so we need not do anything here.
2735 */
2736 return;
2737 }
2738
2739 pv_eoi_set_pending(apic->vcpu);
2740}
2741
Avi Kivityb93463a2007-10-25 16:52:32 +02002742void kvm_lapic_sync_to_vapic(struct kvm_vcpu *vcpu)
2743{
2744 u32 data, tpr;
2745 int max_irr, max_isr;
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002746 struct kvm_lapic *apic = vcpu->arch.apic;
Avi Kivityb93463a2007-10-25 16:52:32 +02002747
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002748 apic_sync_pv_eoi_to_guest(vcpu, apic);
2749
Gleb Natapov41383772012-04-19 14:06:29 +03002750 if (!test_bit(KVM_APIC_CHECK_VAPIC, &vcpu->arch.apic_attention))
Avi Kivityb93463a2007-10-25 16:52:32 +02002751 return;
2752
Suravee Suthikulpanitdfb95952016-05-04 14:09:41 -05002753 tpr = kvm_lapic_get_reg(apic, APIC_TASKPRI) & 0xff;
Avi Kivityb93463a2007-10-25 16:52:32 +02002754 max_irr = apic_find_highest_irr(apic);
2755 if (max_irr < 0)
2756 max_irr = 0;
2757 max_isr = apic_find_highest_isr(apic);
2758 if (max_isr < 0)
2759 max_isr = 0;
2760 data = (tpr & 0xff) | ((max_isr & 0xf0) << 8) | (max_irr << 24);
2761
Paolo Bonzini4e335d92017-05-02 16:20:18 +02002762 kvm_write_guest_cached(vcpu->kvm, &vcpu->arch.apic->vapic_cache, &data,
2763 sizeof(u32));
Avi Kivityb93463a2007-10-25 16:52:32 +02002764}
2765
Andy Honigfda4e2e2013-11-20 10:23:22 -08002766int kvm_lapic_set_vapic_addr(struct kvm_vcpu *vcpu, gpa_t vapic_addr)
Avi Kivityb93463a2007-10-25 16:52:32 +02002767{
Andy Honigfda4e2e2013-11-20 10:23:22 -08002768 if (vapic_addr) {
Paolo Bonzini4e335d92017-05-02 16:20:18 +02002769 if (kvm_gfn_to_hva_cache_init(vcpu->kvm,
Andy Honigfda4e2e2013-11-20 10:23:22 -08002770 &vcpu->arch.apic->vapic_cache,
2771 vapic_addr, sizeof(u32)))
2772 return -EINVAL;
Gleb Natapov41383772012-04-19 14:06:29 +03002773 __set_bit(KVM_APIC_CHECK_VAPIC, &vcpu->arch.apic_attention);
Andy Honigfda4e2e2013-11-20 10:23:22 -08002774 } else {
Gleb Natapov41383772012-04-19 14:06:29 +03002775 __clear_bit(KVM_APIC_CHECK_VAPIC, &vcpu->arch.apic_attention);
Andy Honigfda4e2e2013-11-20 10:23:22 -08002776 }
2777
2778 vcpu->arch.apic->vapic_addr = vapic_addr;
2779 return 0;
Avi Kivityb93463a2007-10-25 16:52:32 +02002780}
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002781
2782int kvm_x2apic_msr_write(struct kvm_vcpu *vcpu, u32 msr, u64 data)
2783{
2784 struct kvm_lapic *apic = vcpu->arch.apic;
2785 u32 reg = (msr - APIC_BASE_MSR) << 4;
2786
Paolo Bonzini35754c92015-07-29 12:05:37 +02002787 if (!lapic_in_kernel(vcpu) || !apic_x2apic_mode(apic))
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002788 return 1;
2789
Nadav Amitc69d3d92014-11-26 17:56:25 +02002790 if (reg == APIC_ICR2)
2791 return 1;
2792
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002793 /* if this is ICR write vector before command */
Radim Krčmářdecdc282014-11-26 17:07:05 +01002794 if (reg == APIC_ICR)
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002795 kvm_lapic_reg_write(apic, APIC_ICR2, (u32)(data >> 32));
2796 return kvm_lapic_reg_write(apic, reg, (u32)data);
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002797}
2798
2799int kvm_x2apic_msr_read(struct kvm_vcpu *vcpu, u32 msr, u64 *data)
2800{
2801 struct kvm_lapic *apic = vcpu->arch.apic;
2802 u32 reg = (msr - APIC_BASE_MSR) << 4, low, high = 0;
2803
Paolo Bonzini35754c92015-07-29 12:05:37 +02002804 if (!lapic_in_kernel(vcpu) || !apic_x2apic_mode(apic))
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002805 return 1;
2806
Yi Wang0d888002019-07-06 01:08:48 +08002807 if (reg == APIC_DFR || reg == APIC_ICR2)
Nadav Amitc69d3d92014-11-26 17:56:25 +02002808 return 1;
Nadav Amitc69d3d92014-11-26 17:56:25 +02002809
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002810 if (kvm_lapic_reg_read(apic, reg, 4, &low))
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002811 return 1;
Radim Krčmářdecdc282014-11-26 17:07:05 +01002812 if (reg == APIC_ICR)
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002813 kvm_lapic_reg_read(apic, APIC_ICR2, 4, &high);
Gleb Natapov0105d1a2009-07-05 17:39:36 +03002814
2815 *data = (((u64)high) << 32) | low;
2816
2817 return 0;
2818}
Gleb Natapov10388a02010-01-17 15:51:23 +02002819
2820int kvm_hv_vapic_msr_write(struct kvm_vcpu *vcpu, u32 reg, u64 data)
2821{
2822 struct kvm_lapic *apic = vcpu->arch.apic;
2823
Paolo Bonzinibce87cc2016-01-08 13:48:51 +01002824 if (!lapic_in_kernel(vcpu))
Gleb Natapov10388a02010-01-17 15:51:23 +02002825 return 1;
2826
2827 /* if this is ICR write vector before command */
2828 if (reg == APIC_ICR)
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002829 kvm_lapic_reg_write(apic, APIC_ICR2, (u32)(data >> 32));
2830 return kvm_lapic_reg_write(apic, reg, (u32)data);
Gleb Natapov10388a02010-01-17 15:51:23 +02002831}
2832
2833int kvm_hv_vapic_msr_read(struct kvm_vcpu *vcpu, u32 reg, u64 *data)
2834{
2835 struct kvm_lapic *apic = vcpu->arch.apic;
2836 u32 low, high = 0;
2837
Paolo Bonzinibce87cc2016-01-08 13:48:51 +01002838 if (!lapic_in_kernel(vcpu))
Gleb Natapov10388a02010-01-17 15:51:23 +02002839 return 1;
2840
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002841 if (kvm_lapic_reg_read(apic, reg, 4, &low))
Gleb Natapov10388a02010-01-17 15:51:23 +02002842 return 1;
2843 if (reg == APIC_ICR)
Suravee Suthikulpanit1e6e2752016-05-04 14:09:40 -05002844 kvm_lapic_reg_read(apic, APIC_ICR2, 4, &high);
Gleb Natapov10388a02010-01-17 15:51:23 +02002845
2846 *data = (((u64)high) << 32) | low;
2847
2848 return 0;
2849}
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002850
Vitaly Kuznetsov77c33232021-11-08 16:28:18 +01002851int kvm_lapic_set_pv_eoi(struct kvm_vcpu *vcpu, u64 data, unsigned long len)
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002852{
2853 u64 addr = data & ~KVM_MSR_ENABLED;
Vitaly Kuznetsova7c42bb2018-10-16 18:50:06 +02002854 struct gfn_to_hva_cache *ghc = &vcpu->arch.pv_eoi.data;
2855 unsigned long new_len;
Vitaly Kuznetsovafd67ee2021-11-08 16:28:19 +01002856 int ret;
Vitaly Kuznetsova7c42bb2018-10-16 18:50:06 +02002857
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002858 if (!IS_ALIGNED(addr, 4))
2859 return 1;
2860
Vitaly Kuznetsovafd67ee2021-11-08 16:28:19 +01002861 if (data & KVM_MSR_ENABLED) {
2862 if (addr == ghc->gpa && len <= ghc->len)
2863 new_len = ghc->len;
2864 else
2865 new_len = len;
2866
2867 ret = kvm_gfn_to_hva_cache_init(vcpu->kvm, ghc, addr, new_len);
2868 if (ret)
2869 return ret;
2870 }
2871
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002872 vcpu->arch.pv_eoi.msr_val = data;
Vitaly Kuznetsova7c42bb2018-10-16 18:50:06 +02002873
Vitaly Kuznetsovafd67ee2021-11-08 16:28:19 +01002874 return 0;
Michael S. Tsirkinae7a2a32012-06-24 19:25:07 +03002875}
Gleb Natapovc5cc4212012-08-05 15:58:30 +03002876
Jim Mattson4fe09bc2021-06-04 10:26:04 -07002877int kvm_apic_accept_events(struct kvm_vcpu *vcpu)
Jan Kiszka66450a22013-03-13 12:42:34 +01002878{
2879 struct kvm_lapic *apic = vcpu->arch.apic;
Paolo Bonzini2b4a2732014-11-24 14:35:24 +01002880 u8 sipi_vector;
Paolo Bonzini1c96dcc2020-11-05 11:20:49 -05002881 int r;
Gleb Natapov299018f2013-06-03 11:30:02 +03002882 unsigned long pe;
Jan Kiszka66450a22013-03-13 12:42:34 +01002883
Paolo Bonzini1c96dcc2020-11-05 11:20:49 -05002884 if (!lapic_in_kernel(vcpu))
Jim Mattson4fe09bc2021-06-04 10:26:04 -07002885 return 0;
Jan Kiszka66450a22013-03-13 12:42:34 +01002886
Paolo Bonzinicd7764f2015-06-04 10:41:21 +02002887 /*
Paolo Bonzini1c96dcc2020-11-05 11:20:49 -05002888 * Read pending events before calling the check_events
2889 * callback.
2890 */
2891 pe = smp_load_acquire(&apic->pending_events);
2892 if (!pe)
Jim Mattson4fe09bc2021-06-04 10:26:04 -07002893 return 0;
Paolo Bonzini1c96dcc2020-11-05 11:20:49 -05002894
2895 if (is_guest_mode(vcpu)) {
Sean Christophersoncb6a32c2021-03-02 09:45:14 -08002896 r = kvm_check_nested_events(vcpu);
Paolo Bonzini1c96dcc2020-11-05 11:20:49 -05002897 if (r < 0)
Jim Mattson4fe09bc2021-06-04 10:26:04 -07002898 return r == -EBUSY ? 0 : r;
Paolo Bonzini1c96dcc2020-11-05 11:20:49 -05002899 /*
2900 * If an event has happened and caused a vmexit,
2901 * we know INITs are latched and therefore
2902 * we will not incorrectly deliver an APIC
2903 * event instead of a vmexit.
2904 */
2905 }
2906
2907 /*
Liran Alon4b9852f2019-08-26 13:24:49 +03002908 * INITs are latched while CPU is in specific states
Paolo Bonzini1c96dcc2020-11-05 11:20:49 -05002909 * (SMM, VMX root mode, SVM with GIF=0).
Liran Alon4b9852f2019-08-26 13:24:49 +03002910 * Because a CPU cannot be in these states immediately
2911 * after it has processed an INIT signal (and thus in
2912 * KVM_MP_STATE_INIT_RECEIVED state), just eat SIPIs
2913 * and leave the INIT pending.
Paolo Bonzinicd7764f2015-06-04 10:41:21 +02002914 */
Liran Alon27cbe7d2019-11-11 11:16:40 +02002915 if (kvm_vcpu_latch_init(vcpu)) {
Paolo Bonzinicd7764f2015-06-04 10:41:21 +02002916 WARN_ON_ONCE(vcpu->arch.mp_state == KVM_MP_STATE_INIT_RECEIVED);
Paolo Bonzini1c96dcc2020-11-05 11:20:49 -05002917 if (test_bit(KVM_APIC_SIPI, &pe))
Paolo Bonzinicd7764f2015-06-04 10:41:21 +02002918 clear_bit(KVM_APIC_SIPI, &apic->pending_events);
Jim Mattson4fe09bc2021-06-04 10:26:04 -07002919 return 0;
Paolo Bonzinicd7764f2015-06-04 10:41:21 +02002920 }
Gleb Natapov299018f2013-06-03 11:30:02 +03002921
2922 if (test_bit(KVM_APIC_INIT, &pe)) {
Paolo Bonzini1c96dcc2020-11-05 11:20:49 -05002923 clear_bit(KVM_APIC_INIT, &apic->pending_events);
Nadav Amitd28bc9d2015-04-13 14:34:08 +03002924 kvm_vcpu_reset(vcpu, true);
Jan Kiszka66450a22013-03-13 12:42:34 +01002925 if (kvm_vcpu_is_bsp(apic->vcpu))
2926 vcpu->arch.mp_state = KVM_MP_STATE_RUNNABLE;
2927 else
2928 vcpu->arch.mp_state = KVM_MP_STATE_INIT_RECEIVED;
2929 }
Maxim Levitskyf57ad632020-12-03 16:33:19 +02002930 if (test_bit(KVM_APIC_SIPI, &pe)) {
Paolo Bonzini1c96dcc2020-11-05 11:20:49 -05002931 clear_bit(KVM_APIC_SIPI, &apic->pending_events);
Maxim Levitskyf57ad632020-12-03 16:33:19 +02002932 if (vcpu->arch.mp_state == KVM_MP_STATE_INIT_RECEIVED) {
2933 /* evaluate pending_events before reading the vector */
2934 smp_rmb();
2935 sipi_vector = apic->sipi_vector;
Tom Lendacky647daca2021-01-04 14:20:01 -06002936 kvm_x86_ops.vcpu_deliver_sipi_vector(vcpu, sipi_vector);
Maxim Levitskyf57ad632020-12-03 16:33:19 +02002937 vcpu->arch.mp_state = KVM_MP_STATE_RUNNABLE;
2938 }
Jan Kiszka66450a22013-03-13 12:42:34 +01002939 }
Jim Mattson4fe09bc2021-06-04 10:26:04 -07002940 return 0;
Jan Kiszka66450a22013-03-13 12:42:34 +01002941}
2942
David Matlackcef84c32016-12-16 14:30:36 -08002943void kvm_lapic_exit(void)
2944{
2945 static_key_deferred_flush(&apic_hw_disabled);
Sean Christopherson9139a7a2021-10-12 17:35:54 -07002946 WARN_ON(static_branch_unlikely(&apic_hw_disabled.key));
David Matlackcef84c32016-12-16 14:30:36 -08002947 static_key_deferred_flush(&apic_sw_disabled);
Sean Christopherson9139a7a2021-10-12 17:35:54 -07002948 WARN_ON(static_branch_unlikely(&apic_sw_disabled.key));
David Matlackcef84c32016-12-16 14:30:36 -08002949}