blob: 4ceefa9567eda53be301147236be3a2874793d2e [file] [log] [blame]
Vegard Nossuma656c8e2008-07-22 21:27:11 +02001/*
Carsten Otte043405e2007-10-10 17:16:19 +02002 * Kernel-based Virtual Machine driver for Linux
3 *
4 * This header defines architecture specific interfaces, x86 version
5 *
6 * This work is licensed under the terms of the GNU GPL, version 2. See
7 * the COPYING file in the top-level directory.
8 *
9 */
10
H. Peter Anvin1965aae2008-10-22 22:26:29 -070011#ifndef _ASM_X86_KVM_HOST_H
12#define _ASM_X86_KVM_HOST_H
Carsten Otte043405e2007-10-10 17:16:19 +020013
Zhang Xiantao34c16ee2007-10-20 15:34:38 +080014#include <linux/types.h>
15#include <linux/mm.h>
Andrea Arcangelie930bff2008-07-25 16:24:52 +020016#include <linux/mmu_notifier.h>
Marcelo Tosatti229456f2009-06-17 09:22:14 -030017#include <linux/tracepoint.h>
Sheng Yangf5f48ee2010-06-30 12:25:15 +080018#include <linux/cpumask.h>
Zhang Xiantao34c16ee2007-10-20 15:34:38 +080019
20#include <linux/kvm.h>
21#include <linux/kvm_para.h>
Avi Kivityedf88412007-12-16 11:02:48 +020022#include <linux/kvm_types.h>
Zhang Xiantao34c16ee2007-10-20 15:34:38 +080023
Gerd Hoffmann50d0a0f2008-06-03 16:17:31 +020024#include <asm/pvclock-abi.h>
Hollis Blancharde01a1b52007-12-03 15:30:25 -060025#include <asm/desc.h>
Sheng Yang0bed3b52008-10-09 16:01:54 +080026#include <asm/mtrr.h>
Alexander Graf9962d032008-11-25 20:17:02 +010027#include <asm/msr-index.h>
Hollis Blancharde01a1b52007-12-03 15:30:25 -060028
/* Fixed limits and page-offset constants for the x86 KVM host. */
Sasha Levin8c3ba332011-07-18 17:17:15 +030029#define KVM_MAX_VCPUS 254
30#define KVM_SOFT_MAX_VCPUS 64
Avi Kivity69a9f692008-03-21 12:38:23 +020031#define KVM_MEMORY_SLOTS 32
32/* memory slots that are not exposed to userspace */
33#define KVM_PRIVATE_MEM_SLOTS 4
Avi Kivitycef4dea2010-01-20 12:01:20 +020034#define KVM_MMIO_SIZE 16
Avi Kivity69a9f692008-03-21 12:38:23 +020035
36#define KVM_PIO_PAGE_OFFSET 1
Laurent Vivier542472b2008-05-30 16:05:55 +020037#define KVM_COALESCED_MMIO_PAGE_OFFSET 2
Avi Kivity69a9f692008-03-21 12:38:23 +020038
/*
 * Reserved-bit masks for the guest control registers.
 *
 * The CR0, CR4 and CR8 masks are written as the complement of the bits that
 * are listed, i.e. every bit that is NOT named in the macro is reserved.
 */
Joerg Roedelcfec82c2011-04-04 12:39:28 +020039#define CR0_RESERVED_BITS \
40 (~(unsigned long)(X86_CR0_PE | X86_CR0_MP | X86_CR0_EM | X86_CR0_TS \
41 | X86_CR0_ET | X86_CR0_NE | X86_CR0_WP | X86_CR0_AM \
42 | X86_CR0_NW | X86_CR0_CD | X86_CR0_PG))
43
/*
 * NOTE(review): assuming X86_CR3_PWT and X86_CR3_PCD are the bit-3 and bit-4
 * masks (0x08 / 0x10), CR3_PAE_RESERVED_BITS expands to 0x17, which covers
 * bits 0-2 but also the PCD bit itself -- confirm that this is intended.
 * CR3_L_MODE_RESERVED_BITS adds the upper 24 bits (63:40) to the non-PAE mask.
 */
Zhang Xiantaocd6e8f82007-11-19 14:33:37 +080044#define CR3_PAE_RESERVED_BITS ((X86_CR3_PWT | X86_CR3_PCD) - 1)
45#define CR3_NONPAE_RESERVED_BITS ((PAGE_SIZE-1) & ~(X86_CR3_PWT | X86_CR3_PCD))
Joe Perches7d76b4d2008-03-23 01:02:34 -070046#define CR3_L_MODE_RESERVED_BITS (CR3_NONPAE_RESERVED_BITS | \
47 0xFFFFFF0000000000ULL)
Joerg Roedelcfec82c2011-04-04 12:39:28 +020048#define CR4_RESERVED_BITS \
49 (~(unsigned long)(X86_CR4_VME | X86_CR4_PVI | X86_CR4_TSD | X86_CR4_DE\
50 | X86_CR4_PSE | X86_CR4_PAE | X86_CR4_MCE \
51 | X86_CR4_PGE | X86_CR4_PCE | X86_CR4_OSFXSR \
Yang, Weid9c34762011-06-14 20:10:17 +080052 | X86_CR4_OSXSAVE | X86_CR4_SMEP | X86_CR4_RDWRGSFS \
Joerg Roedelcfec82c2011-04-04 12:39:28 +020053 | X86_CR4_OSXMMEXCPT | X86_CR4_VMXE))
54
55#define CR8_RESERVED_BITS (~(unsigned long)X86_CR8_TPR)
56
57
Zhang Xiantaocd6e8f82007-11-19 14:33:37 +080058
/*
 * All-ones sentinel values.  VALID_PAGE(x) is simply "x is not INVALID_PAGE".
 * Note that UNMAPPED_GVA is built from gpa_t even though its name says GVA.
 */
Zhang Xiantaocd6e8f82007-11-19 14:33:37 +080059#define INVALID_PAGE (~(hpa_t)0)
Xiao Guangrongdd180b32010-07-03 16:02:42 +080060#define VALID_PAGE(x) ((x) != INVALID_PAGE)
61
Zhang Xiantaocd6e8f82007-11-19 14:33:37 +080062#define UNMAPPED_GVA (~(gpa_t)0)
63
Joerg Roedelec04b262009-06-19 15:16:23 +020064/* KVM Hugepage definitions for x86 */
/*
 * 'x' is a 1-based page-size level (presumably 1..KVM_NR_PAGE_SIZES).  Each
 * level adds 9 bits of gfn shift, so level 1 is PAGE_SIZE, level 2 is
 * 512 pages and level 3 is 512 * 512 pages.
 */
Joerg Roedel04326ca2009-07-27 16:30:47 +020065#define KVM_NR_PAGE_SIZES 3
Joerg Roedel82855412010-07-01 16:00:11 +020066#define KVM_HPAGE_GFN_SHIFT(x) (((x) - 1) * 9)
67#define KVM_HPAGE_SHIFT(x) (PAGE_SHIFT + KVM_HPAGE_GFN_SHIFT(x))
Joerg Roedelec04b262009-06-19 15:16:23 +020068#define KVM_HPAGE_SIZE(x) (1UL << KVM_HPAGE_SHIFT(x))
69#define KVM_HPAGE_MASK(x) (~(KVM_HPAGE_SIZE(x) - 1))
70#define KVM_PAGES_PER_HPAGE(x) (KVM_HPAGE_SIZE(x) / PAGE_SIZE)
Marcelo Tosatti05da4552008-02-23 11:44:30 -030071
/*
 * Vector numbers, named after the exception mnemonics
 * (presumably the architectural x86 exception vectors, e.g. 13 = #GP,
 * 14 = #PF -- confirm against the processor manual).
 */
Zhang Xiantaocd6e8f82007-11-19 14:33:37 +080072#define DE_VECTOR 0
Jan Kiszka19bd8af2008-07-13 13:40:55 +020073#define DB_VECTOR 1
Jan Kiszka77ab6db2008-07-14 12:28:51 +020074#define BP_VECTOR 3
75#define OF_VECTOR 4
76#define BR_VECTOR 5
Zhang Xiantaocd6e8f82007-11-19 14:33:37 +080077#define UD_VECTOR 6
78#define NM_VECTOR 7
79#define DF_VECTOR 8
80#define TS_VECTOR 10
81#define NP_VECTOR 11
82#define SS_VECTOR 12
83#define GP_VECTOR 13
84#define PF_VECTOR 14
Jan Kiszka77ab6db2008-07-14 12:28:51 +020085#define MF_VECTOR 16
Joerg Roedel53371b52008-04-09 14:15:30 +020086#define MC_VECTOR 18
Zhang Xiantaocd6e8f82007-11-19 14:33:37 +080087
/* Masks for bit 2 (TI) and bits 1:0 (RPL) of a segment selector value. */
88#define SELECTOR_TI_MASK (1 << 2)
89#define SELECTOR_RPL_MASK 0x03
90
91#define IOPL_SHIFT 12
92
/*
 * MMU sizing constants.  KVM_NUM_MMU_PAGES (1 << KVM_MMU_HASH_SHIFT) is the
 * number of buckets in kvm_arch.mmu_page_hash[]; KVM_MAX_CPUID_ENTRIES sizes
 * kvm_vcpu_arch.cpuid_entries[].
 */
Zhang Xiantaod657a982007-12-14 09:41:22 +080093#define KVM_PERMILLE_MMU_PAGES 20
94#define KVM_MIN_ALLOC_MMU_PAGES 64
Dong, Eddie1ae0a132008-01-07 13:20:25 +020095#define KVM_MMU_HASH_SHIFT 10
96#define KVM_NUM_MMU_PAGES (1 << KVM_MMU_HASH_SHIFT)
Zhang Xiantaod657a982007-12-14 09:41:22 +080097#define KVM_MIN_FREE_MMU_PAGES 5
98#define KVM_REFILL_PAGES 25
Andre Przywara73c11602010-12-01 12:17:44 +010099#define KVM_MAX_CPUID_ENTRIES 80
Sheng Yang0bed3b52008-10-09 16:01:54 +0800100#define KVM_NR_FIXED_MTRR_REGION 88
Avi Kivity9ba075a2008-05-26 20:06:35 +0300101#define KVM_NR_VAR_MTRR 8
Zhang Xiantaod657a982007-12-14 09:41:22 +0800102
/* Rounded up to a power of two to size kvm_vcpu_arch.apf.gfns[]. */
Gleb Natapovaf585b92010-10-14 11:22:46 +0200103#define ASYNC_PF_PER_VCPU 64
104
/* External globals, followed by forward declarations of structure types. */
Jan Kiszkae935b832011-02-08 12:55:33 +0100105extern raw_spinlock_t kvm_lock;
Zhang Xiantaoe9b11c12007-11-14 20:38:21 +0800106extern struct list_head vm_list;
107
Zhang Xiantaod657a982007-12-14 09:41:22 +0800108struct kvm_vcpu;
109struct kvm;
Gleb Natapovaf585b92010-10-14 11:22:46 +0200110struct kvm_async_pf;
Zhang Xiantaod657a982007-12-14 09:41:22 +0800111
/*
 * Register identifiers; NR_VCPU_REGS sizes kvm_vcpu_arch.regs[].
 *
 * R8-R15 only exist when CONFIG_X86_64 is set, so VCPU_REGS_RIP (which takes
 * the next free value) is 8 on 32-bit builds and 16 on 64-bit builds, and
 * NR_VCPU_REGS is 9 or 17 respectively.
 */
Marcelo Tosatti5fdbf972008-06-27 14:58:02 -0300112enum kvm_reg {
Zhang Xiantao2b3ccfa2007-11-19 14:56:05 +0800113 VCPU_REGS_RAX = 0,
114 VCPU_REGS_RCX = 1,
115 VCPU_REGS_RDX = 2,
116 VCPU_REGS_RBX = 3,
117 VCPU_REGS_RSP = 4,
118 VCPU_REGS_RBP = 5,
119 VCPU_REGS_RSI = 6,
120 VCPU_REGS_RDI = 7,
121#ifdef CONFIG_X86_64
122 VCPU_REGS_R8 = 8,
123 VCPU_REGS_R9 = 9,
124 VCPU_REGS_R10 = 10,
125 VCPU_REGS_R11 = 11,
126 VCPU_REGS_R12 = 12,
127 VCPU_REGS_R13 = 13,
128 VCPU_REGS_R14 = 14,
129 VCPU_REGS_R15 = 15,
130#endif
Marcelo Tosatti5fdbf972008-06-27 14:58:02 -0300131 VCPU_REGS_RIP,
Zhang Xiantao2b3ccfa2007-11-19 14:56:05 +0800132 NR_VCPU_REGS
133};
134
/*
 * Extra register identifiers.  Numbering starts at NR_VCPU_REGS so the values
 * never collide with enum kvm_reg.
 * NOTE(review): presumably these share the regs_avail / regs_dirty bitmasks
 * in kvm_vcpu_arch with enum kvm_reg -- confirm against the users.
 */
Avi Kivity6de4f3a2009-05-31 22:58:47 +0300135enum kvm_reg_ex {
136 VCPU_EXREG_PDPTR = NR_VCPU_REGS,
Avi Kivityaff48ba2010-12-05 18:56:11 +0200137 VCPU_EXREG_CR3,
Avi Kivity6de12732011-03-07 12:51:22 +0200138 VCPU_EXREG_RFLAGS,
Avi Kivity69c73022011-03-07 15:26:44 +0200139 VCPU_EXREG_CPL,
Avi Kivity2fb92db2011-04-27 19:42:18 +0300140 VCPU_EXREG_SEGMENTS,
141};
142
/*
 * Segment register identifiers, numbered 0 (ES) through 7 (LDTR).
 * NOTE(review): presumably the values passed as the 'seg' argument of the
 * kvm_x86_ops segment callbacks -- confirm against the callers.
 */
Zhang Xiantao2b3ccfa2007-11-19 14:56:05 +0800143enum {
Zhang Xiantao2b3ccfa2007-11-19 14:56:05 +0800144 VCPU_SREG_ES,
Avi Kivity81609e32008-05-27 16:26:01 +0300145 VCPU_SREG_CS,
146 VCPU_SREG_SS,
147 VCPU_SREG_DS,
Zhang Xiantao2b3ccfa2007-11-19 14:56:05 +0800148 VCPU_SREG_FS,
149 VCPU_SREG_GS,
Zhang Xiantao2b3ccfa2007-11-19 14:56:05 +0800150 VCPU_SREG_TR,
151 VCPU_SREG_LDTR,
152};
153
Avi Kivity56e82312009-08-12 15:04:37 +0300154#include <asm/kvm_emulate.h>
Zhang Xiantao2b3ccfa2007-11-19 14:56:05 +0800155
/* Capacity of kvm_mmu_memory_cache.objects[]. */
Zhang Xiantaod657a982007-12-14 09:41:22 +0800156#define KVM_NR_MEM_OBJS 40
157
/* Number of entries in kvm_vcpu_arch.db[] and kvm_vcpu_arch.eff_db[]. */
Jan Kiszka42dbaa52008-12-15 13:52:10 +0100158#define KVM_NR_DB_REGS 4
159
/* Bit masks for the DR6 and DR7 debug registers. */
160#define DR6_BD (1 << 13)
161#define DR6_BS (1 << 14)
162#define DR6_FIXED_1 0xffff0ff0
163#define DR6_VOLATILE 0x0000e00f
164
165#define DR7_BP_EN_MASK 0x000000ff
166#define DR7_GE (1 << 9)
167#define DR7_GD (1 << 13)
168#define DR7_FIXED_1 0x00000400
169#define DR7_VOLATILE 0xffff23ff
170
Zhang Xiantaod657a982007-12-14 09:41:22 +0800171/*
 * We don't want allocation failures within the mmu code, so we preallocate
 * enough memory for a single page fault in a cache.
 *
 * The cache holds up to KVM_NR_MEM_OBJS object pointers.
 * NOTE(review): 'nobjs' is presumably the number of objects[] slots currently
 * filled -- confirm against the cache fill/alloc helpers.
 */
175struct kvm_mmu_memory_cache {
176 int nobjs;
177 void *objects[KVM_NR_MEM_OBJS];
178};
179
/*
 * A kvm_pte_chain holds up to NR_PTE_CHAIN_ENTRIES pointers to parent ptes
 * and is linked into an hlist through 'link'.
 */
180#define NR_PTE_CHAIN_ENTRIES 5
181
182struct kvm_pte_chain {
183 u64 *parent_ptes[NR_PTE_CHAIN_ENTRIES];
184 struct hlist_node link;
185};
186
187/*
 * kvm_mmu_page_role describes a shadow page.  It can be accessed as a whole
 * through 'word' or field by field through the anonymous bit-field struct.
 *
 * Fields in declaration order.  The bit positions assume LSB-first bit-field
 * allocation (what the x86 ABI specifies); the C language itself does not
 * dictate them:
 *
 *   bits  0:3   level      - page table level for this shadow (1-4)
 *   bit   4     cr4_pae
 *   bits  5:6   quadrant   - page table quadrant for 2-level guests
 *   bits  7:12  pad_for_nice_hex_output
 *   bit   13    direct     - direct mapping of virtual to physical mapping
 *                            at gfn; used for real mode and two-dimensional
 *                            paging
 *   bits 14:16  access     - common access permissions for all ptes in this
 *                            shadow page
 *   bit   17    invalid
 *   bit   18    nxe
 *   bit   19    cr0_wp
 *   bit   20    smep_andnot_wp
 *
 * NOTE(review): an earlier revision of this comment listed a "total guest
 * paging levels" field in bits 0:3 and different positions for the other
 * fields; the struct below has no such field, so that layout was stale.
 */
197union kvm_mmu_page_role {
198 unsigned word;
199 struct {
Joe Perches7d76b4d2008-03-23 01:02:34 -0700200 unsigned level:4;
Avi Kivity5b7e0102010-04-14 19:20:03 +0300201 unsigned cr4_pae:1;
Joe Perches7d76b4d2008-03-23 01:02:34 -0700202 unsigned quadrant:2;
203 unsigned pad_for_nice_hex_output:6;
Avi Kivityf6e2c02b2009-01-11 13:02:10 +0200204 unsigned direct:1;
Joe Perches7d76b4d2008-03-23 01:02:34 -0700205 unsigned access:3;
Marcelo Tosatti2e53d632008-02-20 14:47:24 -0500206 unsigned invalid:1;
Avi Kivity9645bb562009-03-31 11:31:54 +0300207 unsigned nxe:1;
Avi Kivity3dbe1412010-05-12 11:48:18 +0300208 unsigned cr0_wp:1;
Avi Kivity411c5882011-06-06 16:11:54 +0300209 unsigned smep_andnot_wp:1;
Zhang Xiantaod657a982007-12-14 09:41:22 +0800210 };
211};
212
/*
 * Bookkeeping for one shadow page table page.  The page is linked into a
 * list ('link') and a hash chain ('hash_link'), and is keyed by (gfn, role).
 */
213struct kvm_mmu_page {
214 struct list_head link;
215 struct hlist_node hash_link;
216
217 /*
218 * The following two entries are used to key the shadow page in the
219 * hash table.
220 */
221 gfn_t gfn;
222 union kvm_mmu_page_role role;
223
224 u64 *spt;
225 /* hold the gfn of each spte inside spt */
226 gfn_t *gfns;
Sheng Yang291f26b2008-10-16 17:30:57 +0800227 /*
228 * One bit set per slot which has memory
229 * in this shadow page.
 * The bitmap covers both the user-visible and the private memory slots.
230 */
231 DECLARE_BITMAP(slot_bitmap, KVM_MEMORY_SLOTS + KVM_PRIVATE_MEM_SLOTS);
Marcelo Tosatti4731d4c2008-09-23 13:18:39 -0300232 bool unsync;
Xiao Guangrong0571d362010-04-16 21:27:54 +0800233 int root_count; /* Currently serving as active root */
Marcelo Tosatti60c8aec2008-12-01 22:32:02 -0200234 unsigned int unsync_children;
Xiao Guangrong67052b32011-05-15 23:27:08 +0800235 unsigned long parent_ptes; /* Reverse mapping for parent_pte */
Marcelo Tosatti0074ff62008-09-23 13:18:40 -0300236 DECLARE_BITMAP(unsync_child_bitmap, 512);
Xiao Guangrongc2a2ac22011-07-12 03:32:13 +0800237
/* clear_spte_count only exists on 32-bit (CONFIG_X86_32) builds. */
238#ifdef CONFIG_X86_32
239 int clear_spte_count;
240#endif
241
242 struct rcu_head rcu;
Zhang Xiantaod657a982007-12-14 09:41:22 +0800243};
244
/*
 * Buffer state for kvm_pv_mmu_op(); embedded in kvm_vcpu_arch as
 * 'mmu_op_buffer'.  'buf' is 512 bytes, aligned to sizeof(long).
 * NOTE(review): 'ptr', 'len' and 'processed' presumably track a cursor into
 * 'buf', the bytes available and the bytes consumed -- confirm against
 * kvm_pv_mmu_op().
 */
Dave Hansen6ad18fb2008-08-11 10:01:49 -0700245struct kvm_pv_mmu_op_buffer {
246 void *ptr;
247 unsigned len;
248 unsigned processed;
249 char buf[512] __aligned(sizeof(long));
250};
251
/*
 * Description of a port I/O request; embedded in kvm_vcpu_arch as 'pio'.
 * NOTE(review): 'in' is presumably non-zero for an IN (read) access and
 * 'size' the width of each of the 'count' transfers -- confirm with the
 * PIO emulation code.
 */
Avi Kivity1c083642009-01-04 12:39:07 +0200252struct kvm_pio_request {
253 unsigned long count;
Avi Kivity1c083642009-01-04 12:39:07 +0200254 int in;
255 int port;
256 int size;
Avi Kivity1c083642009-01-04 12:39:07 +0200257};
258
Zhang Xiantaod657a982007-12-14 09:41:22 +0800259/*
 * x86 supports 3 paging modes (4-level 64-bit, 3-level 64-bit, and 2-level
 * 32-bit). The kvm_mmu structure abstracts the details of the current mmu
 * mode.
 *
 * The structure is a set of per-mode callbacks followed by the state they
 * operate on (root page, paging levels, base role, reserved-bit masks and
 * the PAE pdptrs).  kvm_vcpu_arch embeds two instances, 'mmu' and
 * 'nested_mmu'.
263 */
264struct kvm_mmu {
265 void (*new_cr3)(struct kvm_vcpu *vcpu);
Joerg Roedelf43addd2010-09-10 17:30:40 +0200266 void (*set_cr3)(struct kvm_vcpu *vcpu, unsigned long root);
Joerg Roedel5777ed32010-09-10 17:30:42 +0200267 unsigned long (*get_cr3)(struct kvm_vcpu *vcpu);
Avi Kivitye4e517b2011-07-28 11:36:17 +0300268 u64 (*get_pdptr)(struct kvm_vcpu *vcpu, int index);
Xiao Guangrong78b2c542010-12-07 10:48:06 +0800269 int (*page_fault)(struct kvm_vcpu *vcpu, gva_t gva, u32 err,
270 bool prefault);
Avi Kivity6389ee92010-11-29 16:12:30 +0200271 void (*inject_page_fault)(struct kvm_vcpu *vcpu,
272 struct x86_exception *fault);
Zhang Xiantaod657a982007-12-14 09:41:22 +0800273 void (*free)(struct kvm_vcpu *vcpu);
Gleb Natapov1871c602010-02-10 14:21:32 +0200274 gpa_t (*gva_to_gpa)(struct kvm_vcpu *vcpu, gva_t gva, u32 access,
Avi Kivityab9ae312010-11-22 17:53:26 +0200275 struct x86_exception *exception);
Joerg Roedelc30a3582010-09-10 17:30:48 +0200276 gpa_t (*translate_gpa)(struct kvm_vcpu *vcpu, gpa_t gpa, u32 access);
Marcelo Tosattie8bc2172008-09-23 13:18:33 -0300277 int (*sync_page)(struct kvm_vcpu *vcpu,
Xiao Guangronga4a8e6f2010-11-19 17:04:03 +0800278 struct kvm_mmu_page *sp);
Marcelo Tosattia7052892008-09-23 13:18:35 -0300279 void (*invlpg)(struct kvm_vcpu *vcpu, gva_t gva);
Xiao Guangrong0f53b5b2011-03-09 15:43:51 +0800280 void (*update_pte)(struct kvm_vcpu *vcpu, struct kvm_mmu_page *sp,
Xiao Guangrong7c562522011-03-28 10:29:27 +0800281 u64 *spte, const void *pte);
Zhang Xiantaod657a982007-12-14 09:41:22 +0800282 hpa_t root_hpa;
283 int root_level;
284 int shadow_root_level;
Avi Kivitya770f6f2008-12-21 19:20:09 +0200285 union kvm_mmu_page_role base_role;
Joerg Roedelc5a78f2b2010-09-10 17:30:39 +0200286 bool direct_map;
Zhang Xiantaod657a982007-12-14 09:41:22 +0800287
288 u64 *pae_root;
Joerg Roedel81407ca2010-09-10 17:31:00 +0200289 u64 *lm_root;
Dong, Eddie82725b22009-03-30 16:21:08 +0800290 u64 rsvd_bits_mask[2][4];
Joerg Roedelff03a072010-09-10 17:30:57 +0200291
Joerg Roedel2d48a982010-09-10 17:31:01 +0200292 bool nx;
293
Joerg Roedelff03a072010-09-10 17:30:57 +0200294 u64 pdptrs[4]; /* pae */
Zhang Xiantaod657a982007-12-14 09:41:22 +0800295};
296
/*
 * x86-specific per-vcpu state: general and control registers, the MMU
 * contexts and their memory caches, FPU state, pending exception/interrupt/
 * NMI bookkeeping, CPUID entries, the emulator context, clock and TSC state,
 * MTRR and debug registers, machine-check state and async page fault data.
 */
Zhang Xiantaoad312c72007-12-13 23:50:52 +0800297struct kvm_vcpu_arch {
Marcelo Tosatti5fdbf972008-06-27 14:58:02 -0300298 /*
299 * rip and regs accesses must go through
300 * kvm_{register,rip}_{read,write} functions.
301 */
302 unsigned long regs[NR_VCPU_REGS];
303 u32 regs_avail;
304 u32 regs_dirty;
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800305
306 unsigned long cr0;
Avi Kivitye8467fd2009-12-29 18:43:06 +0200307 unsigned long cr0_guest_owned_bits;
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800308 unsigned long cr2;
309 unsigned long cr3;
310 unsigned long cr4;
Avi Kivityfc78f512009-12-07 12:16:48 +0200311 unsigned long cr4_guest_owned_bits;
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800312 unsigned long cr8;
Alexander Graf1371d902008-11-25 20:17:04 +0100313 u32 hflags;
Avi Kivityf6801df2010-01-21 15:31:50 +0200314 u64 efer;
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800315 u64 apic_base;
316 struct kvm_lapic *apic; /* kernel irqchip context */
Gleb Natapove1035712009-03-05 16:34:59 +0200317 int32_t apic_arb_prio;
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800318 int mp_state;
319 int sipi_vector;
320 u64 ia32_misc_enable_msr;
Avi Kivityb209749f2007-10-22 16:50:39 +0200321 bool tpr_access_reporting;
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800322
Joerg Roedel14dfe852010-09-10 17:30:49 +0200323 /*
324 * Paging state of the vcpu
325 *
326 * If the vcpu runs in guest mode with two level paging this still saves
327 * the paging mode of the l1 guest. This context is always used to
328 * handle faults.
329 */
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800330 struct kvm_mmu mmu;
Joerg Roedel8df25a32010-09-10 17:30:46 +0200331
332 /*
Joerg Roedel6539e732010-09-10 17:30:50 +0200333 * Paging state of an L2 guest (used for nested npt)
334 *
335 * This context will save all necessary information to walk page tables
336 * of an L2 guest. This context is only initialized for page table
337 * walking and not for faulting since we never handle l2 page faults on
338 * the host.
339 */
340 struct kvm_mmu nested_mmu;
341
342 /*
Joerg Roedel14dfe852010-09-10 17:30:49 +0200343 * Pointer to the mmu context currently used for
344 * gva_to_gpa translations.
345 */
346 struct kvm_mmu *walk_mmu;
347
Dave Hansen6ad18fb2008-08-11 10:01:49 -0700348 /* only needed in kvm_pv_mmu_op() path, but it's hot so
349 * put it here to avoid allocation */
350 struct kvm_pv_mmu_op_buffer mmu_op_buffer;
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800351
Xiao Guangrong53c07b12011-05-15 23:26:20 +0800352 struct kvm_mmu_memory_cache mmu_pte_list_desc_cache;
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800353 struct kvm_mmu_memory_cache mmu_page_cache;
354 struct kvm_mmu_memory_cache mmu_page_header_cache;
355
356 gfn_t last_pt_write_gfn;
357 int last_pt_write_count;
358 u64 *last_pte_updated;
Avi Kivity1b7fcd32008-05-15 13:51:35 +0300359 gfn_t last_pte_gfn;
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800360
Sheng Yang98918832010-05-17 17:08:28 +0800361 struct fpu guest_fpu;
Dexuan Cui2acf9232010-06-10 11:27:12 +0800362 u64 xcr0;
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800363
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800364 struct kvm_pio_request pio;
365 void *pio_data;
366
Gleb Natapov66fd3f72009-05-11 13:35:50 +0300367 u8 event_exit_inst_len;
368
Avi Kivity298101d2007-11-25 13:41:11 +0200369 struct kvm_queued_exception {
370 bool pending;
371 bool has_error_code;
Joerg Roedelce7ddec2010-04-22 12:33:13 +0200372 bool reinject;
Avi Kivity298101d2007-11-25 13:41:11 +0200373 u8 nr;
374 u32 error_code;
375 } exception;
376
Avi Kivity937a7ea2008-07-03 15:17:01 +0300377 struct kvm_queued_interrupt {
378 bool pending;
Gleb Natapov66fd3f72009-05-11 13:35:50 +0300379 bool soft;
Avi Kivity937a7ea2008-07-03 15:17:01 +0300380 u8 nr;
381 } interrupt;
382
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800383 int halt_request; /* real mode on Intel only */
384
385 int cpuid_nent;
Dan Kenigsberg07716712007-11-21 17:10:04 +0200386 struct kvm_cpuid_entry2 cpuid_entries[KVM_MAX_CPUID_ENTRIES];
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800387 /* emulate context */
388
389 struct x86_emulate_ctxt emulate_ctxt;
Gleb Natapov7ae441e2011-03-31 12:06:41 +0200390 bool emulate_regs_need_sync_to_vcpu;
391 bool emulate_regs_need_sync_from_vcpu;
Glauber de Oliveira Costa18068522008-02-15 17:52:47 -0200392
393 gpa_t time;
Gerd Hoffmann50d0a0f2008-06-03 16:17:31 +0200394 struct pvclock_vcpu_time_info hv_clock;
Zachary Amsdene48672f2010-08-19 22:07:23 -1000395 unsigned int hw_tsc_khz;
Glauber de Oliveira Costa18068522008-02-15 17:52:47 -0200396 unsigned int time_offset;
397 struct page *time_page;
Glauber Costac9aaa892011-07-11 15:28:14 -0400398
/* Steal-time accounting state. */
399 struct {
400 u64 msr_val;
401 u64 last_steal;
402 u64 accum_steal;
403 struct gfn_to_hva_cache stime;
404 struct kvm_steal_time steal;
405 } st;
406
Zachary Amsden1d5f0662010-08-19 22:07:30 -1000407 u64 last_guest_tsc;
408 u64 last_kernel_ns;
Zachary Amsdenc2855452010-09-18 14:38:15 -1000409 u64 last_tsc_nsec;
410 u64 last_tsc_write;
Joerg Roedel1e993612011-03-25 09:44:47 +0100411 u32 virtual_tsc_khz;
Zachary Amsdenc2855452010-09-18 14:38:15 -1000412 bool tsc_catchup;
Joerg Roedel1e993612011-03-25 09:44:47 +0100413 u32 tsc_catchup_mult;
414 s8 tsc_catchup_shift;
Sheng Yang3419ffc2008-05-15 09:52:48 +0800415
Avi Kivity7460fb4a2011-09-20 13:43:14 +0300416 atomic_t nmi_queued; /* unprocessed asynchronous NMIs */
417 unsigned nmi_pending; /* NMI queued after currently running handler */
418 bool nmi_injected; /* Trying to inject an NMI this entry */
Avi Kivity9ba075a2008-05-26 20:06:35 +0300419
Sheng Yang0bed3b52008-10-09 16:01:54 +0800420 struct mtrr_state_type mtrr_state;
421 u32 pat;
Jan Kiszka42dbaa52008-12-15 13:52:10 +0100422
423 int switch_db_regs;
Jan Kiszka42dbaa52008-12-15 13:52:10 +0100424 unsigned long db[KVM_NR_DB_REGS];
425 unsigned long dr6;
426 unsigned long dr7;
427 unsigned long eff_db[KVM_NR_DB_REGS];
Huang Ying890ca9a2009-05-11 16:48:15 +0800428
429 u64 mcg_cap;
430 u64 mcg_status;
431 u64 mcg_ctl;
432 u64 *mce_banks;
Jan Kiszka94fe45d2009-10-18 13:24:44 +0200433
Xiao Guangrongbebb1062011-07-12 03:23:20 +0800434 /* Cache MMIO info */
435 u64 mmio_gva;
436 unsigned access;
437 gfn_t mmio_gfn;
438
Jan Kiszka94fe45d2009-10-18 13:24:44 +0200439 /* used for guest single stepping over the given code position */
Jan Kiszka94fe45d2009-10-18 13:24:44 +0200440 unsigned long singlestep_rip;
Jan Kiszkaf92653e2010-02-23 17:47:55 +0100441
Gleb Natapov10388a02010-01-17 15:51:23 +0200442 /* fields used by HYPER-V emulation */
443 u64 hv_vapic;
Sheng Yangf5f48ee2010-06-30 12:25:15 +0800444
445 cpumask_var_t wbinvd_dirty_mask;
Gleb Natapovaf585b92010-10-14 11:22:46 +0200446
Xiao Guangrong1cb3f3a2011-09-22 17:02:48 +0800447 unsigned long last_retry_eip;
448 unsigned long last_retry_addr;
449
/* Async page fault state; gfns[] has ASYNC_PF_PER_VCPU rounded up to 2^n slots. */
Gleb Natapovaf585b92010-10-14 11:22:46 +0200450 struct {
451 bool halted;
452 gfn_t gfns[roundup_pow_of_two(ASYNC_PF_PER_VCPU)];
Gleb Natapov344d9582010-10-14 11:22:50 +0200453 struct gfn_to_hva_cache data;
454 u64 msr_val;
Gleb Natapov7c907052010-10-14 11:22:53 +0200455 u32 id;
Gleb Natapov6adba522010-10-14 11:22:55 +0200456 bool send_user_only;
Gleb Natapovaf585b92010-10-14 11:22:46 +0200457 } apf;
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800458};
459
/*
 * x86-specific per-VM state: shadow MMU page accounting and lookup
 * structures, device assignment / IOMMU state, the in-kernel interrupt
 * controller and timer objects, EPT identity map state, clock/TSC tracking
 * and Hyper-V / Xen configuration.
 */
Marcelo Tosattifef9cce2009-12-23 14:35:17 -0200460struct kvm_arch {
Dave Hansen49d5ca22010-08-19 18:11:28 -0700461 unsigned int n_used_mmu_pages;
Zhang Xiantaof05e70a2007-12-14 10:01:48 +0800462 unsigned int n_requested_mmu_pages;
Dave Hansen39de71e2010-08-19 18:11:14 -0700463 unsigned int n_max_mmu_pages;
Xiao Guangrong332b2072011-05-15 23:20:27 +0800464 unsigned int indirect_shadow_pages;
Avi Kivity08e850c2010-03-15 13:59:57 +0200465 atomic_t invlpg_counter;
Zhang Xiantaof05e70a2007-12-14 10:01:48 +0800466 struct hlist_head mmu_page_hash[KVM_NUM_MMU_PAGES];
467 /*
468 * Hash table of struct kvm_mmu_page.
 * NOTE(review): this comment appears to describe mmu_page_hash[]
 * above rather than active_mmu_pages below.
469 */
470 struct list_head active_mmu_pages;
Ben-Ami Yassour4d5c5d02008-07-28 19:26:26 +0300471 struct list_head assigned_dev_head;
Joerg Roedel19de40a2008-12-03 14:43:34 +0100472 struct iommu_domain *iommu_domain;
Sheng Yang522c68c2009-04-27 20:35:43 +0800473 int iommu_flags;
Zhang Xiantaod7deeeb02007-12-14 10:17:34 +0800474 struct kvm_pic *vpic;
475 struct kvm_ioapic *vioapic;
Sheng Yang78376992008-01-28 05:10:22 +0800476 struct kvm_pit *vpit;
Jan Kiszkacc6e4622008-10-20 10:20:03 +0200477 int vapics_in_nmi_mode;
Zhang Xiantaobfc6d222007-12-14 10:20:16 +0800478
Zhang Xiantaobfc6d222007-12-14 10:20:16 +0800479 unsigned int tss_addr;
480 struct page *apic_access_page;
Glauber de Oliveira Costa18068522008-02-15 17:52:47 -0200481
482 gpa_t wall_clock;
Sheng Yangb7ebfb02008-04-25 21:44:52 +0800483
484 struct page *ept_identity_pagetable;
485 bool ept_identity_pagetable_done;
Sheng Yangb927a3c2009-07-21 10:42:48 +0800486 gpa_t ept_identity_map_addr;
Sheng Yang5550af42008-10-15 20:15:06 +0800487
488 unsigned long irq_sources_bitmap;
Glauber Costaafbcf7a2009-10-16 15:28:36 -0400489 s64 kvmclock_offset;
Jan Kiszka038f8c12011-02-04 10:49:11 +0100490 raw_spinlock_t tsc_write_lock;
Zachary Amsdenf38e0982010-08-19 22:07:20 -1000491 u64 last_tsc_nsec;
492 u64 last_tsc_offset;
493 u64 last_tsc_write;
Ed Swierkffde22a2009-10-15 15:21:43 -0700494
495 struct kvm_xen_hvm_config xen_hvm_config;
Gleb Natapov55cd8e52010-01-17 15:51:22 +0200496
497 /* fields used by HYPER-V emulation */
498 u64 hv_guest_os_id;
499 u64 hv_hypercall;
Xiao Guangrongb034cf02010-12-23 16:08:35 +0800500
Xiao Guangrongc2a2ac22011-07-12 03:32:13 +0800501 atomic_t reader_counter;
502
/* audit_point only exists when CONFIG_KVM_MMU_AUDIT is enabled. */
Xiao Guangrongb034cf02010-12-23 16:08:35 +0800503 #ifdef CONFIG_KVM_MMU_AUDIT
504 int audit_point;
505 #endif
Zhang Xiantaod69fb812007-12-14 09:54:20 +0800506};
507
/* Per-VM statistics; every field is a 32-bit counter. */
Zhang Xiantao07114562007-12-14 10:23:23 +0800508struct kvm_vm_stat {
509 u32 mmu_shadow_zapped;
510 u32 mmu_pte_write;
511 u32 mmu_pte_updated;
512 u32 mmu_pde_zapped;
513 u32 mmu_flooded;
514 u32 mmu_recycled;
Avi Kivitydfc5aa02007-12-18 19:47:18 +0200515 u32 mmu_cache_miss;
Marcelo Tosatti4731d4c2008-09-23 13:18:39 -0300516 u32 mmu_unsync;
Zhang Xiantao07114562007-12-14 10:23:23 +0800517 u32 remote_tlb_flush;
Marcelo Tosatti05da4552008-02-23 11:44:30 -0300518 u32 lpages;
Zhang Xiantao07114562007-12-14 10:23:23 +0800519};
520
/* Per-vcpu statistics; every field is a 32-bit counter. */
Zhang Xiantao77b4c252007-12-14 09:49:26 +0800521struct kvm_vcpu_stat {
522 u32 pf_fixed;
523 u32 pf_guest;
524 u32 tlb_flush;
525 u32 invlpg;
526
527 u32 exits;
528 u32 io_exits;
529 u32 mmio_exits;
530 u32 signal_exits;
531 u32 irq_window_exits;
Sheng Yangf08864b2008-05-15 18:23:25 +0800532 u32 nmi_window_exits;
Zhang Xiantao77b4c252007-12-14 09:49:26 +0800533 u32 halt_exits;
534 u32 halt_wakeup;
535 u32 request_irq_exits;
536 u32 irq_exits;
537 u32 host_state_reload;
538 u32 efer_reload;
539 u32 fpu_reload;
540 u32 insn_emulation;
541 u32 insn_emulation_fail;
Amit Shahf11c3a82008-02-21 01:00:30 +0530542 u32 hypercalls;
Avi Kivityfa89a812008-09-01 15:57:51 +0300543 u32 irq_injections;
Jan Kiszkac4abb7c2008-09-26 09:30:55 +0200544 u32 nmi_injections;
Zhang Xiantao77b4c252007-12-14 09:49:26 +0800545};
Zhang Xiantaoad312c72007-12-13 23:50:52 +0800546
Joerg Roedel8a76d7f2011-04-04 12:39:27 +0200547struct x86_instruction_info;
548
/*
 * Table of callbacks through which the common x86 KVM code drives the
 * hardware-specific back end; the active table is reached through the
 * 'kvm_x86_ops' pointer declared below.
 * NOTE(review): presumably one instance is provided per virtualization
 * extension (e.g. by the Intel and AMD modules) -- confirm with the
 * implementations.
 * Entries marked __init or __exit in the trailing comments are only meant to
 * be called during module setup or teardown.
 */
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800549struct kvm_x86_ops {
550 int (*cpu_has_kvm_support)(void); /* __init */
551 int (*disabled_by_bios)(void); /* __init */
Alexander Graf10474ae2009-09-15 11:37:46 +0200552 int (*hardware_enable)(void *dummy);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800553 void (*hardware_disable)(void *dummy);
554 void (*check_processor_compatibility)(void *rtn);
555 int (*hardware_setup)(void); /* __init */
556 void (*hardware_unsetup)(void); /* __exit */
Avi Kivity774ead32007-12-26 13:57:04 +0200557 bool (*cpu_has_accelerated_tpr)(void);
Sheng Yang0e851882009-12-18 16:48:46 +0800558 void (*cpuid_update)(struct kvm_vcpu *vcpu);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800559
560 /* Create, but do not attach this VCPU */
561 struct kvm_vcpu *(*vcpu_create)(struct kvm *kvm, unsigned id);
562 void (*vcpu_free)(struct kvm_vcpu *vcpu);
563 int (*vcpu_reset)(struct kvm_vcpu *vcpu);
564
565 void (*prepare_guest_switch)(struct kvm_vcpu *vcpu);
566 void (*vcpu_load)(struct kvm_vcpu *vcpu, int cpu);
567 void (*vcpu_put)(struct kvm_vcpu *vcpu);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800568
Jan Kiszka355be0b2009-10-03 00:31:21 +0200569 void (*set_guest_debug)(struct kvm_vcpu *vcpu,
570 struct kvm_guest_debug *dbg);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800571 int (*get_msr)(struct kvm_vcpu *vcpu, u32 msr_index, u64 *pdata);
572 int (*set_msr)(struct kvm_vcpu *vcpu, u32 msr_index, u64 data);
573 u64 (*get_segment_base)(struct kvm_vcpu *vcpu, int seg);
574 void (*get_segment)(struct kvm_vcpu *vcpu,
575 struct kvm_segment *var, int seg);
Izik Eidus2e4d2652008-03-24 19:38:34 +0200576 int (*get_cpl)(struct kvm_vcpu *vcpu);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800577 void (*set_segment)(struct kvm_vcpu *vcpu,
578 struct kvm_segment *var, int seg);
579 void (*get_cs_db_l_bits)(struct kvm_vcpu *vcpu, int *db, int *l);
Avi Kivitye8467fd2009-12-29 18:43:06 +0200580 void (*decache_cr0_guest_bits)(struct kvm_vcpu *vcpu);
Avi Kivityaff48ba2010-12-05 18:56:11 +0200581 void (*decache_cr3)(struct kvm_vcpu *vcpu);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800582 void (*decache_cr4_guest_bits)(struct kvm_vcpu *vcpu);
583 void (*set_cr0)(struct kvm_vcpu *vcpu, unsigned long cr0);
584 void (*set_cr3)(struct kvm_vcpu *vcpu, unsigned long cr3);
Nadav Har'El5e1746d2011-05-25 23:03:24 +0300585 int (*set_cr4)(struct kvm_vcpu *vcpu, unsigned long cr4);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800586 void (*set_efer)(struct kvm_vcpu *vcpu, u64 efer);
Gleb Natapov89a27f42010-02-16 10:51:48 +0200587 void (*get_idt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
588 void (*set_idt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
589 void (*get_gdt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
590 void (*set_gdt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
Gleb Natapov020df072010-04-13 10:05:23 +0300591 void (*set_dr7)(struct kvm_vcpu *vcpu, unsigned long value);
Marcelo Tosatti5fdbf972008-06-27 14:58:02 -0300592 void (*cache_reg)(struct kvm_vcpu *vcpu, enum kvm_reg reg);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800593 unsigned long (*get_rflags)(struct kvm_vcpu *vcpu);
594 void (*set_rflags)(struct kvm_vcpu *vcpu, unsigned long rflags);
Avi Kivity6b52d182010-01-21 15:31:47 +0200595 void (*fpu_activate)(struct kvm_vcpu *vcpu);
Avi Kivity02daab22009-12-30 12:40:26 +0200596 void (*fpu_deactivate)(struct kvm_vcpu *vcpu);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800597
598 void (*tlb_flush)(struct kvm_vcpu *vcpu);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800599
Avi Kivity851ba692009-08-24 11:10:17 +0300600 void (*run)(struct kvm_vcpu *vcpu);
601 int (*handle_exit)(struct kvm_vcpu *vcpu);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800602 void (*skip_emulated_instruction)(struct kvm_vcpu *vcpu);
Glauber Costa2809f5d2009-05-12 16:21:05 -0400603 void (*set_interrupt_shadow)(struct kvm_vcpu *vcpu, int mask);
604 u32 (*get_interrupt_shadow)(struct kvm_vcpu *vcpu, int mask);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800605 void (*patch_hypercall)(struct kvm_vcpu *vcpu,
606 unsigned char *hypercall_addr);
Gleb Natapov66fd3f72009-05-11 13:35:50 +0300607 void (*set_irq)(struct kvm_vcpu *vcpu);
Gleb Natapov95ba8273132009-04-21 17:45:08 +0300608 void (*set_nmi)(struct kvm_vcpu *vcpu);
Avi Kivity298101d2007-11-25 13:41:11 +0200609 void (*queue_exception)(struct kvm_vcpu *vcpu, unsigned nr,
Joerg Roedelce7ddec2010-04-22 12:33:13 +0200610 bool has_error_code, u32 error_code,
611 bool reinject);
Avi Kivityb463a6f2010-07-20 15:06:17 +0300612 void (*cancel_injection)(struct kvm_vcpu *vcpu);
Gleb Natapov78646122009-03-23 12:12:11 +0200613 int (*interrupt_allowed)(struct kvm_vcpu *vcpu);
Gleb Natapov95ba8273132009-04-21 17:45:08 +0300614 int (*nmi_allowed)(struct kvm_vcpu *vcpu);
Jan Kiszka3cfc3092009-11-12 01:04:25 +0100615 bool (*get_nmi_mask)(struct kvm_vcpu *vcpu);
616 void (*set_nmi_mask)(struct kvm_vcpu *vcpu, bool masked);
Gleb Natapov95ba8273132009-04-21 17:45:08 +0300617 void (*enable_nmi_window)(struct kvm_vcpu *vcpu);
618 void (*enable_irq_window)(struct kvm_vcpu *vcpu);
619 void (*update_cr8_intercept)(struct kvm_vcpu *vcpu, int tpr, int irr);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800620 int (*set_tss_addr)(struct kvm *kvm, unsigned int addr);
Sheng Yang67253af2008-04-25 10:20:22 +0800621 int (*get_tdp_level)(void);
Sheng Yang4b12f0d2009-04-27 20:35:42 +0800622 u64 (*get_mt_mask)(struct kvm_vcpu *vcpu, gfn_t gfn, bool is_mmio);
Sheng Yang17cc3932010-01-05 19:02:27 +0800623 int (*get_lpage_level)(void);
Sheng Yang4e47c7a2009-12-18 16:48:47 +0800624 bool (*rdtscp_supported)(void);
Zachary Amsdene48672f2010-08-19 22:07:23 -1000625 void (*adjust_tsc_offset)(struct kvm_vcpu *vcpu, s64 adjustment);
Joerg Roedel344f4142009-07-27 16:30:48 +0200626
Joerg Roedel1c97f0a2010-09-10 17:30:41 +0200627 void (*set_tdp_cr3)(struct kvm_vcpu *vcpu, unsigned long cr3);
628
Joerg Roedeld4330ef2010-04-22 12:33:11 +0200629 void (*set_supported_cpuid)(u32 func, struct kvm_cpuid_entry2 *entry);
630
Sheng Yangf5f48ee2010-06-30 12:25:15 +0800631 bool (*has_wbinvd_exit)(void);
632
Joerg Roedel4051b182011-03-25 09:44:49 +0100633 void (*set_tsc_khz)(struct kvm_vcpu *vcpu, u32 user_tsc_khz);
Zachary Amsden99e3e302010-08-19 22:07:17 -1000634 void (*write_tsc_offset)(struct kvm_vcpu *vcpu, u64 offset);
635
Joerg Roedel857e4092011-03-25 09:44:50 +0100636 u64 (*compute_tsc_offset)(struct kvm_vcpu *vcpu, u64 target_tsc);
Nadav Har'Eld5c17852011-08-02 15:54:20 +0300637 u64 (*read_l1_tsc)(struct kvm_vcpu *vcpu);
Joerg Roedel857e4092011-03-25 09:44:50 +0100638
Avi Kivity586f9602010-11-18 13:09:54 +0200639 void (*get_exit_info)(struct kvm_vcpu *vcpu, u64 *info1, u64 *info2);
Joerg Roedel8a76d7f2011-04-04 12:39:27 +0200640
641 int (*check_intercept)(struct kvm_vcpu *vcpu,
642 struct x86_instruction_info *info,
643 enum x86_intercept_stage stage);
Zhang Xiantaoea4a5ff2007-11-19 14:40:47 +0800644};
645
/*
 * x86-specific data attached to an async page fault: a token, the faulting
 * gfn, a CR3 value and a direct_map flag.
 * NOTE(review): 'cr3' and 'direct_map' presumably snapshot the MMU state at
 * the time the fault was queued -- confirm against the async PF code.
 */
Gleb Natapovaf585b92010-10-14 11:22:46 +0200646struct kvm_arch_async_pf {
Gleb Natapov7c907052010-10-14 11:22:53 +0200647 u32 token;
Gleb Natapovaf585b92010-10-14 11:22:46 +0200648 gfn_t gfn;
Xiao Guangrongfb67e142010-12-07 10:35:25 +0800649 unsigned long cr3;
Xiao Guangrongc4806ac2010-11-12 14:49:55 +0800650 bool direct_map;
Gleb Natapovaf585b92010-10-14 11:22:46 +0200651};
652
/* Pointer to the active back-end callback table (see struct kvm_x86_ops). */
Zhang Xiantao97896d02007-11-14 20:09:30 +0800653extern struct kvm_x86_ops *kvm_x86_ops;
654
/* MMU module-level init/exit and per-vcpu MMU lifecycle. */
Zhang Xiantao54f15852007-11-19 15:24:28 +0800655int kvm_mmu_module_init(void);
656void kvm_mmu_module_exit(void);
657
658void kvm_mmu_destroy(struct kvm_vcpu *vcpu);
659int kvm_mmu_create(struct kvm_vcpu *vcpu);
660int kvm_mmu_setup(struct kvm_vcpu *vcpu);
Sheng Yang7b523452008-04-25 21:13:50 +0800661void kvm_mmu_set_mask_ptes(u64 user_mask, u64 accessed_mask,
Sheng Yang4b12f0d2009-04-27 20:35:42 +0800662 u64 dirty_mask, u64 nx_mask, u64 x_mask);
Zhang Xiantao54f15852007-11-19 15:24:28 +0800663
664int kvm_mmu_reset_context(struct kvm_vcpu *vcpu);
665void kvm_mmu_slot_remove_write_access(struct kvm *kvm, int slot);
666void kvm_mmu_zap_all(struct kvm *kvm);
Zhang Xiantao3ad82a72007-11-20 13:11:38 +0800667unsigned int kvm_mmu_calculate_mmu_pages(struct kvm *kvm);
Zhang Xiantao54f15852007-11-19 15:24:28 +0800668void kvm_mmu_change_mmu_pages(struct kvm *kvm, unsigned int kvm_nr_mmu_pages);
669
Joerg Roedelff03a072010-09-10 17:30:57 +0200670int load_pdptrs(struct kvm_vcpu *vcpu, struct kvm_mmu *mmu, unsigned long cr3);
Joerg Roedelcc4b6872008-02-07 13:47:43 +0100671
Marcelo Tosatti3200f402008-03-29 20:17:59 -0300672int emulator_write_phys(struct kvm_vcpu *vcpu, gpa_t gpa,
Avi Kivity9f811282008-03-02 14:06:05 +0200673 const void *val, int bytes);
Marcelo Tosatti2f333bc2008-02-22 12:21:37 -0500674int kvm_pv_mmu_op(struct kvm_vcpu *vcpu, unsigned long bytes,
675 gpa_t addr, unsigned long *ret);
Sheng Yang4b12f0d2009-04-27 20:35:42 +0800676u8 kvm_get_guest_memory_type(struct kvm_vcpu *vcpu, gfn_t gfn);
Marcelo Tosatti2f333bc2008-02-22 12:21:37 -0500677
678extern bool tdp_enabled;
Avi Kivity9f811282008-03-02 14:06:05 +0200679
Liu, Jinsonga3e06bb2011-09-22 16:55:52 +0800680u64 vcpu_tsc_khz(struct kvm_vcpu *vcpu);
681
Joerg Roedel92a1f122011-03-25 09:44:51 +0100682/* control of guest tsc rate supported? */
683extern bool kvm_has_tsc_control;
684/* minimum supported tsc_khz for guests */
685extern u32 kvm_min_guest_tsc_khz;
686/* maximum supported tsc_khz for guests */
687extern u32 kvm_max_guest_tsc_khz;
688
/*
 * Outcome codes of instruction emulation.  The numeric values are spelled
 * out explicitly; they are the same ones the compiler assigns implicitly.
 */
enum emulation_result {
	EMULATE_DONE	= 0,	/* no further processing */
	EMULATE_DO_MMIO	= 1,	/* kvm_run filled with mmio request */
	EMULATE_FAIL	= 2,	/* can't emulate this instruction */
};
694
/*
 * Emulation-type flags.  Each one occupies a distinct bit (bits 0..3), so
 * they can be OR-ed together.
 * NOTE(review): presumably these are the values passed as the
 * 'emulation_type' argument of x86_emulate_instruction() /
 * emulate_instruction() -- confirm against the callers.
 */
Sheng Yang571008d2008-01-02 14:49:22 +0800695#define EMULTYPE_NO_DECODE (1 << 0)
696#define EMULTYPE_TRAP_UD (1 << 1)
Gleb Natapovba8afb62009-04-12 13:36:57 +0300697#define EMULTYPE_SKIP (1 << 2)
Xiao Guangrong1cb3f3a2011-09-22 17:02:48 +0800698#define EMULTYPE_RETRY (1 << 3)
Andre Przywaradc25e892010-12-21 11:12:07 +0100699int x86_emulate_instruction(struct kvm_vcpu *vcpu, unsigned long cr2,
700 int emulation_type, void *insn, int insn_len);
Andre Przywara51d8b662010-12-21 11:12:02 +0100701
702static inline int emulate_instruction(struct kvm_vcpu *vcpu,
703 int emulation_type)
704{
Andre Przywaradc25e892010-12-21 11:12:07 +0100705 return x86_emulate_instruction(vcpu, 0, emulation_type, NULL, 0);
Andre Przywara51d8b662010-12-21 11:12:02 +0100706}
707
Joerg Roedelf2b4b7d2008-01-31 14:57:37 +0100708void kvm_enable_efer_bits(u64);
Zhang Xiantao54f15852007-11-19 15:24:28 +0800709int kvm_get_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 *data);
710int kvm_set_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 data);
711
712struct x86_emulate_ctxt;
713
Gleb Natapovcf8f70b2010-03-18 15:20:23 +0200714int kvm_fast_pio_out(struct kvm_vcpu *vcpu, int size, unsigned short port);
Zhang Xiantao54f15852007-11-19 15:24:28 +0800715void kvm_emulate_cpuid(struct kvm_vcpu *vcpu);
716int kvm_emulate_halt(struct kvm_vcpu *vcpu);
Sheng Yangf5f48ee2010-06-30 12:25:15 +0800717int kvm_emulate_wbinvd(struct kvm_vcpu *vcpu);
Zhang Xiantao54f15852007-11-19 15:24:28 +0800718
Guillaume Thouvenin3e6e0aa2008-05-27 10:18:46 +0200719void kvm_get_segment(struct kvm_vcpu *vcpu, struct kvm_segment *var, int seg);
Gleb Natapovc6975182010-02-18 12:15:01 +0200720int kvm_load_segment_descriptor(struct kvm_vcpu *vcpu, u16 selector, int seg);
Guillaume Thouvenin3e6e0aa2008-05-27 10:18:46 +0200721
Jan Kiszkae269fb22010-04-14 15:51:09 +0200722int kvm_task_switch(struct kvm_vcpu *vcpu, u16 tss_selector, int reason,
723 bool has_error_code, u32 error_code);
Izik Eidus37817f22008-03-24 23:14:53 +0200724
Avi Kivity49a9b072010-06-10 17:02:14 +0300725int kvm_set_cr0(struct kvm_vcpu *vcpu, unsigned long cr0);
Avi Kivity23902182010-06-10 17:02:16 +0300726int kvm_set_cr3(struct kvm_vcpu *vcpu, unsigned long cr3);
Avi Kivitya83b29c2010-06-10 17:02:15 +0300727int kvm_set_cr4(struct kvm_vcpu *vcpu, unsigned long cr4);
Andre Przywaraeea1cff2010-12-21 11:12:00 +0100728int kvm_set_cr8(struct kvm_vcpu *vcpu, unsigned long cr8);
Gleb Natapov020df072010-04-13 10:05:23 +0300729int kvm_set_dr(struct kvm_vcpu *vcpu, int dr, unsigned long val);
730int kvm_get_dr(struct kvm_vcpu *vcpu, int dr, unsigned long *val);
Avi Kivity2d3ad1f2008-02-24 11:20:43 +0200731unsigned long kvm_get_cr8(struct kvm_vcpu *vcpu);
732void kvm_lmsw(struct kvm_vcpu *vcpu, unsigned long msw);
Zhang Xiantao54f15852007-11-19 15:24:28 +0800733void kvm_get_cs_db_l_bits(struct kvm_vcpu *vcpu, int *db, int *l);
Dexuan Cui2acf9232010-06-10 11:27:12 +0800734int kvm_set_xcr(struct kvm_vcpu *vcpu, u32 index, u64 xcr);
Zhang Xiantao54f15852007-11-19 15:24:28 +0800735
736int kvm_get_msr_common(struct kvm_vcpu *vcpu, u32 msr, u64 *pdata);
737int kvm_set_msr_common(struct kvm_vcpu *vcpu, u32 msr, u64 data);
738
Jan Kiszka91586a32009-10-05 13:07:21 +0200739unsigned long kvm_get_rflags(struct kvm_vcpu *vcpu);
740void kvm_set_rflags(struct kvm_vcpu *vcpu, unsigned long rflags);
741
Avi Kivity298101d2007-11-25 13:41:11 +0200742void kvm_queue_exception(struct kvm_vcpu *vcpu, unsigned nr);
743void kvm_queue_exception_e(struct kvm_vcpu *vcpu, unsigned nr, u32 error_code);
Joerg Roedelce7ddec2010-04-22 12:33:13 +0200744void kvm_requeue_exception(struct kvm_vcpu *vcpu, unsigned nr);
745void kvm_requeue_exception_e(struct kvm_vcpu *vcpu, unsigned nr, u32 error_code);
Avi Kivity6389ee92010-11-29 16:12:30 +0200746void kvm_inject_page_fault(struct kvm_vcpu *vcpu, struct x86_exception *fault);
Joerg Roedelec92fe42010-09-10 17:30:51 +0200747int kvm_read_guest_page_mmu(struct kvm_vcpu *vcpu, struct kvm_mmu *mmu,
748 gfn_t gfn, void *data, int offset, int len,
749 u32 access);
Avi Kivity6389ee92010-11-29 16:12:30 +0200750void kvm_propagate_fault(struct kvm_vcpu *vcpu, struct x86_exception *fault);
Avi Kivity0a79b002009-09-01 12:03:25 +0300751bool kvm_require_cpl(struct kvm_vcpu *vcpu, int required_cpl);
Avi Kivity298101d2007-11-25 13:41:11 +0200752
Gleb Natapov49256632009-02-04 17:28:14 +0200753int kvm_pic_set_irq(void *opaque, int irq, int level);
Xiantao Zhang3de42dc2008-10-06 13:48:45 +0800754
Sheng Yang3419ffc2008-05-15 09:52:48 +0800755void kvm_inject_nmi(struct kvm_vcpu *vcpu);
756
Jan Kiszka10ab25c2010-05-25 16:01:50 +0200757int fx_init(struct kvm_vcpu *vcpu);
Zhang Xiantao54f15852007-11-19 15:24:28 +0800758
Avi Kivityd835dfe2007-11-21 02:57:59 +0200759void kvm_mmu_flush_tlb(struct kvm_vcpu *vcpu);
Zhang Xiantao54f15852007-11-19 15:24:28 +0800760void kvm_mmu_pte_write(struct kvm_vcpu *vcpu, gpa_t gpa,
Marcelo Tosattiad218f82008-12-01 22:32:05 -0200761 const u8 *new, int bytes,
762 bool guest_initiated);
Xiao Guangrong1cb3f3a2011-09-22 17:02:48 +0800763int kvm_mmu_unprotect_page(struct kvm *kvm, gfn_t gfn);
Zhang Xiantao54f15852007-11-19 15:24:28 +0800764int kvm_mmu_unprotect_page_virt(struct kvm_vcpu *vcpu, gva_t gva);
765void __kvm_mmu_free_some_pages(struct kvm_vcpu *vcpu);
766int kvm_mmu_load(struct kvm_vcpu *vcpu);
767void kvm_mmu_unload(struct kvm_vcpu *vcpu);
Marcelo Tosatti0ba73cd2008-09-23 13:18:34 -0300768void kvm_mmu_sync_roots(struct kvm_vcpu *vcpu);
Avi Kivityab9ae312010-11-22 17:53:26 +0200769gpa_t kvm_mmu_gva_to_gpa_read(struct kvm_vcpu *vcpu, gva_t gva,
770 struct x86_exception *exception);
771gpa_t kvm_mmu_gva_to_gpa_fetch(struct kvm_vcpu *vcpu, gva_t gva,
772 struct x86_exception *exception);
773gpa_t kvm_mmu_gva_to_gpa_write(struct kvm_vcpu *vcpu, gva_t gva,
774 struct x86_exception *exception);
775gpa_t kvm_mmu_gva_to_gpa_system(struct kvm_vcpu *vcpu, gva_t gva,
776 struct x86_exception *exception);
Zhang Xiantao54f15852007-11-19 15:24:28 +0800777
778int kvm_emulate_hypercall(struct kvm_vcpu *vcpu);
779
Andre Przywaradc25e892010-12-21 11:12:07 +0100780int kvm_mmu_page_fault(struct kvm_vcpu *vcpu, gva_t gva, u32 error_code,
781 void *insn, int insn_len);
Marcelo Tosattia7052892008-09-23 13:18:35 -0300782void kvm_mmu_invlpg(struct kvm_vcpu *vcpu, gva_t gva);
Zhang Xiantao34c16ee2007-10-20 15:34:38 +0800783
Joerg Roedel18552672008-02-07 13:47:41 +0100784void kvm_enable_tdp(void);
Joerg Roedel5f4cb662008-07-14 20:36:36 +0200785void kvm_disable_tdp(void);
Joerg Roedel18552672008-02-07 13:47:41 +0100786
Carsten Ottede7d7892007-10-30 18:44:25 +0100787int complete_pio(struct kvm_vcpu *vcpu);
Gleb Natapovf850e2e2010-02-10 14:21:33 +0200788bool kvm_check_iopl(struct kvm_vcpu *vcpu);
Zhang Xiantaoec6d2732007-11-19 15:08:31 +0800789
790static inline struct kvm_mmu_page *page_header(hpa_t shadow_page)
791{
792 struct page *page = pfn_to_page(shadow_page >> PAGE_SHIFT);
793
794 return (struct kvm_mmu_page *)page_private(page);
795}
796
Avi Kivityd6e88ae2008-07-10 16:53:33 +0300797static inline u16 kvm_read_ldt(void)
Zhang Xiantaoec6d2732007-11-19 15:08:31 +0800798{
799 u16 ldt;
800 asm("sldt %0" : "=g"(ldt));
801 return ldt;
802}
803
Avi Kivityd6e88ae2008-07-10 16:53:33 +0300804static inline void kvm_load_ldt(u16 sel)
Zhang Xiantaoec6d2732007-11-19 15:08:31 +0800805{
806 asm("lldt %0" : : "rm"(sel));
807}
Zhang Xiantaoec6d2732007-11-19 15:08:31 +0800808
Zhang Xiantaoec6d2732007-11-19 15:08:31 +0800809#ifdef CONFIG_X86_64
810static inline unsigned long read_msr(unsigned long msr)
811{
812 u64 value;
813
814 rdmsrl(msr, value);
815 return value;
816}
817#endif
818
Zhang Xiantaoec6d2732007-11-19 15:08:31 +0800819static inline u32 get_rdx_init_val(void)
820{
821 return 0x600; /* P6 family */
822}
823
Avi Kivityc1a5d4f2007-11-25 14:12:03 +0200824static inline void kvm_inject_gp(struct kvm_vcpu *vcpu, u32 error_code)
825{
826 kvm_queue_exception_e(vcpu, GP_VECTOR, error_code);
827}
828
/*
 * TSS layout constants, in bytes.
 *
 *   TSS_IOPB_SIZE        65536 / 8 = 8192: one bit for each of 65536 entries
 *   TSS_REDIRECTION_SIZE 256 / 8   = 32:   one bit for each of 256 entries
 *   RMODE_TSS_SIZE       base + redirection bitmap + I/O bitmap + 1 extra byte
 *
 * NOTE(review): the "+ 1" is presumably the terminator byte that follows the
 * I/O permission bitmap, and the bitmaps presumably cover I/O ports and
 * interrupt vectors respectively -- confirm against the code that builds the
 * real-mode TSS.
 */
Zhang Xiantaoec6d2732007-11-19 15:08:31 +0800829#define TSS_IOPB_BASE_OFFSET 0x66
830#define TSS_BASE_SIZE 0x68
831#define TSS_IOPB_SIZE (65536 / 8)
832#define TSS_REDIRECTION_SIZE (256 / 8)
Joe Perches7d76b4d2008-03-23 01:02:34 -0700833#define RMODE_TSS_SIZE \
834 (TSS_BASE_SIZE + TSS_REDIRECTION_SIZE + TSS_IOPB_SIZE + 1)
Hollis Blanchard53e0aa72007-12-03 16:15:26 -0600835
/*
 * Task-switch cause codes, numbered 0..3.
 * NOTE(review): presumably the values accepted by the 'reason' parameter of
 * kvm_task_switch() -- confirm against its callers.
 */
Izik Eidus37817f22008-03-24 23:14:53 +0200836enum {
837 TASK_SWITCH_CALL = 0,
838 TASK_SWITCH_IRET = 1,
839 TASK_SWITCH_JMP = 2,
840 TASK_SWITCH_GATE = 3,
841};
842
/*
 * HF_* flag masks: one distinct bit each (bits 0..5), so they can be
 * combined and tested with bitwise operators.
 * NOTE(review): the word these bits live in is not visible in this chunk
 * (presumably a per-vcpu flags field) -- confirm before relying on it.
 */
Alexander Graf1371d902008-11-25 20:17:04 +0100843#define HF_GIF_MASK (1 << 0)
Alexander Graf3d6368e2008-11-25 20:17:07 +0100844#define HF_HIF_MASK (1 << 1)
845#define HF_VINTR_MASK (1 << 2)
Gleb Natapov95ba8273132009-04-21 17:45:08 +0300846#define HF_NMI_MASK (1 << 3)
Gleb Natapov44c11432009-05-11 13:35:52 +0300847#define HF_IRET_MASK (1 << 4)
Joerg Roedelec9e60b2010-11-29 17:51:47 +0100848#define HF_GUEST_MASK (1 << 5) /* VCPU is in guest-mode */
Alexander Graf1371d902008-11-25 20:17:04 +0100849
Avi Kivity4ecac3f2008-05-13 13:23:38 +0300850/*
851 * Hardware virtualization extension instructions may fault if a
852 * reboot turns off virtualization while processes are running.
853 * Trap the fault and ignore the instruction if that happens.
854 */
Avi Kivityb7c41452010-12-02 17:52:50 +0200855asmlinkage void kvm_spurious_fault(void);
856extern bool kvm_rebooting;
Avi Kivity4ecac3f2008-05-13 13:23:38 +0300857
/*
 * ____kvm_handle_fault_on_reboot(insn, cleanup_insn)
 *
 * Expands to an inline-asm string that wraps @insn with a fault handler.
 * Both arguments must be string literals, because they are pasted into the
 * asm text.
 *
 *   666:  @insn itself
 *   668:  first location after @insn (the resume point)
 *   667:  fixup code, placed in the .fixup section:
 *           - run @cleanup_insn
 *           - compare the byte variable kvm_rebooting with 0
 *           - if it is non-zero, jump back to 668, i.e. continue after @insn
 *           - otherwise push the address of label 666 and call
 *             kvm_spurious_fault()
 *
 * The __ex_table entry pairs label 666 with label 667, so a fault raised
 * by @insn is redirected to the fixup code.
 *
 * The numeric labels 666/667/668 are used with b (backward) references,
 * so the macro can be expanded more than once in a translation unit.
 *
 * __kvm_handle_fault_on_reboot(insn) is the same wrapper with an empty
 * cleanup instruction.
 */
Avi Kivity5e520e62011-05-15 10:13:12 -0400858#define ____kvm_handle_fault_on_reboot(insn, cleanup_insn) \
Avi Kivity4ecac3f2008-05-13 13:23:38 +0300859 "666: " insn "\n\t" \
Avi Kivityb7c41452010-12-02 17:52:50 +0200860 "668: \n\t" \
Eduardo Habkost18b13e52008-08-19 20:00:08 -0300861 ".pushsection .fixup, \"ax\" \n" \
Avi Kivity4ecac3f2008-05-13 13:23:38 +0300862 "667: \n\t" \
Avi Kivity5e520e62011-05-15 10:13:12 -0400863 cleanup_insn "\n\t" \
Avi Kivityb7c41452010-12-02 17:52:50 +0200864 "cmpb $0, kvm_rebooting \n\t" \
865 "jne 668b \n\t" \
Avi Kivity8ceed3472008-08-14 21:25:47 +0300866 __ASM_SIZE(push) " $666b \n\t" \
Avi Kivityb7c41452010-12-02 17:52:50 +0200867 "call kvm_spurious_fault \n\t" \
Avi Kivity4ecac3f2008-05-13 13:23:38 +0300868 ".popsection \n\t" \
869 ".pushsection __ex_table, \"a\" \n\t" \
Avi Kivity8ceed3472008-08-14 21:25:47 +0300870 _ASM_PTR " 666b, 667b \n\t" \
Avi Kivity4ecac3f2008-05-13 13:23:38 +0300871 ".popsection"
872
Avi Kivity5e520e62011-05-15 10:13:12 -0400873#define __kvm_handle_fault_on_reboot(insn) \
874 ____kvm_handle_fault_on_reboot(insn, "")
875
Andrea Arcangelie930bff2008-07-25 16:24:52 +0200876#define KVM_ARCH_WANT_MMU_NOTIFIER
877int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
878int kvm_age_hva(struct kvm *kvm, unsigned long hva);
Andrea Arcangeli8ee53822011-01-13 15:47:10 -0800879int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
Izik Eidus3da0dd42009-09-23 21:47:18 +0300880void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);
Dong, Eddie82725b22009-03-30 16:21:08 +0800881int cpuid_maxphyaddr(struct kvm_vcpu *vcpu);
Gleb Natapova1b37102009-07-09 15:33:52 +0300882int kvm_cpu_has_interrupt(struct kvm_vcpu *vcpu);
883int kvm_arch_interrupt_allowed(struct kvm_vcpu *vcpu);
Gleb Natapov0b717852009-07-09 15:33:53 +0300884int kvm_cpu_get_interrupt(struct kvm_vcpu *v);
Andrea Arcangelie930bff2008-07-25 16:24:52 +0200885
Avi Kivity18863bd2009-09-07 11:12:18 +0300886void kvm_define_shared_msr(unsigned index, u32 msr);
Avi Kivityd5696722009-12-02 12:28:47 +0200887void kvm_set_shared_msr(unsigned index, u64 val, u64 mask);
Avi Kivity18863bd2009-09-07 11:12:18 +0300888
Jan Kiszkaf92653e2010-02-23 17:47:55 +0100889bool kvm_is_linear_rip(struct kvm_vcpu *vcpu, unsigned long linear_rip);
890
Gleb Natapovaf585b92010-10-14 11:22:46 +0200891void kvm_arch_async_page_not_present(struct kvm_vcpu *vcpu,
892 struct kvm_async_pf *work);
893void kvm_arch_async_page_present(struct kvm_vcpu *vcpu,
894 struct kvm_async_pf *work);
Gleb Natapov56028d02010-10-17 18:13:42 +0200895void kvm_arch_async_page_ready(struct kvm_vcpu *vcpu,
896 struct kvm_async_pf *work);
Gleb Natapov7c907052010-10-14 11:22:53 +0200897bool kvm_arch_can_inject_async_page_present(struct kvm_vcpu *vcpu);
Gleb Natapovaf585b92010-10-14 11:22:46 +0200898extern bool kvm_find_async_pf_gfn(struct kvm_vcpu *vcpu, gfn_t gfn);
899
Andre Przywaradb8fcef2010-12-21 11:12:01 +0100900void kvm_complete_insn_gp(struct kvm_vcpu *vcpu, int err);
901
H. Peter Anvin1965aae2008-10-22 22:26:29 -0700902#endif /* _ASM_X86_KVM_HOST_H */