aboutsummaryrefslogtreecommitdiffstats
path: root/include
diff options
context:
space:
mode:
author Avi Kivity <avi@qumranet.com> 2007-12-16 04:02:48 -0500
committer Avi Kivity <avi@qumranet.com> 2008-01-30 11:01:18 -0500
commit edf884172e9828c6234b254208af04655855038d (patch)
tree f5e5d1eecaed9737eced6ba60d09fe93149751c1 /include
parent 9584bf2c93f56656dba0de8f6c75b54ca7995143 (diff)
KVM: Move arch dependent files to new directory arch/x86/kvm/
This paves the way for multiple architecture support. Note that while ioapic.c could potentially be shared with ia64, it is also moved. Signed-off-by: Avi Kivity <avi@qumranet.com>
Diffstat (limited to 'include')
-rw-r--r-- include/asm-x86/kvm_host.h 601
-rw-r--r-- include/asm-x86/kvm_x86_emulate.h 186
-rw-r--r-- include/linux/kvm_host.h 289
-rw-r--r-- include/linux/kvm_types.h 54
4 files changed, 1130 insertions, 0 deletions
diff --git a/include/asm-x86/kvm_host.h b/include/asm-x86/kvm_host.h
new file mode 100644
index 000000000000..28940e1a9713
--- /dev/null
+++ b/include/asm-x86/kvm_host.h
@@ -0,0 +1,601 @@
1/*
2 * Kernel-based Virtual Machine driver for Linux
3 *
4 * This header defines architecture specific interfaces, x86 version
5 *
6 * This work is licensed under the terms of the GNU GPL, version 2. See
7 * the COPYING file in the top-level directory.
8 *
9 */
10
11#ifndef ASM_KVM_HOST_H
12#define ASM_KVM_HOST_H
13
14#include <linux/types.h>
15#include <linux/mm.h>
16
17#include <linux/kvm.h>
18#include <linux/kvm_para.h>
19#include <linux/kvm_types.h>
20
21#include <asm/desc.h>
22
23#define CR3_PAE_RESERVED_BITS ((X86_CR3_PWT | X86_CR3_PCD) - 1)
24#define CR3_NONPAE_RESERVED_BITS ((PAGE_SIZE-1) & ~(X86_CR3_PWT | X86_CR3_PCD))
25#define CR3_L_MODE_RESERVED_BITS (CR3_NONPAE_RESERVED_BITS|0xFFFFFF0000000000ULL)
26
27#define KVM_GUEST_CR0_MASK \
28 (X86_CR0_PG | X86_CR0_PE | X86_CR0_WP | X86_CR0_NE \
29 | X86_CR0_NW | X86_CR0_CD)
30#define KVM_VM_CR0_ALWAYS_ON \
31 (X86_CR0_PG | X86_CR0_PE | X86_CR0_WP | X86_CR0_NE | X86_CR0_TS \
32 | X86_CR0_MP)
33#define KVM_GUEST_CR4_MASK \
34 (X86_CR4_VME | X86_CR4_PSE | X86_CR4_PAE | X86_CR4_PGE | X86_CR4_VMXE)
35#define KVM_PMODE_VM_CR4_ALWAYS_ON (X86_CR4_PAE | X86_CR4_VMXE)
36#define KVM_RMODE_VM_CR4_ALWAYS_ON (X86_CR4_VME | X86_CR4_PAE | X86_CR4_VMXE)
37
38#define INVALID_PAGE (~(hpa_t)0)
39#define UNMAPPED_GVA (~(gpa_t)0)
40
41#define DE_VECTOR 0
42#define UD_VECTOR 6
43#define NM_VECTOR 7
44#define DF_VECTOR 8
45#define TS_VECTOR 10
46#define NP_VECTOR 11
47#define SS_VECTOR 12
48#define GP_VECTOR 13
49#define PF_VECTOR 14
50
51#define SELECTOR_TI_MASK (1 << 2)
52#define SELECTOR_RPL_MASK 0x03
53
54#define IOPL_SHIFT 12
55
56#define KVM_ALIAS_SLOTS 4
57
58#define KVM_PERMILLE_MMU_PAGES 20
59#define KVM_MIN_ALLOC_MMU_PAGES 64
60#define KVM_NUM_MMU_PAGES 1024
61#define KVM_MIN_FREE_MMU_PAGES 5
62#define KVM_REFILL_PAGES 25
63#define KVM_MAX_CPUID_ENTRIES 40
64
65extern spinlock_t kvm_lock;
66extern struct list_head vm_list;
67
68struct kvm_vcpu;
69struct kvm;
70
71enum {
72 VCPU_REGS_RAX = 0,
73 VCPU_REGS_RCX = 1,
74 VCPU_REGS_RDX = 2,
75 VCPU_REGS_RBX = 3,
76 VCPU_REGS_RSP = 4,
77 VCPU_REGS_RBP = 5,
78 VCPU_REGS_RSI = 6,
79 VCPU_REGS_RDI = 7,
80#ifdef CONFIG_X86_64
81 VCPU_REGS_R8 = 8,
82 VCPU_REGS_R9 = 9,
83 VCPU_REGS_R10 = 10,
84 VCPU_REGS_R11 = 11,
85 VCPU_REGS_R12 = 12,
86 VCPU_REGS_R13 = 13,
87 VCPU_REGS_R14 = 14,
88 VCPU_REGS_R15 = 15,
89#endif
90 NR_VCPU_REGS
91};
92
93enum {
94 VCPU_SREG_CS,
95 VCPU_SREG_DS,
96 VCPU_SREG_ES,
97 VCPU_SREG_FS,
98 VCPU_SREG_GS,
99 VCPU_SREG_SS,
100 VCPU_SREG_TR,
101 VCPU_SREG_LDTR,
102};
103
104#include <asm/kvm_x86_emulate.h>
105
106#define KVM_NR_MEM_OBJS 40
107
108/*
109 * We don't want allocation failures within the mmu code, so we preallocate
110 * enough memory for a single page fault in a cache.
111 */
112struct kvm_mmu_memory_cache {
113 int nobjs;
114 void *objects[KVM_NR_MEM_OBJS];
115};
116
117#define NR_PTE_CHAIN_ENTRIES 5
118
119struct kvm_pte_chain {
120 u64 *parent_ptes[NR_PTE_CHAIN_ENTRIES];
121 struct hlist_node link;
122};
123
124/*
125 * kvm_mmu_page_role, below, is defined as:
126 *
127 * bits 0:3 - total guest paging levels (2-4, or zero for real mode)
128 * bits 4:7 - page table level for this shadow (1-4)
129 * bits 8:9 - page table quadrant for 2-level guests
130 * bit 16 - "metaphysical" - gfn is not a real page (huge page/real mode)
131 * bits 17:19 - common access permissions for all ptes in this shadow page
132 */
133union kvm_mmu_page_role {
134 unsigned word;
135 struct {
136 unsigned glevels : 4;
137 unsigned level : 4;
138 unsigned quadrant : 2;
139 unsigned pad_for_nice_hex_output : 6;
140 unsigned metaphysical : 1;
141 unsigned access : 3;
142 };
143};
144
145struct kvm_mmu_page {
146 struct list_head link;
147 struct hlist_node hash_link;
148
149 /*
150 * The following two entries are used to key the shadow page in the
151 * hash table.
152 */
153 gfn_t gfn;
154 union kvm_mmu_page_role role;
155
156 u64 *spt;
157 /* hold the gfn of each spte inside spt */
158 gfn_t *gfns;
159 unsigned long slot_bitmap; /* One bit set per slot which has memory
160 * in this shadow page.
161 */
162 int multimapped; /* More than one parent_pte? */
163 int root_count; /* Currently serving as active root */
164 union {
165 u64 *parent_pte; /* !multimapped */
166 struct hlist_head parent_ptes; /* multimapped, kvm_pte_chain */
167 };
168};
169
170/*
171 * x86 supports 3 paging modes (4-level 64-bit, 3-level 64-bit, and 2-level
172 * 32-bit). The kvm_mmu structure abstracts the details of the current mmu
173 * mode.
174 */
175struct kvm_mmu {
176 void (*new_cr3)(struct kvm_vcpu *vcpu);
177 int (*page_fault)(struct kvm_vcpu *vcpu, gva_t gva, u32 err);
178 void (*free)(struct kvm_vcpu *vcpu);
179 gpa_t (*gva_to_gpa)(struct kvm_vcpu *vcpu, gva_t gva);
180 void (*prefetch_page)(struct kvm_vcpu *vcpu,
181 struct kvm_mmu_page *page);
182 hpa_t root_hpa;
183 int root_level;
184 int shadow_root_level;
185
186 u64 *pae_root;
187};
188
189struct kvm_vcpu_arch {
190 u64 host_tsc;
191 int interrupt_window_open;
192 unsigned long irq_summary; /* bit vector: 1 per word in irq_pending */
193 DECLARE_BITMAP(irq_pending, KVM_NR_INTERRUPTS);
194 unsigned long regs[NR_VCPU_REGS]; /* for rsp: vcpu_load_rsp_rip() */
195 unsigned long rip; /* needs vcpu_load_rsp_rip() */
196
197 unsigned long cr0;
198 unsigned long cr2;
199 unsigned long cr3;
200 unsigned long cr4;
201 unsigned long cr8;
202 u64 pdptrs[4]; /* pae */
203 u64 shadow_efer;
204 u64 apic_base;
205 struct kvm_lapic *apic; /* kernel irqchip context */
206#define VCPU_MP_STATE_RUNNABLE 0
207#define VCPU_MP_STATE_UNINITIALIZED 1
208#define VCPU_MP_STATE_INIT_RECEIVED 2
209#define VCPU_MP_STATE_SIPI_RECEIVED 3
210#define VCPU_MP_STATE_HALTED 4
211 int mp_state;
212 int sipi_vector;
213 u64 ia32_misc_enable_msr;
214
215 struct kvm_mmu mmu;
216
217 struct kvm_mmu_memory_cache mmu_pte_chain_cache;
218 struct kvm_mmu_memory_cache mmu_rmap_desc_cache;
219 struct kvm_mmu_memory_cache mmu_page_cache;
220 struct kvm_mmu_memory_cache mmu_page_header_cache;
221
222 gfn_t last_pt_write_gfn;
223 int last_pt_write_count;
224 u64 *last_pte_updated;
225
226 struct i387_fxsave_struct host_fx_image;
227 struct i387_fxsave_struct guest_fx_image;
228
229 gva_t mmio_fault_cr2;
230 struct kvm_pio_request pio;
231 void *pio_data;
232
233 struct kvm_queued_exception {
234 bool pending;
235 bool has_error_code;
236 u8 nr;
237 u32 error_code;
238 } exception;
239
240 struct {
241 int active;
242 u8 save_iopl;
243 struct kvm_save_segment {
244 u16 selector;
245 unsigned long base;
246 u32 limit;
247 u32 ar;
248 } tr, es, ds, fs, gs;
249 } rmode;
250 int halt_request; /* real mode on Intel only */
251
252 int cpuid_nent;
253 struct kvm_cpuid_entry2 cpuid_entries[KVM_MAX_CPUID_ENTRIES];
254 /* emulate context */
255
256 struct x86_emulate_ctxt emulate_ctxt;
257};
258
259struct kvm_mem_alias {
260 gfn_t base_gfn;
261 unsigned long npages;
262 gfn_t target_gfn;
263};
264
265struct kvm_arch{
266 int naliases;
267 struct kvm_mem_alias aliases[KVM_ALIAS_SLOTS];
268
269 unsigned int n_free_mmu_pages;
270 unsigned int n_requested_mmu_pages;
271 unsigned int n_alloc_mmu_pages;
272 struct hlist_head mmu_page_hash[KVM_NUM_MMU_PAGES];
273 /*
274 * mmu_page_hash (above) is a hash table of struct kvm_mmu_page.
275 */
276 struct list_head active_mmu_pages;
277 struct kvm_pic *vpic;
278 struct kvm_ioapic *vioapic;
279
280 int round_robin_prev_vcpu;
281 unsigned int tss_addr;
282 struct page *apic_access_page;
283};
284
285struct kvm_vm_stat {
286 u32 mmu_shadow_zapped;
287 u32 mmu_pte_write;
288 u32 mmu_pte_updated;
289 u32 mmu_pde_zapped;
290 u32 mmu_flooded;
291 u32 mmu_recycled;
292 u32 remote_tlb_flush;
293};
294
295struct kvm_vcpu_stat {
296 u32 pf_fixed;
297 u32 pf_guest;
298 u32 tlb_flush;
299 u32 invlpg;
300
301 u32 exits;
302 u32 io_exits;
303 u32 mmio_exits;
304 u32 signal_exits;
305 u32 irq_window_exits;
306 u32 halt_exits;
307 u32 halt_wakeup;
308 u32 request_irq_exits;
309 u32 irq_exits;
310 u32 host_state_reload;
311 u32 efer_reload;
312 u32 fpu_reload;
313 u32 insn_emulation;
314 u32 insn_emulation_fail;
315};
316
317struct descriptor_table {
318 u16 limit;
319 unsigned long base;
320} __attribute__((packed));
321
322struct kvm_x86_ops {
323 int (*cpu_has_kvm_support)(void); /* __init */
324 int (*disabled_by_bios)(void); /* __init */
325 void (*hardware_enable)(void *dummy); /* __init */
326 void (*hardware_disable)(void *dummy);
327 void (*check_processor_compatibility)(void *rtn);
328 int (*hardware_setup)(void); /* __init */
329 void (*hardware_unsetup)(void); /* __exit */
330
331 /* Create, but do not attach this VCPU */
332 struct kvm_vcpu *(*vcpu_create)(struct kvm *kvm, unsigned id);
333 void (*vcpu_free)(struct kvm_vcpu *vcpu);
334 int (*vcpu_reset)(struct kvm_vcpu *vcpu);
335
336 void (*prepare_guest_switch)(struct kvm_vcpu *vcpu);
337 void (*vcpu_load)(struct kvm_vcpu *vcpu, int cpu);
338 void (*vcpu_put)(struct kvm_vcpu *vcpu);
339 void (*vcpu_decache)(struct kvm_vcpu *vcpu);
340
341 int (*set_guest_debug)(struct kvm_vcpu *vcpu,
342 struct kvm_debug_guest *dbg);
343 void (*guest_debug_pre)(struct kvm_vcpu *vcpu);
344 int (*get_msr)(struct kvm_vcpu *vcpu, u32 msr_index, u64 *pdata);
345 int (*set_msr)(struct kvm_vcpu *vcpu, u32 msr_index, u64 data);
346 u64 (*get_segment_base)(struct kvm_vcpu *vcpu, int seg);
347 void (*get_segment)(struct kvm_vcpu *vcpu,
348 struct kvm_segment *var, int seg);
349 void (*set_segment)(struct kvm_vcpu *vcpu,
350 struct kvm_segment *var, int seg);
351 void (*get_cs_db_l_bits)(struct kvm_vcpu *vcpu, int *db, int *l);
352 void (*decache_cr4_guest_bits)(struct kvm_vcpu *vcpu);
353 void (*set_cr0)(struct kvm_vcpu *vcpu, unsigned long cr0);
354 void (*set_cr3)(struct kvm_vcpu *vcpu, unsigned long cr3);
355 void (*set_cr4)(struct kvm_vcpu *vcpu, unsigned long cr4);
356 void (*set_efer)(struct kvm_vcpu *vcpu, u64 efer);
357 void (*get_idt)(struct kvm_vcpu *vcpu, struct descriptor_table *dt);
358 void (*set_idt)(struct kvm_vcpu *vcpu, struct descriptor_table *dt);
359 void (*get_gdt)(struct kvm_vcpu *vcpu, struct descriptor_table *dt);
360 void (*set_gdt)(struct kvm_vcpu *vcpu, struct descriptor_table *dt);
361 unsigned long (*get_dr)(struct kvm_vcpu *vcpu, int dr);
362 void (*set_dr)(struct kvm_vcpu *vcpu, int dr, unsigned long value,
363 int *exception);
364 void (*cache_regs)(struct kvm_vcpu *vcpu);
365 void (*decache_regs)(struct kvm_vcpu *vcpu);
366 unsigned long (*get_rflags)(struct kvm_vcpu *vcpu);
367 void (*set_rflags)(struct kvm_vcpu *vcpu, unsigned long rflags);
368
369 void (*tlb_flush)(struct kvm_vcpu *vcpu);
370
371 void (*run)(struct kvm_vcpu *vcpu, struct kvm_run *run);
372 int (*handle_exit)(struct kvm_run *run, struct kvm_vcpu *vcpu);
373 void (*skip_emulated_instruction)(struct kvm_vcpu *vcpu);
374 void (*patch_hypercall)(struct kvm_vcpu *vcpu,
375 unsigned char *hypercall_addr);
376 int (*get_irq)(struct kvm_vcpu *vcpu);
377 void (*set_irq)(struct kvm_vcpu *vcpu, int vec);
378 void (*queue_exception)(struct kvm_vcpu *vcpu, unsigned nr,
379 bool has_error_code, u32 error_code);
380 bool (*exception_injected)(struct kvm_vcpu *vcpu);
381 void (*inject_pending_irq)(struct kvm_vcpu *vcpu);
382 void (*inject_pending_vectors)(struct kvm_vcpu *vcpu,
383 struct kvm_run *run);
384
385 int (*set_tss_addr)(struct kvm *kvm, unsigned int addr);
386};
387
388extern struct kvm_x86_ops *kvm_x86_ops;
389
390int kvm_mmu_module_init(void);
391void kvm_mmu_module_exit(void);
392
393void kvm_mmu_destroy(struct kvm_vcpu *vcpu);
394int kvm_mmu_create(struct kvm_vcpu *vcpu);
395int kvm_mmu_setup(struct kvm_vcpu *vcpu);
396void kvm_mmu_set_nonpresent_ptes(u64 trap_pte, u64 notrap_pte);
397
398int kvm_mmu_reset_context(struct kvm_vcpu *vcpu);
399void kvm_mmu_slot_remove_write_access(struct kvm *kvm, int slot);
400void kvm_mmu_zap_all(struct kvm *kvm);
401unsigned int kvm_mmu_calculate_mmu_pages(struct kvm *kvm);
402void kvm_mmu_change_mmu_pages(struct kvm *kvm, unsigned int kvm_nr_mmu_pages);
403
404enum emulation_result {
405 EMULATE_DONE, /* no further processing */
406 EMULATE_DO_MMIO, /* kvm_run filled with mmio request */
407 EMULATE_FAIL, /* can't emulate this instruction */
408};
409
410int emulate_instruction(struct kvm_vcpu *vcpu, struct kvm_run *run,
411 unsigned long cr2, u16 error_code, int no_decode);
412void kvm_report_emulation_failure(struct kvm_vcpu *vcpu, const char *context);
413void realmode_lgdt(struct kvm_vcpu *vcpu, u16 size, unsigned long address);
414void realmode_lidt(struct kvm_vcpu *vcpu, u16 size, unsigned long address);
415void realmode_lmsw(struct kvm_vcpu *vcpu, unsigned long msw,
416 unsigned long *rflags);
417
418unsigned long realmode_get_cr(struct kvm_vcpu *vcpu, int cr);
419void realmode_set_cr(struct kvm_vcpu *vcpu, int cr, unsigned long value,
420 unsigned long *rflags);
421int kvm_get_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 *data);
422int kvm_set_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 data);
423
424struct x86_emulate_ctxt;
425
426int kvm_emulate_pio(struct kvm_vcpu *vcpu, struct kvm_run *run, int in,
427 int size, unsigned port);
428int kvm_emulate_pio_string(struct kvm_vcpu *vcpu, struct kvm_run *run, int in,
429 int size, unsigned long count, int down,
430 gva_t address, int rep, unsigned port);
431void kvm_emulate_cpuid(struct kvm_vcpu *vcpu);
432int kvm_emulate_halt(struct kvm_vcpu *vcpu);
433int emulate_invlpg(struct kvm_vcpu *vcpu, gva_t address);
434int emulate_clts(struct kvm_vcpu *vcpu);
435int emulator_get_dr(struct x86_emulate_ctxt *ctxt, int dr,
436 unsigned long *dest);
437int emulator_set_dr(struct x86_emulate_ctxt *ctxt, int dr,
438 unsigned long value);
439
440void set_cr0(struct kvm_vcpu *vcpu, unsigned long cr0);
441void set_cr3(struct kvm_vcpu *vcpu, unsigned long cr3);
442void set_cr4(struct kvm_vcpu *vcpu, unsigned long cr4);
443void set_cr8(struct kvm_vcpu *vcpu, unsigned long cr8);
444unsigned long get_cr8(struct kvm_vcpu *vcpu);
445void lmsw(struct kvm_vcpu *vcpu, unsigned long msw);
446void kvm_get_cs_db_l_bits(struct kvm_vcpu *vcpu, int *db, int *l);
447
448int kvm_get_msr_common(struct kvm_vcpu *vcpu, u32 msr, u64 *pdata);
449int kvm_set_msr_common(struct kvm_vcpu *vcpu, u32 msr, u64 data);
450
451void kvm_queue_exception(struct kvm_vcpu *vcpu, unsigned nr);
452void kvm_queue_exception_e(struct kvm_vcpu *vcpu, unsigned nr, u32 error_code);
453void kvm_inject_page_fault(struct kvm_vcpu *vcpu, unsigned long cr2,
454 u32 error_code);
455
456void fx_init(struct kvm_vcpu *vcpu);
457
458int emulator_read_std(unsigned long addr,
459 void *val,
460 unsigned int bytes,
461 struct kvm_vcpu *vcpu);
462int emulator_write_emulated(unsigned long addr,
463 const void *val,
464 unsigned int bytes,
465 struct kvm_vcpu *vcpu);
466
467unsigned long segment_base(u16 selector);
468
469void kvm_mmu_flush_tlb(struct kvm_vcpu *vcpu);
470void kvm_mmu_pte_write(struct kvm_vcpu *vcpu, gpa_t gpa,
471 const u8 *new, int bytes);
472int kvm_mmu_unprotect_page_virt(struct kvm_vcpu *vcpu, gva_t gva);
473void __kvm_mmu_free_some_pages(struct kvm_vcpu *vcpu);
474int kvm_mmu_load(struct kvm_vcpu *vcpu);
475void kvm_mmu_unload(struct kvm_vcpu *vcpu);
476
477int kvm_emulate_hypercall(struct kvm_vcpu *vcpu);
478
479int kvm_fix_hypercall(struct kvm_vcpu *vcpu);
480
481int kvm_mmu_page_fault(struct kvm_vcpu *vcpu, gva_t gva, u32 error_code);
482
483int load_pdptrs(struct kvm_vcpu *vcpu, unsigned long cr3);
484int complete_pio(struct kvm_vcpu *vcpu);
485
486static inline struct kvm_mmu_page *page_header(hpa_t shadow_page)
487{
488 struct page *page = pfn_to_page(shadow_page >> PAGE_SHIFT);
489
490 return (struct kvm_mmu_page *)page_private(page);
491}
492
493static inline u16 read_fs(void)
494{
495 u16 seg;
496 asm("mov %%fs, %0" : "=g"(seg));
497 return seg;
498}
499
500static inline u16 read_gs(void)
501{
502 u16 seg;
503 asm("mov %%gs, %0" : "=g"(seg));
504 return seg;
505}
506
507static inline u16 read_ldt(void)
508{
509 u16 ldt;
510 asm("sldt %0" : "=g"(ldt));
511 return ldt;
512}
513
514static inline void load_fs(u16 sel)
515{
516 asm("mov %0, %%fs" : : "rm"(sel));
517}
518
519static inline void load_gs(u16 sel)
520{
521 asm("mov %0, %%gs" : : "rm"(sel));
522}
523
524#ifndef load_ldt
525static inline void load_ldt(u16 sel)
526{
527 asm("lldt %0" : : "rm"(sel));
528}
529#endif
530
531static inline void get_idt(struct descriptor_table *table)
532{
533 asm("sidt %0" : "=m"(*table));
534}
535
536static inline void get_gdt(struct descriptor_table *table)
537{
538 asm("sgdt %0" : "=m"(*table));
539}
540
541static inline unsigned long read_tr_base(void)
542{
543 u16 tr;
544 asm("str %0" : "=g"(tr));
545 return segment_base(tr);
546}
547
548#ifdef CONFIG_X86_64
549static inline unsigned long read_msr(unsigned long msr)
550{
551 u64 value;
552
553 rdmsrl(msr, value);
554 return value;
555}
556#endif
557
558static inline void fx_save(struct i387_fxsave_struct *image)
559{
560 asm volatile("fxsave (%0)" : : "r" (image) : "memory"); /* writes *image */
561}
562
563static inline void fx_restore(struct i387_fxsave_struct *image)
564{
565 asm volatile("fxrstor (%0)" : : "r" (image) : "memory"); /* reads *image */
566}
567
568static inline void fpu_init(void)
569{
570 asm("finit");
571}
572
573static inline u32 get_rdx_init_val(void)
574{
575 return 0x600; /* P6 family */
576}
577
578static inline void kvm_inject_gp(struct kvm_vcpu *vcpu, u32 error_code)
579{
580 kvm_queue_exception_e(vcpu, GP_VECTOR, error_code);
581}
582
583#define ASM_VMX_VMCLEAR_RAX ".byte 0x66, 0x0f, 0xc7, 0x30"
584#define ASM_VMX_VMLAUNCH ".byte 0x0f, 0x01, 0xc2"
585#define ASM_VMX_VMRESUME ".byte 0x0f, 0x01, 0xc3"
586#define ASM_VMX_VMPTRLD_RAX ".byte 0x0f, 0xc7, 0x30"
587#define ASM_VMX_VMREAD_RDX_RAX ".byte 0x0f, 0x78, 0xd0"
588#define ASM_VMX_VMWRITE_RAX_RDX ".byte 0x0f, 0x79, 0xd0"
589#define ASM_VMX_VMWRITE_RSP_RDX ".byte 0x0f, 0x79, 0xd4"
590#define ASM_VMX_VMXOFF ".byte 0x0f, 0x01, 0xc4"
591#define ASM_VMX_VMXON_RAX ".byte 0xf3, 0x0f, 0xc7, 0x30"
592
593#define MSR_IA32_TIME_STAMP_COUNTER 0x010
594
595#define TSS_IOPB_BASE_OFFSET 0x66
596#define TSS_BASE_SIZE 0x68
597#define TSS_IOPB_SIZE (65536 / 8)
598#define TSS_REDIRECTION_SIZE (256 / 8)
599#define RMODE_TSS_SIZE (TSS_BASE_SIZE + TSS_REDIRECTION_SIZE + TSS_IOPB_SIZE + 1)
600
601#endif
diff --git a/include/asm-x86/kvm_x86_emulate.h b/include/asm-x86/kvm_x86_emulate.h
new file mode 100644
index 000000000000..7db91b9bdcd4
--- /dev/null
+++ b/include/asm-x86/kvm_x86_emulate.h
@@ -0,0 +1,186 @@
1/******************************************************************************
2 * x86_emulate.h
3 *
4 * Generic x86 (32-bit and 64-bit) instruction decoder and emulator.
5 *
6 * Copyright (c) 2005 Keir Fraser
7 *
8 * From: xen-unstable 10676:af9809f51f81a3c43f276f00c81a52ef558afda4
9 */
10
11#ifndef __X86_EMULATE_H__
12#define __X86_EMULATE_H__
13
14struct x86_emulate_ctxt;
15
16/*
17 * x86_emulate_ops:
18 *
19 * These operations represent the instruction emulator's interface to memory.
20 * There are two categories of operation: those that act on ordinary memory
21 * regions (*_std), and those that act on memory regions known to require
22 * special treatment or emulation (*_emulated).
23 *
24 * The emulator assumes that an instruction accesses only one 'emulated memory'
25 * location, that this location is the given linear faulting address (cr2), and
26 * that this is one of the instruction's data operands. Instruction fetches and
27 * stack operations are assumed never to access emulated memory. The emulator
28 * automatically deduces which operand of a string-move operation is accessing
29 * emulated memory, and assumes that the other operand accesses normal memory.
30 *
31 * NOTES:
32 * 1. The emulator isn't very smart about emulated vs. standard memory.
33 * 'Emulated memory' access addresses should be checked for sanity.
34 * 'Normal memory' accesses may fault, and the caller must arrange to
35 * detect and handle reentrancy into the emulator via recursive faults.
36 * Accesses may be unaligned and may cross page boundaries.
37 * 2. If the access fails (cannot emulate, or a standard access faults) then
38 * it is up to the memop to propagate the fault to the guest VM via
39 * some out-of-band mechanism, unknown to the emulator. The memop signals
40 * failure by returning X86EMUL_PROPAGATE_FAULT to the emulator, which will
41 * then immediately bail.
42 * 3. Valid access sizes are 1, 2, 4 and 8 bytes. On x86/32 systems only
43 * cmpxchg8b_emulated need support 8-byte accesses.
44 * 4. The emulator cannot handle 64-bit mode emulation on an x86/32 system.
45 */
46/* Access completed successfully: continue emulation as normal. */
47#define X86EMUL_CONTINUE 0
48/* Access is unhandleable: bail from emulation and return error to caller. */
49#define X86EMUL_UNHANDLEABLE 1
50/* Terminate emulation but return success to the caller. */
51#define X86EMUL_PROPAGATE_FAULT 2 /* propagate a generated fault to guest */
52#define X86EMUL_RETRY_INSTR 2 /* retry the instruction for some reason */
53#define X86EMUL_CMPXCHG_FAILED 2 /* cmpxchg did not see expected value */
54struct x86_emulate_ops {
55 /*
56 * read_std: Read bytes of standard (non-emulated/special) memory.
57 * Used for instruction fetch, stack operations, and others.
58 * @addr: [IN ] Linear address from which to read.
59 * @val: [OUT] Value read from memory, zero-extended to 'u_long'.
60 * @bytes: [IN ] Number of bytes to read from memory.
61 */
62 int (*read_std)(unsigned long addr, void *val,
63 unsigned int bytes, struct kvm_vcpu *vcpu);
64
65 /*
66 * read_emulated: Read bytes from emulated/special memory area.
67 * @addr: [IN ] Linear address from which to read.
68 * @val: [OUT] Value read from memory, zero-extended to 'u_long'.
69 * @bytes: [IN ] Number of bytes to read from memory.
70 */
71 int (*read_emulated) (unsigned long addr,
72 void *val,
73 unsigned int bytes,
74 struct kvm_vcpu *vcpu);
75
76 /*
77 * write_emulated: Write bytes to emulated/special memory area.
78 * @addr: [IN ] Linear address to which to write.
79 * @val: [IN ] Value to write to memory (low-order bytes used as
80 * required).
81 * @bytes: [IN ] Number of bytes to write to memory.
82 */
83 int (*write_emulated) (unsigned long addr,
84 const void *val,
85 unsigned int bytes,
86 struct kvm_vcpu *vcpu);
87
88 /*
89 * cmpxchg_emulated: Emulate an atomic (LOCKed) CMPXCHG operation on an
90 * emulated/special memory area.
91 * @addr: [IN ] Linear address to access.
92 * @old: [IN ] Value expected to be current at @addr.
93 * @new: [IN ] Value to write to @addr.
94 * @bytes: [IN ] Number of bytes to access using CMPXCHG.
95 */
96 int (*cmpxchg_emulated) (unsigned long addr,
97 const void *old,
98 const void *new,
99 unsigned int bytes,
100 struct kvm_vcpu *vcpu);
101
102};
103
104/* Type, address-of, and value of an instruction's operand. */
105struct operand {
106 enum { OP_REG, OP_MEM, OP_IMM, OP_NONE } type;
107 unsigned int bytes;
108 unsigned long val, orig_val, *ptr;
109};
110
111struct fetch_cache {
112 u8 data[15];
113 unsigned long start;
114 unsigned long end;
115};
116
117struct decode_cache {
118 u8 twobyte;
119 u8 b;
120 u8 lock_prefix;
121 u8 rep_prefix;
122 u8 op_bytes;
123 u8 ad_bytes;
124 u8 rex_prefix;
125 struct operand src;
126 struct operand dst;
127 unsigned long *override_base;
128 unsigned int d;
129 unsigned long regs[NR_VCPU_REGS];
130 unsigned long eip;
131 /* modrm */
132 u8 modrm;
133 u8 modrm_mod;
134 u8 modrm_reg;
135 u8 modrm_rm;
136 u8 use_modrm_ea;
137 unsigned long modrm_ea;
138 unsigned long modrm_val;
139 struct fetch_cache fetch;
140};
141
142struct x86_emulate_ctxt {
143 /* The vcpu this emulation context is associated with. */
144 struct kvm_vcpu *vcpu;
145
146 /* Flags register image used by the emulator (presumably guest EFLAGS; confirm). */
147 unsigned long eflags;
148
149 /* Emulated execution mode, represented by an X86EMUL_MODE value. */
150 int mode;
151
152 unsigned long cs_base;
153 unsigned long ds_base;
154 unsigned long es_base;
155 unsigned long ss_base;
156 unsigned long gs_base;
157 unsigned long fs_base;
158
159 /* decode cache */
160
161 struct decode_cache decode;
162};
163
164/* Repeat String Operation Prefix */
165#define REPE_PREFIX 1
166#define REPNE_PREFIX 2
167
168/* Execution mode, passed to the emulator. */
169#define X86EMUL_MODE_REAL 0 /* Real mode. */
170#define X86EMUL_MODE_PROT16 2 /* 16-bit protected mode. */
171#define X86EMUL_MODE_PROT32 4 /* 32-bit protected mode. */
172#define X86EMUL_MODE_PROT64 8 /* 64-bit (long) mode. */
173
174/* Host execution mode. */
175#if defined(__i386__)
176#define X86EMUL_MODE_HOST X86EMUL_MODE_PROT32
177#elif defined(CONFIG_X86_64)
178#define X86EMUL_MODE_HOST X86EMUL_MODE_PROT64
179#endif
180
181int x86_decode_insn(struct x86_emulate_ctxt *ctxt,
182 struct x86_emulate_ops *ops);
183int x86_emulate_insn(struct x86_emulate_ctxt *ctxt,
184 struct x86_emulate_ops *ops);
185
186#endif /* __X86_EMULATE_H__ */
diff --git a/include/linux/kvm_host.h b/include/linux/kvm_host.h
new file mode 100644
index 000000000000..a85d5b6943de
--- /dev/null
+++ b/include/linux/kvm_host.h
@@ -0,0 +1,289 @@
1#ifndef __KVM_HOST_H
2#define __KVM_HOST_H
3
4/*
5 * This work is licensed under the terms of the GNU GPL, version 2. See
6 * the COPYING file in the top-level directory.
7 */
8
9#include <linux/types.h>
10#include <linux/hardirq.h>
11#include <linux/list.h>
12#include <linux/mutex.h>
13#include <linux/spinlock.h>
14#include <linux/signal.h>
15#include <linux/sched.h>
16#include <linux/mm.h>
17#include <linux/preempt.h>
18#include <asm/signal.h>
19
20#include <linux/kvm.h>
21#include <linux/kvm_para.h>
22
23#include <linux/kvm_types.h>
24
25#include <asm/kvm_host.h>
26
27#define KVM_MAX_VCPUS 4
28#define KVM_MEMORY_SLOTS 8
29/* memory slots that are not exposed to userspace */
30#define KVM_PRIVATE_MEM_SLOTS 4
31
32#define KVM_PIO_PAGE_OFFSET 1
33
34/*
35 * vcpu->requests bit members
36 */
37#define KVM_REQ_TLB_FLUSH 0
38
39
40struct kvm_vcpu;
41extern struct kmem_cache *kvm_vcpu_cache;
42
43struct kvm_guest_debug {
44 int enabled;
45 unsigned long bp[4];
46 int singlestep;
47};
48
49/*
50 * It would be nice to use something smarter than a linear search, TBD...
51 * Thankfully we don't expect many devices to register (famous last words :),
52 * so until then it will suffice. At least it's abstracted so we can change
53 * in one place.
54 */
55struct kvm_io_bus {
56 int dev_count;
57#define NR_IOBUS_DEVS 6
58 struct kvm_io_device *devs[NR_IOBUS_DEVS];
59};
60
61void kvm_io_bus_init(struct kvm_io_bus *bus);
62void kvm_io_bus_destroy(struct kvm_io_bus *bus);
63struct kvm_io_device *kvm_io_bus_find_dev(struct kvm_io_bus *bus, gpa_t addr);
64void kvm_io_bus_register_dev(struct kvm_io_bus *bus,
65 struct kvm_io_device *dev);
66
67struct kvm_vcpu {
68 struct kvm *kvm;
69 struct preempt_notifier preempt_notifier;
70 int vcpu_id;
71 struct mutex mutex;
72 int cpu;
73 struct kvm_run *run;
74 int guest_mode;
75 unsigned long requests;
76 struct kvm_guest_debug guest_debug;
77 int fpu_active;
78 int guest_fpu_loaded;
79 wait_queue_head_t wq;
80 int sigset_active;
81 sigset_t sigset;
82 struct kvm_vcpu_stat stat;
83
84#ifdef CONFIG_HAS_IOMEM
85 int mmio_needed;
86 int mmio_read_completed;
87 int mmio_is_write;
88 int mmio_size;
89 unsigned char mmio_data[8];
90 gpa_t mmio_phys_addr;
91#endif
92
93 struct kvm_vcpu_arch arch;
94};
95
96struct kvm_memory_slot {
97 gfn_t base_gfn;
98 unsigned long npages;
99 unsigned long flags;
100 unsigned long *rmap;
101 unsigned long *dirty_bitmap;
102 unsigned long userspace_addr;
103 int user_alloc;
104};
105
106struct kvm {
107 struct mutex lock; /* protects everything except vcpus */
108 struct mm_struct *mm; /* userspace tied to this vm */
109 int nmemslots;
110 struct kvm_memory_slot memslots[KVM_MEMORY_SLOTS +
111 KVM_PRIVATE_MEM_SLOTS];
112 struct kvm_vcpu *vcpus[KVM_MAX_VCPUS];
113 struct list_head vm_list;
114 struct file *filp;
115 struct kvm_io_bus mmio_bus;
116 struct kvm_io_bus pio_bus;
117 struct kvm_vm_stat stat;
118 struct kvm_arch arch;
119};
120
121/* The guest did something we don't support. */
122#define pr_unimpl(vcpu, fmt, ...) \
123 do { \
124 if (printk_ratelimit()) \
125 printk(KERN_ERR "kvm: %i: cpu%i " fmt, \
126 current->tgid, (vcpu)->vcpu_id , ## __VA_ARGS__); \
127 } while (0)
128
129#define kvm_printf(kvm, fmt ...) printk(KERN_DEBUG fmt)
130#define vcpu_printf(vcpu, fmt...) kvm_printf(vcpu->kvm, fmt)
131
132int kvm_vcpu_init(struct kvm_vcpu *vcpu, struct kvm *kvm, unsigned id);
133void kvm_vcpu_uninit(struct kvm_vcpu *vcpu);
134
135void vcpu_load(struct kvm_vcpu *vcpu);
136void vcpu_put(struct kvm_vcpu *vcpu);
137
138void decache_vcpus_on_cpu(int cpu);
139
140
141int kvm_init(void *opaque, unsigned int vcpu_size,
142 struct module *module);
143void kvm_exit(void);
144
145#define HPA_MSB ((sizeof(hpa_t) * 8) - 1)
146#define HPA_ERR_MASK ((hpa_t)1 << HPA_MSB)
147static inline int is_error_hpa(hpa_t hpa) { return hpa >> HPA_MSB; }
148struct page *gva_to_page(struct kvm_vcpu *vcpu, gva_t gva);
149
150extern struct page *bad_page;
151
152int is_error_page(struct page *page);
153int kvm_is_error_hva(unsigned long addr);
154int kvm_set_memory_region(struct kvm *kvm,
155 struct kvm_userspace_memory_region *mem,
156 int user_alloc);
157int __kvm_set_memory_region(struct kvm *kvm,
158 struct kvm_userspace_memory_region *mem,
159 int user_alloc);
160int kvm_arch_set_memory_region(struct kvm *kvm,
161 struct kvm_userspace_memory_region *mem,
162 struct kvm_memory_slot old,
163 int user_alloc);
164gfn_t unalias_gfn(struct kvm *kvm, gfn_t gfn);
165struct page *gfn_to_page(struct kvm *kvm, gfn_t gfn);
166void kvm_release_page_clean(struct page *page);
167void kvm_release_page_dirty(struct page *page);
168int kvm_read_guest_page(struct kvm *kvm, gfn_t gfn, void *data, int offset,
169 int len);
170int kvm_read_guest(struct kvm *kvm, gpa_t gpa, void *data, unsigned long len);
171int kvm_write_guest_page(struct kvm *kvm, gfn_t gfn, const void *data,
172 int offset, int len);
173int kvm_write_guest(struct kvm *kvm, gpa_t gpa, const void *data,
174 unsigned long len);
175int kvm_clear_guest_page(struct kvm *kvm, gfn_t gfn, int offset, int len);
176int kvm_clear_guest(struct kvm *kvm, gpa_t gpa, unsigned long len);
177struct kvm_memory_slot *gfn_to_memslot(struct kvm *kvm, gfn_t gfn);
178int kvm_is_visible_gfn(struct kvm *kvm, gfn_t gfn);
179void mark_page_dirty(struct kvm *kvm, gfn_t gfn);
180
181void kvm_vcpu_block(struct kvm_vcpu *vcpu);
182void kvm_resched(struct kvm_vcpu *vcpu);
183void kvm_load_guest_fpu(struct kvm_vcpu *vcpu);
184void kvm_put_guest_fpu(struct kvm_vcpu *vcpu);
185void kvm_flush_remote_tlbs(struct kvm *kvm);
186
187long kvm_arch_dev_ioctl(struct file *filp,
188 unsigned int ioctl, unsigned long arg);
189long kvm_arch_vcpu_ioctl(struct file *filp,
190 unsigned int ioctl, unsigned long arg);
191void kvm_arch_vcpu_load(struct kvm_vcpu *vcpu, int cpu);
192void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu);
193
194int kvm_dev_ioctl_check_extension(long ext);
195
196int kvm_get_dirty_log(struct kvm *kvm,
197 struct kvm_dirty_log *log, int *is_dirty);
198int kvm_vm_ioctl_get_dirty_log(struct kvm *kvm,
199 struct kvm_dirty_log *log);
200
201int kvm_vm_ioctl_set_memory_region(struct kvm *kvm,
202 struct
203 kvm_userspace_memory_region *mem,
204 int user_alloc);
205long kvm_arch_vm_ioctl(struct file *filp,
206 unsigned int ioctl, unsigned long arg);
207void kvm_arch_destroy_vm(struct kvm *kvm);
208
209int kvm_arch_vcpu_ioctl_get_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu);
210int kvm_arch_vcpu_ioctl_set_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu);
211
212int kvm_arch_vcpu_ioctl_translate(struct kvm_vcpu *vcpu,
213 struct kvm_translation *tr);
214
215int kvm_arch_vcpu_ioctl_get_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs);
216int kvm_arch_vcpu_ioctl_set_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs);
217int kvm_arch_vcpu_ioctl_get_sregs(struct kvm_vcpu *vcpu,
218 struct kvm_sregs *sregs);
219int kvm_arch_vcpu_ioctl_set_sregs(struct kvm_vcpu *vcpu,
220 struct kvm_sregs *sregs);
221int kvm_arch_vcpu_ioctl_debug_guest(struct kvm_vcpu *vcpu,
222 struct kvm_debug_guest *dbg);
223int kvm_arch_vcpu_ioctl_run(struct kvm_vcpu *vcpu, struct kvm_run *kvm_run);
224
225int kvm_arch_init(void *opaque);
226void kvm_arch_exit(void);
227
228int kvm_arch_vcpu_init(struct kvm_vcpu *vcpu);
229void kvm_arch_vcpu_uninit(struct kvm_vcpu *vcpu);
230
231void kvm_arch_vcpu_free(struct kvm_vcpu *vcpu);
232void kvm_arch_vcpu_load(struct kvm_vcpu *vcpu, int cpu);
233void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu);
234struct kvm_vcpu *kvm_arch_vcpu_create(struct kvm *kvm, unsigned int id);
235int kvm_arch_vcpu_setup(struct kvm_vcpu *vcpu);
236void kvm_arch_vcpu_destroy(struct kvm_vcpu *vcpu);
237
238int kvm_arch_vcpu_reset(struct kvm_vcpu *vcpu);
239void kvm_arch_hardware_enable(void *garbage);
240void kvm_arch_hardware_disable(void *garbage);
241int kvm_arch_hardware_setup(void);
242void kvm_arch_hardware_unsetup(void);
243void kvm_arch_check_processor_compat(void *rtn);
244int kvm_arch_vcpu_runnable(struct kvm_vcpu *vcpu);
245
246void kvm_free_physmem(struct kvm *kvm);
247
248struct kvm *kvm_arch_create_vm(void);
249void kvm_arch_destroy_vm(struct kvm *kvm);
250
251int kvm_cpu_get_interrupt(struct kvm_vcpu *v);
252int kvm_cpu_has_interrupt(struct kvm_vcpu *v);
253
254static inline void kvm_guest_enter(void)
255{
256 account_system_vtime(current);
257 current->flags |= PF_VCPU;
258}
259
260static inline void kvm_guest_exit(void)
261{
262 account_system_vtime(current);
263 current->flags &= ~PF_VCPU;
264}
265
266static inline int memslot_id(struct kvm *kvm, struct kvm_memory_slot *slot)
267{
268 return slot - kvm->memslots;
269}
270
271static inline gpa_t gfn_to_gpa(gfn_t gfn)
272{
273 return (gpa_t)gfn << PAGE_SHIFT;
274}
275
276enum kvm_stat_kind {
277 KVM_STAT_VM,
278 KVM_STAT_VCPU,
279};
280
281struct kvm_stats_debugfs_item {
282 const char *name;
283 int offset;
284 enum kvm_stat_kind kind;
285 struct dentry *dentry;
286};
287extern struct kvm_stats_debugfs_item debugfs_entries[];
288
289#endif
diff --git a/include/linux/kvm_types.h b/include/linux/kvm_types.h
new file mode 100644
index 000000000000..1c4e46decb22
--- /dev/null
+++ b/include/linux/kvm_types.h
@@ -0,0 +1,54 @@
1/*
2 * This program is free software; you can redistribute it and/or modify
3 * it under the terms of the GNU General Public License as published by
4 * the Free Software Foundation; either version 2 of the License.
5 *
6 * This program is distributed in the hope that it will be useful,
7 * but WITHOUT ANY WARRANTY; without even the implied warranty of
8 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
9 * GNU General Public License for more details.
10 *
11 * You should have received a copy of the GNU General Public License
12 * along with this program; if not, write to the Free Software
13 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
14 *
15 */
16
17#ifndef __KVM_TYPES_H__
18#define __KVM_TYPES_H__
19
20#include <asm/types.h>
21
22/*
23 * Address types:
24 *
25 * gva - guest virtual address
26 * gpa - guest physical address
27 * gfn - guest frame number
28 * hva - host virtual address
29 * hpa - host physical address
30 * hfn - host frame number
31 */
32
33typedef unsigned long gva_t;
34typedef u64 gpa_t;
35typedef unsigned long gfn_t;
36
37typedef unsigned long hva_t;
38typedef u64 hpa_t;
39typedef unsigned long hfn_t;
40
41struct kvm_pio_request {
42 unsigned long count;
43 int cur_count;
44 struct page *guest_pages[2];
45 unsigned guest_page_offset;
46 int in;
47 int port;
48 int size;
49 int string;
50 int down;
51 int rep;
52};
53
54#endif /* __KVM_TYPES_H__ */