kvm.h 22.3 KB
Newer Older
A
Avi Kivity 已提交
1 2 3 4 5 6 7 8 9 10 11 12
#ifndef __KVM_H
#define __KVM_H

/*
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 */

#include <linux/types.h>
#include <linux/list.h>
#include <linux/mutex.h>
#include <linux/spinlock.h>
M
Markus Rechberger 已提交
13 14
#include <linux/signal.h>
#include <linux/sched.h>
A
Avi Kivity 已提交
15
#include <linux/mm.h>
16
#include <linux/preempt.h>
A
Alexey Dobriyan 已提交
17
#include <asm/signal.h>
A
Avi Kivity 已提交
18 19

#include <linux/kvm.h>
I
Ingo Molnar 已提交
20
#include <linux/kvm_para.h>
A
Avi Kivity 已提交
21

22 23 24
#define CR3_PAE_RESERVED_BITS ((X86_CR3_PWT | X86_CR3_PCD) - 1)
#define CR3_NONPAE_RESERVED_BITS ((PAGE_SIZE-1) & ~(X86_CR3_PWT | X86_CR3_PCD))
#define CR3_L_MODE_RESERVED_BITS (CR3_NONPAE_RESERVED_BITS|0xFFFFFF0000000000ULL)
A
Avi Kivity 已提交
25 26

/*
 * CR0/CR4 bit sets used by the x86 KVM code.  Each macro is a plain OR of
 * X86_CR0_xxx / X86_CR4_xxx flags; see the users for the exact semantics.
 */
#define KVM_GUEST_CR0_MASK \
	(X86_CR0_PG | X86_CR0_PE | X86_CR0_WP | X86_CR0_NE \
	 | X86_CR0_NW | X86_CR0_CD)
#define KVM_VM_CR0_ALWAYS_ON \
	(X86_CR0_PG | X86_CR0_PE | X86_CR0_WP | X86_CR0_NE | X86_CR0_TS \
	 | X86_CR0_MP)
#define KVM_GUEST_CR4_MASK \
	(X86_CR4_VME | X86_CR4_PSE | X86_CR4_PAE | X86_CR4_PGE | X86_CR4_VMXE)
#define KVM_PMODE_VM_CR4_ALWAYS_ON (X86_CR4_PAE | X86_CR4_VMXE)
#define KVM_RMODE_VM_CR4_ALWAYS_ON (X86_CR4_VME | X86_CR4_PAE | X86_CR4_VMXE)
A
Avi Kivity 已提交
36 37 38 39

#define INVALID_PAGE (~(hpa_t)0)
#define UNMAPPED_GVA (~(gpa_t)0)

A
Avi Kivity 已提交
40
#define KVM_MAX_VCPUS 4
41
#define KVM_ALIAS_SLOTS 4
I
Izik Eidus 已提交
42
#define KVM_MEMORY_SLOTS 8
43 44
#define KVM_PERMILLE_MMU_PAGES 20
#define KVM_MIN_ALLOC_MMU_PAGES 64
45
#define KVM_NUM_MMU_PAGES 1024
A
Avi Kivity 已提交
46 47
#define KVM_MIN_FREE_MMU_PAGES 5
#define KVM_REFILL_PAGES 25
48
#define KVM_MAX_CPUID_ENTRIES 40
A
Avi Kivity 已提交
49 50

#define DE_VECTOR 0
51
#define UD_VECTOR 6
A
Anthony Liguori 已提交
52
#define NM_VECTOR 7
A
Avi Kivity 已提交
53 54 55 56 57 58 59 60 61 62 63 64
#define DF_VECTOR 8
#define TS_VECTOR 10
#define NP_VECTOR 11
#define SS_VECTOR 12
#define GP_VECTOR 13
#define PF_VECTOR 14

#define SELECTOR_TI_MASK (1 << 2)
#define SELECTOR_RPL_MASK 0x03

#define IOPL_SHIFT 12

65 66
#define KVM_PIO_PAGE_OFFSET 1

67 68 69
/*
 * vcpu->requests bit members
 */
70
#define KVM_REQ_TLB_FLUSH          0
71

A
Avi Kivity 已提交
72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90
/*
 * Address types:
 *
 *  gva - guest virtual address
 *  gpa - guest physical address
 *  gfn - guest frame number
 *  hva - host virtual address
 *  hpa - host physical address
 *  hfn - host frame number
 */

typedef unsigned long  gva_t;
typedef u64            gpa_t;
typedef unsigned long  gfn_t;

typedef unsigned long  hva_t;
typedef u64            hpa_t;
typedef unsigned long  hfn_t;

91 92 93 94 95 96 97 98 99 100 101 102 103 104
#define NR_PTE_CHAIN_ENTRIES 5

/*
 * One fixed-size chunk of parent-pte pointers.  Chunks are linked through
 * an hlist (struct kvm_mmu_page::parent_ptes is annotated as holding
 * kvm_pte_chain entries).
 */
struct kvm_pte_chain {
	u64 *parent_ptes[NR_PTE_CHAIN_ENTRIES];
	struct hlist_node link;
};

/*
 * kvm_mmu_page_role, below, is defined as:
 *
 *   bits 0:3 - total guest paging levels (2-4, or zero for real mode)
 *   bits 4:7 - page table level for this shadow (1-4)
 *   bits 8:9 - page table quadrant for 2-level guests
 *   bits 10:15 - padding, so that 'word' prints nicely in hex
 *   bit   16 - "metaphysical" - gfn is not a real page (huge page/real mode)
 *   bits 17:19 - "access" - the user, writable, and nx bits of a huge page pde
 *
 * 'word' overlays all of the bit-fields so a role can be handled as a
 * single integer.
 */
union kvm_mmu_page_role {
	unsigned word;
	struct {
		unsigned glevels : 4;
		unsigned level : 4;
		unsigned quadrant : 2;
		unsigned pad_for_nice_hex_output : 6;
		unsigned metaphysical : 1;
		unsigned hugepage_access : 3;
	};
};

A
Avi Kivity 已提交
119 120
struct kvm_mmu_page {
	struct list_head link;
121 122 123 124 125 126 127 128 129
	struct hlist_node hash_link;

	/*
	 * The following two entries are used to key the shadow page in the
	 * hash table.
	 */
	gfn_t gfn;
	union kvm_mmu_page_role role;

130
	u64 *spt;
131 132
	/* hold the gfn of each spte inside spt */
	gfn_t *gfns;
A
Avi Kivity 已提交
133 134 135
	unsigned long slot_bitmap; /* One bit set per slot which has memory
				    * in this shadow page.
				    */
136
	int multimapped;         /* More than one parent_pte? */
137
	int root_count;          /* Currently serving as active root */
138 139 140 141
	union {
		u64 *parent_pte;               /* !multimapped */
		struct hlist_head parent_ptes; /* multimapped, kvm_pte_chain */
	};
A
Avi Kivity 已提交
142 143 144
};

struct kvm_vcpu;
145
extern struct kmem_cache *kvm_vcpu_cache;
A
Avi Kivity 已提交
146 147 148 149 150 151 152 153 154 155 156

/*
 * x86 supports 3 paging modes (4-level 64-bit, 3-level 64-bit, and 2-level
 * 32-bit).  The kvm_mmu structure abstracts the details of the current mmu
 * mode: the callbacks below are the per-mode operations, followed by the
 * root/level state for the active mode.
 */
struct kvm_mmu {
	void (*new_cr3)(struct kvm_vcpu *vcpu);
	int (*page_fault)(struct kvm_vcpu *vcpu, gva_t gva, u32 err);
	void (*free)(struct kvm_vcpu *vcpu);
	gpa_t (*gva_to_gpa)(struct kvm_vcpu *vcpu, gva_t gva);
	void (*prefetch_page)(struct kvm_vcpu *vcpu,
			      struct kvm_mmu_page *page);
	hpa_t root_hpa;		/* INVALID_PAGE when no root is loaded (see kvm_mmu_reload()) */
	int root_level;
	int shadow_root_level;

	u64 *pae_root;
};

166
#define KVM_NR_MEM_OBJS 40

/*
 * We don't want allocation failures within the mmu code, so we preallocate
 * enough memory for a single page fault in a cache.
 */
struct kvm_mmu_memory_cache {
	int nobjs;	/* NOTE(review): presumably the count of valid entries in objects[] */
	void *objects[KVM_NR_MEM_OBJS];
};
A
Avi Kivity 已提交
177 178 179 180 181 182 183 184 185 186 187 188 189 190 191
/* Guest debugging state kept per vcpu (see struct kvm_vcpu::guest_debug). */
struct kvm_guest_debug {
	int enabled;
	unsigned long bp[4];	/* NOTE(review): presumably breakpoint addresses - confirm */
	int singlestep;
};

/*
 * Indices into kvm_vcpu::regs[].  R8-R15 exist only on 64-bit builds, so
 * NR_VCPU_REGS is 16 with CONFIG_X86_64 and 8 without it.
 */
enum {
	VCPU_REGS_RAX = 0,
	VCPU_REGS_RCX = 1,
	VCPU_REGS_RDX = 2,
	VCPU_REGS_RBX = 3,
	VCPU_REGS_RSP = 4,
	VCPU_REGS_RBP = 5,
	VCPU_REGS_RSI = 6,
	VCPU_REGS_RDI = 7,
#ifdef CONFIG_X86_64
	VCPU_REGS_R8 = 8,
	VCPU_REGS_R9 = 9,
	VCPU_REGS_R10 = 10,
	VCPU_REGS_R11 = 11,
	VCPU_REGS_R12 = 12,
	VCPU_REGS_R13 = 13,
	VCPU_REGS_R14 = 14,
	VCPU_REGS_R15 = 15,
#endif
	NR_VCPU_REGS
};

/* Identifiers for the segment registers, plus TR and LDTR. */
enum {
	VCPU_SREG_CS   = 0,
	VCPU_SREG_DS   = 1,
	VCPU_SREG_ES   = 2,
	VCPU_SREG_FS   = 3,
	VCPU_SREG_GS   = 4,
	VCPU_SREG_SS   = 5,
	VCPU_SREG_TR   = 6,
	VCPU_SREG_LDTR = 7,
};

216 217
#include "x86_emulate.h"

218 219 220 221 222 223
/* State of a port I/O request (embedded in struct kvm_vcpu as 'pio'). */
struct kvm_pio_request {
	unsigned long count;
	int cur_count;
	struct page *guest_pages[2];
	unsigned guest_page_offset;
	int in;
	int port;
	int size;
	int string;
	int down;
	int rep;
};

A
Avi Kivity 已提交
231 232 233 234 235 236 237 238 239 240 241 242
/* Event counters (embedded in struct kvm_vcpu as 'stat'). */
struct kvm_stat {
	u32 pf_fixed;
	u32 pf_guest;
	u32 tlb_flush;
	u32 invlpg;

	u32 exits;
	u32 io_exits;
	u32 mmio_exits;
	u32 signal_exits;
	u32 irq_window_exits;
	u32 halt_exits;
	u32 halt_wakeup;
	u32 request_irq_exits;
	u32 irq_exits;
	u32 light_exits;
	u32 efer_reload;
};

250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287
/*
 * An emulated I/O device: a set of callbacks plus an opaque pointer.
 * Callers go through the kvm_iodevice_*() wrappers below; of the four
 * callbacks only 'destructor' is checked for NULL before being called.
 */
struct kvm_io_device {
	void (*read)(struct kvm_io_device *this,
		     gpa_t addr,
		     int len,
		     void *val);
	void (*write)(struct kvm_io_device *this,
		      gpa_t addr,
		      int len,
		      const void *val);
	int (*in_range)(struct kvm_io_device *this, gpa_t addr);
	void (*destructor)(struct kvm_io_device *this);

	void             *private;	/* opaque data for the device implementation */
};

/*
 * Forward a read of @len bytes at @addr to the device's read callback,
 * which is handed @val as its value buffer.  The callback must be set.
 */
static inline void kvm_iodevice_read(struct kvm_io_device *dev,
				     gpa_t addr,
				     int len,
				     void *val)
{
	(*dev->read)(dev, addr, len, val);
}

/*
 * Forward a write of @len bytes at @addr to the device's write callback,
 * which is handed @val as its value buffer.  The callback must be set.
 */
static inline void kvm_iodevice_write(struct kvm_io_device *dev,
				      gpa_t addr,
				      int len,
				      const void *val)
{
	(*dev->write)(dev, addr, len, val);
}

/* Return whatever the device's in_range callback reports for @addr. */
static inline int kvm_iodevice_inrange(struct kvm_io_device *dev, gpa_t addr)
{
	int claimed = (*dev->in_range)(dev, addr);

	return claimed;
}

static inline void kvm_iodevice_destructor(struct kvm_io_device *dev)
{
288 289
	if (dev->destructor)
		dev->destructor(dev);
290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309
}

/*
 * It would be nice to use something smarter than a linear search, TBD...
 * Thankfully we don't expect many devices to register (famous last words :),
 * so until then it will suffice.  At least it's abstracted so we can change
 * it in one place.
 */
struct kvm_io_bus {
	int                   dev_count;
#define NR_IOBUS_DEVS 6
	struct kvm_io_device *devs[NR_IOBUS_DEVS];
};

void kvm_io_bus_init(struct kvm_io_bus *bus);
void kvm_io_bus_destroy(struct kvm_io_bus *bus);
struct kvm_io_device *kvm_io_bus_find_dev(struct kvm_io_bus *bus, gpa_t addr);
void kvm_io_bus_register_dev(struct kvm_io_bus *bus,
			     struct kvm_io_device *dev);

A
Avi Kivity 已提交
310 311
struct kvm_vcpu {
	struct kvm *kvm;
312
	struct preempt_notifier preempt_notifier;
313
	int vcpu_id;
A
Avi Kivity 已提交
314 315
	struct mutex mutex;
	int   cpu;
316
	u64 host_tsc;
317
	struct kvm_run *run;
318
	int interrupt_window_open;
319 320
	int guest_mode;
	unsigned long requests;
A
Avi Kivity 已提交
321
	unsigned long irq_summary; /* bit vector: 1 per word in irq_pending */
322
	DECLARE_BITMAP(irq_pending, KVM_NR_INTERRUPTS);
A
Avi Kivity 已提交
323 324 325 326 327 328 329 330
	unsigned long regs[NR_VCPU_REGS]; /* for rsp: vcpu_load_rsp_rip() */
	unsigned long rip;      /* needs vcpu_load_rsp_rip() */

	unsigned long cr0;
	unsigned long cr2;
	unsigned long cr3;
	unsigned long cr4;
	unsigned long cr8;
331
	u64 pdptrs[4]; /* pae */
A
Avi Kivity 已提交
332 333
	u64 shadow_efer;
	u64 apic_base;
E
Eddie Dong 已提交
334
	struct kvm_lapic *apic;    /* kernel irqchip context */
335 336 337 338 339 340 341
#define VCPU_MP_STATE_RUNNABLE          0
#define VCPU_MP_STATE_UNINITIALIZED     1
#define VCPU_MP_STATE_INIT_RECEIVED     2
#define VCPU_MP_STATE_SIPI_RECEIVED     3
#define VCPU_MP_STATE_HALTED            4
	int mp_state;
	int sipi_vector;
342
	u64 ia32_misc_enable_msr;
A
Avi Kivity 已提交
343 344 345

	struct kvm_mmu mmu;

346 347
	struct kvm_mmu_memory_cache mmu_pte_chain_cache;
	struct kvm_mmu_memory_cache mmu_rmap_desc_cache;
348 349
	struct kvm_mmu_memory_cache mmu_page_cache;
	struct kvm_mmu_memory_cache mmu_page_header_cache;
350

351 352
	gfn_t last_pt_write_gfn;
	int   last_pt_write_count;
353
	u64  *last_pte_updated;
354

A
Avi Kivity 已提交
355 356
	struct kvm_guest_debug guest_debug;

357 358
	struct i387_fxsave_struct host_fx_image;
	struct i387_fxsave_struct guest_fx_image;
A
Anthony Liguori 已提交
359
	int fpu_active;
360
	int guest_fpu_loaded;
A
Avi Kivity 已提交
361 362 363 364 365 366 367

	int mmio_needed;
	int mmio_read_completed;
	int mmio_is_write;
	int mmio_size;
	unsigned char mmio_data[8];
	gpa_t mmio_phys_addr;
368
	gva_t mmio_fault_cr2;
369 370
	struct kvm_pio_request pio;
	void *pio_data;
E
Eddie Dong 已提交
371
	wait_queue_head_t wq;
A
Avi Kivity 已提交
372

A
Avi Kivity 已提交
373 374 375
	int sigset_active;
	sigset_t sigset;

A
Avi Kivity 已提交
376 377
	struct kvm_stat stat;

A
Avi Kivity 已提交
378 379 380 381 382 383 384 385 386 387
	struct {
		int active;
		u8 save_iopl;
		struct kvm_save_segment {
			u16 selector;
			unsigned long base;
			u32 limit;
			u32 ar;
		} tr, es, ds, fs, gs;
	} rmode;
388
	int halt_request; /* real mode on Intel only */
389 390 391

	int cpuid_nent;
	struct kvm_cpuid_entry cpuid_entries[KVM_MAX_CPUID_ENTRIES];
392 393 394 395

	/* emulate context */

	struct x86_emulate_ctxt emulate_ctxt;
A
Avi Kivity 已提交
396 397
};

398 399 400 401 402 403
/*
 * One memory alias entry (struct kvm holds KVM_ALIAS_SLOTS of these).
 * NOTE(review): presumably maps npages frames starting at base_gfn onto
 * target_gfn - confirm against unalias_gfn().
 */
struct kvm_mem_alias {
	gfn_t base_gfn;
	unsigned long npages;
	gfn_t target_gfn;
};

A
Avi Kivity 已提交
404 405 406 407 408
/* One guest memory slot (struct kvm holds KVM_MEMORY_SLOTS of these). */
struct kvm_memory_slot {
	gfn_t base_gfn;
	unsigned long npages;
	unsigned long flags;
	struct page **phys_mem;
	unsigned long *rmap;
	unsigned long *dirty_bitmap;
	int user_alloc; /* user allocated memory */
	unsigned long userspace_addr;
};

struct kvm {
S
Shaohua Li 已提交
416
	struct mutex lock; /* protects everything except vcpus */
417 418
	int naliases;
	struct kvm_mem_alias aliases[KVM_ALIAS_SLOTS];
A
Avi Kivity 已提交
419 420
	int nmemslots;
	struct kvm_memory_slot memslots[KVM_MEMORY_SLOTS];
421 422 423
	/*
	 * Hash table of struct kvm_mmu_page.
	 */
A
Avi Kivity 已提交
424
	struct list_head active_mmu_pages;
425 426 427
	unsigned int n_free_mmu_pages;
	unsigned int n_requested_mmu_pages;
	unsigned int n_alloc_mmu_pages;
428
	struct hlist_head mmu_page_hash[KVM_NUM_MMU_PAGES];
R
Rusty Russell 已提交
429
	struct kvm_vcpu *vcpus[KVM_MAX_VCPUS];
430
	unsigned long rmap_overflow;
431
	struct list_head vm_list;
A
Avi Kivity 已提交
432
	struct file *filp;
433
	struct kvm_io_bus mmio_bus;
434
	struct kvm_io_bus pio_bus;
435
	struct kvm_pic *vpic;
E
Eddie Dong 已提交
436
	struct kvm_ioapic *vioapic;
437
	int round_robin_prev_vcpu;
A
Avi Kivity 已提交
438 439
};

440 441 442 443 444
/* Accessor for the VM's PIC pointer (kvm->vpic). */
static inline struct kvm_pic *pic_irqchip(struct kvm *kvm)
{
	struct kvm_pic *pic = kvm->vpic;

	return pic;
}

E
Eddie Dong 已提交
445 446 447 448 449
/* Accessor for the VM's IOAPIC pointer (kvm->vioapic). */
static inline struct kvm_ioapic *ioapic_irqchip(struct kvm *kvm)
{
	struct kvm_ioapic *ioapic = kvm->vioapic;

	return ioapic;
}

450 451 452 453 454
/* Return 1 when the VM has a PIC pointer set (pic_irqchip() is non-NULL), else 0. */
static inline int irqchip_in_kernel(struct kvm *kvm)
{
	return pic_irqchip(kvm) != NULL;
}

A
Avi Kivity 已提交
455 456 457 458 459
/*
 * Limit/base pair stored by sidt/sgdt (see get_idt()/get_gdt()).  The
 * struct is packed so that 'base' follows 'limit' without padding.
 */
struct descriptor_table {
	u16 limit;
	unsigned long base;
} __attribute__((packed));

460
struct kvm_x86_ops {
A
Avi Kivity 已提交
461 462 463 464
	int (*cpu_has_kvm_support)(void);          /* __init */
	int (*disabled_by_bios)(void);             /* __init */
	void (*hardware_enable)(void *dummy);      /* __init */
	void (*hardware_disable)(void *dummy);
Y
Yang, Sheng 已提交
465
	void (*check_processor_compatibility)(void *rtn);
A
Avi Kivity 已提交
466 467 468
	int (*hardware_setup)(void);               /* __init */
	void (*hardware_unsetup)(void);            /* __exit */

R
Rusty Russell 已提交
469 470
	/* Create, but do not attach this VCPU */
	struct kvm_vcpu *(*vcpu_create)(struct kvm *kvm, unsigned id);
A
Avi Kivity 已提交
471
	void (*vcpu_free)(struct kvm_vcpu *vcpu);
472
	void (*vcpu_reset)(struct kvm_vcpu *vcpu);
A
Avi Kivity 已提交
473

474
	void (*prepare_guest_switch)(struct kvm_vcpu *vcpu);
475
	void (*vcpu_load)(struct kvm_vcpu *vcpu, int cpu);
A
Avi Kivity 已提交
476
	void (*vcpu_put)(struct kvm_vcpu *vcpu);
A
Avi Kivity 已提交
477
	void (*vcpu_decache)(struct kvm_vcpu *vcpu);
A
Avi Kivity 已提交
478 479 480

	int (*set_guest_debug)(struct kvm_vcpu *vcpu,
			       struct kvm_debug_guest *dbg);
481
	void (*guest_debug_pre)(struct kvm_vcpu *vcpu);
A
Avi Kivity 已提交
482 483 484 485 486 487 488 489
	int (*get_msr)(struct kvm_vcpu *vcpu, u32 msr_index, u64 *pdata);
	int (*set_msr)(struct kvm_vcpu *vcpu, u32 msr_index, u64 data);
	u64 (*get_segment_base)(struct kvm_vcpu *vcpu, int seg);
	void (*get_segment)(struct kvm_vcpu *vcpu,
			    struct kvm_segment *var, int seg);
	void (*set_segment)(struct kvm_vcpu *vcpu,
			    struct kvm_segment *var, int seg);
	void (*get_cs_db_l_bits)(struct kvm_vcpu *vcpu, int *db, int *l);
490
	void (*decache_cr4_guest_bits)(struct kvm_vcpu *vcpu);
A
Avi Kivity 已提交
491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512
	void (*set_cr0)(struct kvm_vcpu *vcpu, unsigned long cr0);
	void (*set_cr3)(struct kvm_vcpu *vcpu, unsigned long cr3);
	void (*set_cr4)(struct kvm_vcpu *vcpu, unsigned long cr4);
	void (*set_efer)(struct kvm_vcpu *vcpu, u64 efer);
	void (*get_idt)(struct kvm_vcpu *vcpu, struct descriptor_table *dt);
	void (*set_idt)(struct kvm_vcpu *vcpu, struct descriptor_table *dt);
	void (*get_gdt)(struct kvm_vcpu *vcpu, struct descriptor_table *dt);
	void (*set_gdt)(struct kvm_vcpu *vcpu, struct descriptor_table *dt);
	unsigned long (*get_dr)(struct kvm_vcpu *vcpu, int dr);
	void (*set_dr)(struct kvm_vcpu *vcpu, int dr, unsigned long value,
		       int *exception);
	void (*cache_regs)(struct kvm_vcpu *vcpu);
	void (*decache_regs)(struct kvm_vcpu *vcpu);
	unsigned long (*get_rflags)(struct kvm_vcpu *vcpu);
	void (*set_rflags)(struct kvm_vcpu *vcpu, unsigned long rflags);

	void (*tlb_flush)(struct kvm_vcpu *vcpu);
	void (*inject_page_fault)(struct kvm_vcpu *vcpu,
				  unsigned long addr, u32 err_code);

	void (*inject_gp)(struct kvm_vcpu *vcpu, unsigned err_code);

513 514
	void (*run)(struct kvm_vcpu *vcpu, struct kvm_run *run);
	int (*handle_exit)(struct kvm_run *run, struct kvm_vcpu *vcpu);
A
Avi Kivity 已提交
515
	void (*skip_emulated_instruction)(struct kvm_vcpu *vcpu);
I
Ingo Molnar 已提交
516 517
	void (*patch_hypercall)(struct kvm_vcpu *vcpu,
				unsigned char *hypercall_addr);
E
Eddie Dong 已提交
518 519
	int (*get_irq)(struct kvm_vcpu *vcpu);
	void (*set_irq)(struct kvm_vcpu *vcpu, int vec);
520 521 522
	void (*inject_pending_irq)(struct kvm_vcpu *vcpu);
	void (*inject_pending_vectors)(struct kvm_vcpu *vcpu,
				       struct kvm_run *run);
A
Avi Kivity 已提交
523 524
};

525
extern struct kvm_x86_ops *kvm_x86_ops;
A
Avi Kivity 已提交
526

527 528 529 530 531 532
/*
 * The guest did something we don't support.
 *
 * Rate-limited KERN_ERR message, prefixed with the current task's tgid
 * and the vcpu id; @fmt and the remaining arguments are printk-style.
 */
#define pr_unimpl(vcpu, fmt, ...)					\
 do {									\
	if (printk_ratelimit())						\
		printk(KERN_ERR "kvm: %i: cpu%i " fmt,			\
		       current->tgid, (vcpu)->vcpu_id , ## __VA_ARGS__); \
 } while (0)
534

A
Avi Kivity 已提交
535 536 537
#define kvm_printf(kvm, fmt ...) printk(KERN_DEBUG fmt)
#define vcpu_printf(vcpu, fmt...) kvm_printf(vcpu->kvm, fmt)

R
Rusty Russell 已提交
538 539 540
int kvm_vcpu_init(struct kvm_vcpu *vcpu, struct kvm *kvm, unsigned id);
void kvm_vcpu_uninit(struct kvm_vcpu *vcpu);

541 542 543 544
void vcpu_load(struct kvm_vcpu *vcpu);
void vcpu_put(struct kvm_vcpu *vcpu);


545
/* Counterpart of kvm_exit_x86(); takes the backend's callback table. */
int kvm_init_x86(struct kvm_x86_ops *ops, unsigned int vcpu_size,
		  struct module *module);
547
void kvm_exit_x86(void);
A
Avi Kivity 已提交
548

549 550 551
int kvm_mmu_module_init(void);
void kvm_mmu_module_exit(void);

A
Avi Kivity 已提交
552
void kvm_mmu_destroy(struct kvm_vcpu *vcpu);
553 554
int kvm_mmu_create(struct kvm_vcpu *vcpu);
int kvm_mmu_setup(struct kvm_vcpu *vcpu);
555
void kvm_mmu_set_nonpresent_ptes(u64 trap_pte, u64 notrap_pte);
A
Avi Kivity 已提交
556 557

int kvm_mmu_reset_context(struct kvm_vcpu *vcpu);
558 559
void kvm_mmu_slot_remove_write_access(struct kvm *kvm, int slot);
void kvm_mmu_zap_all(struct kvm *kvm);
560
void kvm_mmu_change_mmu_pages(struct kvm *kvm, unsigned int kvm_nr_mmu_pages);
A
Avi Kivity 已提交
561

562
hpa_t gpa_to_hpa(struct kvm *kvm, gpa_t gpa);
A
Avi Kivity 已提交
563 564 565 566
/* Index of the most significant bit of an hpa_t, and a mask selecting it. */
#define HPA_MSB ((sizeof(hpa_t) * 8) - 1)
#define HPA_ERR_MASK ((hpa_t)1 << HPA_MSB)

/* Return 1 if the top bit of @hpa is set, 0 otherwise. */
static inline int is_error_hpa(hpa_t hpa)
{
	return (hpa & HPA_ERR_MASK) != 0;
}
hpa_t gva_to_hpa(struct kvm_vcpu *vcpu, gva_t gva);
567
struct page *gva_to_page(struct kvm_vcpu *vcpu, gva_t gva);
A
Avi Kivity 已提交
568

569
extern struct page *bad_page;
A
Avi Kivity 已提交
570

571
int is_error_page(struct page *page);
572
gfn_t unalias_gfn(struct kvm *kvm, gfn_t gfn);
A
Avi Kivity 已提交
573
struct page *gfn_to_page(struct kvm *kvm, gfn_t gfn);
574
void kvm_release_page(struct page *page);
575 576 577 578 579 580 581 582 583
int kvm_read_guest_page(struct kvm *kvm, gfn_t gfn, void *data, int offset,
			int len);
int kvm_read_guest(struct kvm *kvm, gpa_t gpa, void *data, unsigned long len);
int kvm_write_guest_page(struct kvm *kvm, gfn_t gfn, const void *data,
			 int offset, int len);
int kvm_write_guest(struct kvm *kvm, gpa_t gpa, const void *data,
		    unsigned long len);
int kvm_clear_guest_page(struct kvm *kvm, gfn_t gfn, int offset, int len);
int kvm_clear_guest(struct kvm *kvm, gpa_t gpa, unsigned long len);
A
Avi Kivity 已提交
584 585 586 587 588 589 590 591 592 593
struct kvm_memory_slot *gfn_to_memslot(struct kvm *kvm, gfn_t gfn);
void mark_page_dirty(struct kvm *kvm, gfn_t gfn);

/* Outcome of emulate_instruction(). */
enum emulation_result {
	/* no further processing */
	EMULATE_DONE    = 0,
	/* kvm_run filled with mmio request */
	EMULATE_DO_MMIO = 1,
	/* can't emulate this instruction */
	EMULATE_FAIL    = 2,
};

/* Instruction emulation entry point and its failure-report helper. */
int emulate_instruction(struct kvm_vcpu *vcpu, struct kvm_run *run,
			unsigned long cr2, u16 error_code, int no_decode);
void kvm_report_emulation_failure(struct kvm_vcpu *vcpu, const char *context);
A
Avi Kivity 已提交
596 597 598 599 600 601 602 603
void realmode_lgdt(struct kvm_vcpu *vcpu, u16 size, unsigned long address);
void realmode_lidt(struct kvm_vcpu *vcpu, u16 size, unsigned long address);
void realmode_lmsw(struct kvm_vcpu *vcpu, unsigned long msw,
		   unsigned long *rflags);

unsigned long realmode_get_cr(struct kvm_vcpu *vcpu, int cr);
void realmode_set_cr(struct kvm_vcpu *vcpu, int cr, unsigned long value,
		     unsigned long *rflags);
604 605
int kvm_get_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 *data);
int kvm_set_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 data);
A
Avi Kivity 已提交
606 607 608

struct x86_emulate_ctxt;

M
Mike Day 已提交
609
/* Non-string port I/O emulation; see kvm_emulate_pio_string() for the string form. */
int kvm_emulate_pio(struct kvm_vcpu *vcpu, struct kvm_run *run, int in,
		     int size, unsigned port);
int kvm_emulate_pio_string(struct kvm_vcpu *vcpu, struct kvm_run *run, int in,
			   int size, unsigned long count, int down,
			    gva_t address, int rep, unsigned port);
614
void kvm_emulate_cpuid(struct kvm_vcpu *vcpu);
615
int kvm_emulate_halt(struct kvm_vcpu *vcpu);
A
Avi Kivity 已提交
616 617
int emulate_invlpg(struct kvm_vcpu *vcpu, gva_t address);
int emulate_clts(struct kvm_vcpu *vcpu);
M
Mike Day 已提交
618
/* Debug-register read for the emulator; the value is stored through @dest. */
int emulator_get_dr(struct x86_emulate_ctxt *ctxt, int dr,
		    unsigned long *dest);
int emulator_set_dr(struct x86_emulate_ctxt *ctxt, int dr,
		    unsigned long value);

/* Control-register setters; each takes the new value for its own register. */
void set_cr0(struct kvm_vcpu *vcpu, unsigned long cr0);
void set_cr3(struct kvm_vcpu *vcpu, unsigned long cr3);
void set_cr4(struct kvm_vcpu *vcpu, unsigned long cr4);
void set_cr8(struct kvm_vcpu *vcpu, unsigned long cr8);
627
unsigned long get_cr8(struct kvm_vcpu *vcpu);
A
Avi Kivity 已提交
628
void lmsw(struct kvm_vcpu *vcpu, unsigned long msw);
629
void kvm_get_cs_db_l_bits(struct kvm_vcpu *vcpu, int *db, int *l);
A
Avi Kivity 已提交
630

631 632
int kvm_get_msr_common(struct kvm_vcpu *vcpu, u32 msr, u64 *pdata);
int kvm_set_msr_common(struct kvm_vcpu *vcpu, u32 msr, u64 data);
A
Avi Kivity 已提交
633 634 635 636

void fx_init(struct kvm_vcpu *vcpu);

void kvm_resched(struct kvm_vcpu *vcpu);
637 638
void kvm_load_guest_fpu(struct kvm_vcpu *vcpu);
void kvm_put_guest_fpu(struct kvm_vcpu *vcpu);
639
void kvm_flush_remote_tlbs(struct kvm *kvm);
A
Avi Kivity 已提交
640

641
/* Emulator read helper: @bytes bytes at @addr into @val, on behalf of @vcpu. */
int emulator_read_std(unsigned long addr,
		      void *val,
		      unsigned int bytes,
		      struct kvm_vcpu *vcpu);
int emulator_write_emulated(unsigned long addr,
			    const void *val,
			    unsigned int bytes,
			    struct kvm_vcpu *vcpu);
A
Avi Kivity 已提交
649 650 651

unsigned long segment_base(u16 selector);

652
void kvm_mmu_pte_write(struct kvm_vcpu *vcpu, gpa_t gpa,
653
		       const u8 *new, int bytes);
654
int kvm_mmu_unprotect_page_virt(struct kvm_vcpu *vcpu, gva_t gva);
655
void __kvm_mmu_free_some_pages(struct kvm_vcpu *vcpu);
A
Avi Kivity 已提交
656 657
int kvm_mmu_load(struct kvm_vcpu *vcpu);
void kvm_mmu_unload(struct kvm_vcpu *vcpu);
A
Avi Kivity 已提交
658

659 660 661
int kvm_emulate_hypercall(struct kvm_vcpu *vcpu);

int kvm_fix_hypercall(struct kvm_vcpu *vcpu);
662

663 664
long kvm_arch_dev_ioctl(struct file *filp,
			unsigned int ioctl, unsigned long arg);
665 666 667 668 669
long kvm_arch_vcpu_ioctl(struct file *filp,
			 unsigned int ioctl, unsigned long arg);
void kvm_arch_vcpu_load(struct kvm_vcpu *vcpu, int cpu);
void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu);

670 671
__init void kvm_arch_init(void);

672 673 674 675 676 677 678 679 680 681
/* Set PF_VCPU in the current task's flags. */
static inline void kvm_guest_enter(void)
{
	current->flags = current->flags | PF_VCPU;
}

/* Clear PF_VCPU in the current task's flags. */
static inline void kvm_guest_exit(void)
{
	current->flags = current->flags & ~PF_VCPU;
}

A
Avi Kivity 已提交
682 683 684 685 686
/*
 * Dispatch a page fault at @gva to the page_fault handler of the vcpu's
 * current mmu mode and return that handler's result.
 */
static inline int kvm_mmu_page_fault(struct kvm_vcpu *vcpu, gva_t gva,
				     u32 error_code)
{
	int ret = (*vcpu->mmu.page_fault)(vcpu, gva, error_code);

	return ret;
}
687

688 689 690 691 692 693
/*
 * Call __kvm_mmu_free_some_pages() when the VM's n_free_mmu_pages has
 * dropped below KVM_MIN_FREE_MMU_PAGES; otherwise do nothing.
 */
static inline void kvm_mmu_free_some_pages(struct kvm_vcpu *vcpu)
{
	if (likely(vcpu->kvm->n_free_mmu_pages >= KVM_MIN_FREE_MMU_PAGES))
		return;

	__kvm_mmu_free_some_pages(vcpu);
}

A
Avi Kivity 已提交
694 695 696 697 698 699 700 701
/*
 * Make sure the vcpu has an mmu root.  Returns 0 when root_hpa is already
 * valid; otherwise returns the result of kvm_mmu_load().
 */
static inline int kvm_mmu_reload(struct kvm_vcpu *vcpu)
{
	if (unlikely(vcpu->mmu.root_hpa == INVALID_PAGE))
		return kvm_mmu_load(vcpu);

	return 0;
}

A
Avi Kivity 已提交
702 703 704 705 706 707 708 709 710
/*
 * Nonzero when EFER_LME is set in the vcpu's shadow_efer.  Always 0 on
 * builds without CONFIG_X86_64.
 */
static inline int is_long_mode(struct kvm_vcpu *vcpu)
{
#ifndef CONFIG_X86_64
	return 0;
#else
	return vcpu->shadow_efer & EFER_LME;
#endif
}

A
Avi Kivity 已提交
711 712
static inline int is_pae(struct kvm_vcpu *vcpu)
{
713
	return vcpu->cr4 & X86_CR4_PAE;
A
Avi Kivity 已提交
714 715 716 717
}

static inline int is_pse(struct kvm_vcpu *vcpu)
{
718
	return vcpu->cr4 & X86_CR4_PSE;
A
Avi Kivity 已提交
719 720 721 722
}

static inline int is_paging(struct kvm_vcpu *vcpu)
{
723
	return vcpu->cr0 & X86_CR0_PG;
A
Avi Kivity 已提交
724 725 726 727 728 729 730 731 732 733 734
}

/*
 * Index of @slot within kvm->memslots[].  @slot must point into that
 * array.
 */
static inline int memslot_id(struct kvm *kvm, struct kvm_memory_slot *slot)
{
	return slot - &kvm->memslots[0];
}

/*
 * Map the host physical address of a shadow page to its kvm_mmu_page,
 * which is read from the private field of the backing struct page.
 */
static inline struct kvm_mmu_page *page_header(hpa_t shadow_page)
{
	struct page *page = pfn_to_page(shadow_page >> PAGE_SHIFT);

	return (struct kvm_mmu_page *)page_private(page);
}

static inline u16 read_fs(void)
{
	u16 seg;
M
Mike Day 已提交
741
	asm("mov %%fs, %0" : "=g"(seg));
A
Avi Kivity 已提交
742 743 744 745 746 747
	return seg;
}

static inline u16 read_gs(void)
{
	u16 seg;
M
Mike Day 已提交
748
	asm("mov %%gs, %0" : "=g"(seg));
A
Avi Kivity 已提交
749 750 751 752 753 754
	return seg;
}

static inline u16 read_ldt(void)
{
	u16 ldt;
M
Mike Day 已提交
755
	asm("sldt %0" : "=g"(ldt));
A
Avi Kivity 已提交
756 757 758 759 760
	return ldt;
}

/* Load selector @sel into %fs. */
static inline void load_fs(u16 sel)
{
	asm("mov %0, %%fs" : : "rm"(sel));
}

/* Load selector @sel into %gs. */
static inline void load_gs(u16 sel)
{
	asm("mov %0, %%gs" : : "rm"(sel));
}

/* Only defined when no load_ldt macro is already in effect. */
#ifndef load_ldt
/* Load selector @sel into the LDT register (lldt). */
static inline void load_ldt(u16 sel)
{
	asm("lldt %0" : : "rm"(sel));
}
#endif

static inline void get_idt(struct descriptor_table *table)
{
M
Mike Day 已提交
778
	asm("sidt %0" : "=m"(*table));
A
Avi Kivity 已提交
779 780 781 782
}

static inline void get_gdt(struct descriptor_table *table)
{
M
Mike Day 已提交
783
	asm("sgdt %0" : "=m"(*table));
A
Avi Kivity 已提交
784 785 786 787 788
}

static inline unsigned long read_tr_base(void)
{
	u16 tr;
M
Mike Day 已提交
789
	asm("str %0" : "=g"(tr));
A
Avi Kivity 已提交
790 791 792
	return segment_base(tr);
}

793
#ifdef CONFIG_X86_64
/* Read MSR @msr with rdmsrl() and return its value (64-bit builds only). */
static inline unsigned long read_msr(unsigned long msr)
{
	u64 value;

	rdmsrl(msr, value);
	return value;
}
#endif

803
static inline void fx_save(struct i387_fxsave_struct *image)
A
Avi Kivity 已提交
804
{
M
Mike Day 已提交
805
	asm("fxsave (%0)":: "r" (image));
A
Avi Kivity 已提交
806 807
}

808
static inline void fx_restore(struct i387_fxsave_struct *image)
A
Avi Kivity 已提交
809
{
M
Mike Day 已提交
810
	asm("fxrstor (%0)":: "r" (image));
A
Avi Kivity 已提交
811 812 813 814
}

/* Execute finit to initialize the FPU. */
static inline void fpu_init(void)
{
	asm("finit");
}

/* Initial RDX value: the constant 0x600. */
static inline u32 get_rdx_init_val(void)
{
	const u32 rdx_init = 0x600; /* P6 family */

	return rdx_init;
}

#define ASM_VMX_VMCLEAR_RAX       ".byte 0x66, 0x0f, 0xc7, 0x30"
#define ASM_VMX_VMLAUNCH          ".byte 0x0f, 0x01, 0xc2"
#define ASM_VMX_VMRESUME          ".byte 0x0f, 0x01, 0xc3"
#define ASM_VMX_VMPTRLD_RAX       ".byte 0x0f, 0xc7, 0x30"
#define ASM_VMX_VMREAD_RDX_RAX    ".byte 0x0f, 0x78, 0xd0"
#define ASM_VMX_VMWRITE_RAX_RDX   ".byte 0x0f, 0x79, 0xd0"
#define ASM_VMX_VMWRITE_RSP_RDX   ".byte 0x0f, 0x79, 0xd4"
#define ASM_VMX_VMXOFF            ".byte 0x0f, 0x01, 0xc4"
#define ASM_VMX_VMXON_RAX         ".byte 0xf3, 0x0f, 0xc7, 0x30"

#define MSR_IA32_TIME_STAMP_COUNTER		0x010

#define TSS_IOPB_BASE_OFFSET 0x66
#define TSS_BASE_SIZE 0x68
#define TSS_IOPB_SIZE (65536 / 8)
#define TSS_REDIRECTION_SIZE (256 / 8)
#define RMODE_TSS_SIZE (TSS_BASE_SIZE + TSS_REDIRECTION_SIZE + TSS_IOPB_SIZE + 1)

#endif