kvm_host.h 11.0 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License, version 2, as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
 *
 * Copyright IBM Corp. 2007
 *
 * Authors: Hollis Blanchard <hollisb@us.ibm.com>
 */

#ifndef __POWERPC_KVM_HOST_H__
#define __POWERPC_KVM_HOST_H__

#include <linux/mutex.h>
A
Alexander Graf 已提交
24 25
#include <linux/hrtimer.h>
#include <linux/interrupt.h>
26 27
#include <linux/types.h>
#include <linux/kvm_types.h>
28 29
#include <linux/threads.h>
#include <linux/spinlock.h>
A
Alexander Graf 已提交
30
#include <linux/kvm_para.h>
31 32
#include <linux/list.h>
#include <linux/atomic.h>
33
#include <asm/kvm_asm.h>
34
#include <asm/processor.h>
35
#include <asm/page.h>
36

37 38
/*
 * Maximum number of virtual CPUs and virtual cores (per the macro
 * names); both limits are defined as NR_CPUS.  KVM_MAX_VCORES sizes
 * the vcores[] array in struct kvm_arch.
 */
#define KVM_MAX_VCPUS		NR_CPUS
#define KVM_MAX_VCORES		NR_CPUS
39 40 41
/* Number of regular memory slots. */
#define KVM_MEMORY_SLOTS 32
/* Memory slots that are not exposed to userspace. */
#define KVM_PRIVATE_MEM_SLOTS 4
/* Total slot count: the regular slots plus the private ones. */
#define KVM_MEM_SLOTS_NUM (KVM_MEMORY_SLOTS + KVM_PRIVATE_MEM_SLOTS)
43

44
#ifdef CONFIG_KVM_MMIO
/*
 * Only defined when CONFIG_KVM_MMIO is set.
 * NOTE(review): presumably the page offset of the coalesced-MMIO area
 * within the vcpu mapping - confirm against the generic KVM code.
 */
#define KVM_COALESCED_MMIO_PAGE_OFFSET 1
#endif
47

48 49 50 51 52 53 54 55 56 57 58 59 60
#ifdef CONFIG_KVM_BOOK3S_64_HV
#include <linux/mmu_notifier.h>

/*
 * Defined only for CONFIG_KVM_BOOK3S_64_HV builds.
 * NOTE(review): presumably tells the generic KVM code to call the
 * hva hooks declared below - confirm.
 */
#define KVM_ARCH_WANT_MMU_NOTIFIER

struct kvm;

/*
 * Hooks keyed by host virtual address (hva); they are only declared
 * here, the definitions live elsewhere.
 */
int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
int kvm_age_hva(struct kvm *kvm, unsigned long hva);
int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);

#endif

61
/*
 * We don't currently support large pages: there is a single page size
 * and the huge-page GFN shift is always 0, whatever level is passed.
 */
#define KVM_HPAGE_GFN_SHIFT(x)	0
#define KVM_NR_PAGE_SIZES	1
#define KVM_PAGES_PER_HPAGE(x)	(1UL<<31)
65

66 67
/*
 * HPTEG cache sizing.  Each HPTEG_HASH_BITS_* value is the width in
 * bits of one hash, and the matching HPTEG_HASH_NUM_* is the resulting
 * bucket count (1 << bits).
 */
#define HPTEG_CACHE_NUM			(1 << 15)
#define HPTEG_HASH_BITS_PTE		13
#define HPTEG_HASH_BITS_PTE_LONG	12
#define HPTEG_HASH_BITS_VPTE		13
#define HPTEG_HASH_BITS_VPTE_LONG	5
#define HPTEG_HASH_NUM_PTE		(1 << HPTEG_HASH_BITS_PTE)
#define HPTEG_HASH_NUM_PTE_LONG		(1 << HPTEG_HASH_BITS_PTE_LONG)
#define HPTEG_HASH_NUM_VPTE		(1 << HPTEG_HASH_BITS_VPTE)
#define HPTEG_HASH_NUM_VPTE_LONG	(1 << HPTEG_HASH_BITS_VPTE_LONG)
A
Alexander Graf 已提交
75

A
Alexander Graf 已提交
76 77 78
/*
 * Physical Address Mask - allowed range of real mode RAM access.
 * The mask has the low 60 bits set and the top four bits clear.
 */
#define KVM_PAM			0x0fffffffffffffffULL

79 80 81 82
/*
 * Forward declarations: this header only refers to these types
 * through pointers, so their full definitions are not needed here.
 */
struct kvm;
struct kvm_run;
struct kvm_vcpu;

83 84 85 86
/*
 * Forward declarations for types that struct kvm_vcpu_arch holds
 * only as pointers (vpa, slb_shadow, dtl, dtl_end).
 */
struct lppaca;
struct slb_shadow;
struct dtl;

87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107
/* VM-wide statistics (per the struct name); a single 32-bit field. */
struct kvm_vm_stat {
	u32 remote_tlb_flush;
};

/*
 * Per-VCPU statistics, all 32-bit fields.  The trailing group of
 * fields exists only when CONFIG_PPC_BOOK3S is set.
 */
struct kvm_vcpu_stat {
	u32 sum_exits;
	u32 mmio_exits;
	u32 dcr_exits;
	u32 signal_exits;
	u32 light_exits;
	/* Account for special types of light exits: */
	u32 itlb_real_miss_exits;
	u32 itlb_virt_miss_exits;
	u32 dtlb_real_miss_exits;
	u32 dtlb_virt_miss_exits;
	u32 syscall_exits;
	u32 isi_exits;
	u32 dsi_exits;
	u32 emulated_inst_exits;
	u32 dec_exits;
	u32 ext_intr_exits;
	u32 halt_wakeup;
#ifdef CONFIG_PPC_BOOK3S
	u32 pf_storage;
	u32 pf_instruc;
	u32 sp_storage;
	u32 sp_instruc;
	u32 queue_intr;
	u32 ld;
	u32 ld_slow;
	u32 st;
	u32 st_slow;
#endif
};

122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153
/*
 * Exit categories.  The values are consecutive starting at 0, so the
 * final enumerator doubles as the number of categories; it sizes the
 * timing_* arrays in struct kvm_vcpu_arch.
 */
enum kvm_exit_types {
	MMIO_EXITS = 0,
	DCR_EXITS,
	SIGNAL_EXITS,

	/* TLB misses */
	ITLB_REAL_MISS_EXITS,
	ITLB_VIRT_MISS_EXITS,
	DTLB_REAL_MISS_EXITS,
	DTLB_VIRT_MISS_EXITS,

	SYSCALL_EXITS,
	ISI_EXITS,
	DSI_EXITS,

	/* Emulated instructions */
	EMULATED_INST_EXITS,
	EMULATED_MTMSRWE_EXITS,
	EMULATED_WRTEE_EXITS,
	EMULATED_MTSPR_EXITS,
	EMULATED_MFSPR_EXITS,
	EMULATED_MTMSR_EXITS,
	EMULATED_MFMSR_EXITS,
	EMULATED_TLBSX_EXITS,
	EMULATED_TLBWE_EXITS,
	EMULATED_RFI_EXITS,

	DEC_EXITS,
	EXT_INTR_EXITS,
	HALT_WAKEUP,
	USR_PR_INST,
	FP_UNAVAIL,
	DEBUG_EXITS,
	TIMEINGUEST,

	/* Must stay last: count of the enumerators above. */
	__NUMBER_OF_KVM_EXIT_TYPES
};

/* allow access to big endian 32bit upper/lower parts and 64bit var */
154
struct kvmppc_exit_timing {
155 156 157 158 159 160 161 162
	union {
		u64 tv64;
		struct {
			u32 tbu, tbl;
		} tv32;
	};
};

163 164 165 166 167
/* Pairs a pfn with an atomic reference count for it. */
struct kvmppc_pginfo {
	unsigned long pfn;
	atomic_t refcnt;
};

168 169 170 171 172 173 174 175
/*
 * One TCE table, linked through 'list' (struct kvm_arch keeps a
 * spapr_tce_tables list head) and pointing back at its owning VM.
 *
 * 'pages' is a trailing variable-length array, so the structure must
 * be allocated with room for the page pointers after it.  It is
 * declared as a C99 flexible array member rather than the GNU
 * zero-length array extension; sizeof(struct kvmppc_spapr_tce_table)
 * is unchanged.
 */
struct kvmppc_spapr_tce_table {
	struct list_head list;
	struct kvm *kvm;
	u64 liobn;
	u32 window_size;
	struct page *pages[];
};

176 177 178 179 180 181 182 183
/*
 * Describes one RMA region: its base as a kernel virtual pointer and
 * as a pfn, its size in pages, list linkage and an atomic use count.
 * NOTE(review): "RMA" presumably means real mode area - confirm.
 */
struct kvmppc_rma_info {
	void		*base_virt;
	unsigned long	 base_pfn;
	unsigned long	 npages;
	struct list_head list;
	atomic_t 	 use_count;
};

184 185 186
/*
 * The reverse mapping array has one entry for each HPTE,
 * which stores the guest's view of the second word of the HPTE
 * (including the guest physical address of the mapping),
 * plus forward and backward pointers in a doubly-linked ring
 * of HPTEs that map the same host page.  The pointers in this
 * ring are 32-bit HPTE indexes, to save space.
 */
struct revmap_entry {
	unsigned long guest_rpte;
	unsigned int forw, back;
};

197 198 199 200 201 202
/*
 * We use the top bit of each memslot->rmap entry as a lock bit,
 * and bit 32 as a present flag.  The bottom 32 bits are the
 * index in the guest HPT of a HPTE that points to the page.
 *
 * The REFERENCED and CHANGED flags are the HPTE_R_R / HPTE_R_C bits
 * shifted up by KVMPPC_RMAP_RC_SHIFT so they sit above the index.
 */
#define KVMPPC_RMAP_LOCK_BIT	63
#define KVMPPC_RMAP_RC_SHIFT	32
#define KVMPPC_RMAP_REFERENCED	(HPTE_R_R << KVMPPC_RMAP_RC_SHIFT)
#define KVMPPC_RMAP_CHANGED	(HPTE_R_C << KVMPPC_RMAP_RC_SHIFT)
#define KVMPPC_RMAP_PRESENT	0x100000000ul
#define KVMPPC_RMAP_INDEX	0xfffffffful

209
/*
 * Low-order bits in kvm->arch.slot_phys[][]: a 5-bit page order field
 * followed by single-bit flags.  The no-cache and write-through flags
 * reuse the HPTE_R_I / HPTE_R_W bit values.
 */
#define KVMPPC_PAGE_ORDER_MASK	0x1f
#define KVMPPC_PAGE_NO_CACHE	HPTE_R_I	/* 0x20 */
#define KVMPPC_PAGE_WRITETHRU	HPTE_R_W	/* 0x40 */
#define KVMPPC_GOT_PAGE		0x80

215
/*
 * Per-VM architecture-specific state.  Every member is guarded by
 * CONFIG_KVM_BOOK3S_64_HV, so the structure is empty in other
 * configurations.
 */
struct kvm_arch {
#ifdef CONFIG_KVM_BOOK3S_64_HV
	unsigned long hpt_virt;
	struct revmap_entry *revmap;
	unsigned int lpid;
	unsigned int host_lpid;
	unsigned long host_lpcr;
	unsigned long sdr1;
	unsigned long host_sdr1;
	int tlbie_lock;
	unsigned long lpcr;
	unsigned long rmor;
	struct kvmppc_rma_info *rma;
	unsigned long vrma_slb_v;
	int rma_setup_done;
	int using_mmu_notifiers;
	struct list_head spapr_tce_tables;
	spinlock_t slot_phys_lock;
	/* Per-memslot arrays, one element per slot (private slots included). */
	unsigned long *slot_phys[KVM_MEM_SLOTS_NUM];
	int slot_npages[KVM_MEM_SLOTS_NUM];
	unsigned short last_vcpu[NR_CPUS];
	struct kvmppc_vcore *vcores[KVM_MAX_VCORES];
#endif /* CONFIG_KVM_BOOK3S_64_HV */
};

240 241 242 243 244 245 246 247 248
/*
 * Struct for a virtual core.
 * Note: entry_exit_count combines an entry count in the bottom 8 bits
 * and an exit count in the next 8 bits.  This is so that we can
 * atomically increment the entry count iff the exit count is 0
 * without taking the lock.
 */
struct kvmppc_vcore {
	int n_runnable;
249
	int n_busy;
250 251 252 253
	int num_threads;
	int entry_exit_count;
	int n_woken;
	int nap_count;
254
	int napping_threads;
255
	u16 pcpu;
256
	u8 vcore_state;
257 258 259
	u8 in_guest;
	struct list_head runnable_threads;
	spinlock_t lock;
260
	wait_queue_head_t wq;
261 262 263 264 265
};

/*
 * Accessors for the packed entry_exit_count field of a vcore pointer:
 * the entry count is the low 8 bits, the exit count is the value
 * shifted right by 8 (no further masking is applied).
 */
#define VCORE_ENTRY_COUNT(vc)	((vc)->entry_exit_count & 0xff)
#define VCORE_EXIT_COUNT(vc)	((vc)->entry_exit_count >> 8)

266 267 268 269 270 271
/* Values for vcore_state (the u8 field of struct kvmppc_vcore) */
#define VCORE_INACTIVE	0
#define VCORE_RUNNING	1
#define VCORE_EXITING	2
#define VCORE_SLEEPING	3

A
Alexander Graf 已提交
272
struct kvmppc_pte {
A
Alexander Graf 已提交
273
	ulong eaddr;
A
Alexander Graf 已提交
274
	u64 vpage;
A
Alexander Graf 已提交
275
	ulong raddr;
A
Alexander Graf 已提交
276 277 278
	bool may_read		: 1;
	bool may_write		: 1;
	bool may_execute	: 1;
A
Alexander Graf 已提交
279 280 281 282 283 284 285 286 287 288 289 290 291 292 293
};

/*
 * Table of MMU callbacks, each taking the VCPU it operates on.
 * The first group is marked book3s_64 only; the rest is marked
 * book3s.
 */
struct kvmppc_mmu {
	/* book3s_64 only */
	void (*slbmte)(struct kvm_vcpu *vcpu, u64 rb, u64 rs);
	u64  (*slbmfee)(struct kvm_vcpu *vcpu, u64 slb_nr);
	u64  (*slbmfev)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbie)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbia)(struct kvm_vcpu *vcpu);
	/* book3s */
	void (*mtsrin)(struct kvm_vcpu *vcpu, u32 srnum, ulong value);
	u32  (*mfsrin)(struct kvm_vcpu *vcpu, u32 srnum);
	int  (*xlate)(struct kvm_vcpu *vcpu, gva_t eaddr, struct kvmppc_pte *pte, bool data);
	void (*reset_msr)(struct kvm_vcpu *vcpu);
	void (*tlbie)(struct kvm_vcpu *vcpu, ulong addr, bool large);
	int  (*esid_to_vsid)(struct kvm_vcpu *vcpu, ulong esid, u64 *vsid);
	u64  (*ea_to_vp)(struct kvm_vcpu *vcpu, gva_t eaddr, bool data);
	bool (*is_dcbz32)(struct kvm_vcpu *vcpu);
};

299 300 301 302 303 304 305 306 307 308 309 310
/*
 * One SLB entry; struct kvm_vcpu_arch keeps an array of these in
 * slb[].  Four 64-bit words are followed by one-bit attribute flags.
 */
struct kvmppc_slb {
	u64 esid;
	u64 vsid;
	u64 orige;
	u64 origv;
	bool valid	: 1;
	bool Ks		: 1;
	bool Kp		: 1;
	bool nx		: 1;
	bool large	: 1;	/* PTEs are 16MB */
	bool tb		: 1;	/* 1TB segment */
	bool class	: 1;
};

313
struct kvm_vcpu_arch {
A
Alexander Graf 已提交
314
	ulong host_stack;
315
	u32 host_pid;
316
#ifdef CONFIG_PPC_BOOK3S
317
	struct kvmppc_slb slb[64];
318
	int slb_max;		/* 1 + index of last valid entry in slb[] */
319
	int slb_nr;		/* total number of entries in SLB */
A
Alexander Graf 已提交
320 321
	struct kvmppc_mmu mmu;
#endif
322

323
	ulong gpr[32];
324

325
	u64 fpr[32];
A
Alexander Graf 已提交
326
	u64 fpscr;
327

328 329 330 331 332 333
#ifdef CONFIG_SPE
	ulong evr[32];
	ulong spefscr;
	ulong host_spefscr;
	u64 acc;
#endif
334 335 336 337 338 339
#ifdef CONFIG_ALTIVEC
	vector128 vr[32];
	vector128 vscr;
#endif

#ifdef CONFIG_VSX
340
	u64 vsr[64];
341 342
#endif

A
Alexander Graf 已提交
343 344 345 346 347
#ifdef CONFIG_PPC_BOOK3S
	/* For Gekko paired singles */
	u32 qpr[32];
#endif

348 349 350
	ulong pc;
	ulong ctr;
	ulong lr;
351

352
	ulong xer;
353
	u32 cr;
354

355
#ifdef CONFIG_PPC_BOOK3S
A
Alexander Graf 已提交
356
	ulong hflags;
357
	ulong guest_owned_ext;
358 359 360 361 362 363 364
	ulong purr;
	ulong spurr;
	ulong dscr;
	ulong amr;
	ulong uamor;
	u32 ctrl;
	ulong dabr;
A
Alexander Graf 已提交
365
#endif
366
	u32 vrsave; /* also USPRG0 */
367
	u32 mmucr;
S
Scott Wood 已提交
368
	ulong shadow_msr;
369 370 371 372
	ulong csrr0;
	ulong csrr1;
	ulong dsrr0;
	ulong dsrr1;
S
Scott Wood 已提交
373 374 375
	ulong mcsrr0;
	ulong mcsrr1;
	ulong mcsr;
376 377 378 379 380
	u32 dec;
	u32 decar;
	u32 tbl;
	u32 tbu;
	u32 tcr;
381
	ulong tsr; /* we need to perform set/clr_bits() which requires ulong */
382
	u32 ivor[64];
383
	ulong ivpr;
A
Alexander Graf 已提交
384
	u32 pvr;
385 386

	u32 shadow_pid;
L
Liu Yu 已提交
387
	u32 shadow_pid1;
388
	u32 pid;
389 390
	u32 swap_pid;

391 392 393 394
	u32 ccr0;
	u32 ccr1;
	u32 dbcr0;
	u32 dbcr1;
395
	u32 dbsr;
396

397
	u64 mmcr[3];
398
	u32 pmc[8];
399

400
#ifdef CONFIG_KVM_EXIT_TIMING
401
	struct mutex exit_timing_lock;
402 403
	struct kvmppc_exit_timing timing_exit;
	struct kvmppc_exit_timing timing_last_enter;
404 405 406 407 408 409 410 411 412 413
	u32 last_exit_type;
	u32 timing_count_type[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_quad_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_min_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_max_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_last_exit;
	struct dentry *debugfs_exit_timing;
#endif

414 415 416 417 418
#ifdef CONFIG_PPC_BOOK3S
	ulong fault_dar;
	u32 fault_dsisr;
#endif

419
#ifdef CONFIG_BOOKE
420 421
	ulong fault_dear;
	ulong fault_esr;
422 423
	ulong queued_dear;
	ulong queued_esr;
424
#endif
425 426 427 428
	gpa_t paddr_accessed;

	u8 io_gpr; /* GPR used as IO source/target */
	u8 mmio_is_bigendian;
A
Alexander Graf 已提交
429
	u8 mmio_sign_extend;
430 431
	u8 dcr_needed;
	u8 dcr_is_write;
432 433
	u8 osi_needed;
	u8 osi_enabled;
A
Alexander Graf 已提交
434
	u8 papr_enabled;
435 436
	u8 sane;
	u8 cpu_type;
437
	u8 hcall_needed;
438 439 440

	u32 cpr0_cfgaddr; /* holds the last set cpr0_cfgaddr */

A
Alexander Graf 已提交
441 442
	struct hrtimer dec_timer;
	struct tasklet_struct tasklet;
A
Alexander Graf 已提交
443
	u64 dec_jiffies;
444
	u64 dec_expires;
445
	unsigned long pending_exceptions;
446
	u16 last_cpu;
447 448
	u8 ceded;
	u8 prodded;
449
	u32 last_inst;
450 451 452 453 454

	struct lppaca *vpa;
	struct slb_shadow *slb_shadow;
	struct dtl *dtl;
	struct dtl *dtl_end;
455

456
	wait_queue_head_t *wqp;
457 458
	struct kvmppc_vcore *vcore;
	int ret;
459
	int trap;
460 461
	int state;
	int ptid;
462
	bool timer_running;
463 464
	wait_queue_head_t cpu_run;

A
Alexander Graf 已提交
465
	struct kvm_vcpu_arch_shared *shared;
A
Alexander Graf 已提交
466 467
	unsigned long magic_page_pa; /* phys addr to map the magic page to */
	unsigned long magic_page_ea; /* effect. addr to map the magic page to */
468 469 470

#ifdef CONFIG_KVM_BOOK3S_64_HV
	struct kvm_vcpu_arch_shared shregs;
471

472 473 474 475
	unsigned long pgfault_addr;
	long pgfault_index;
	unsigned long pgfault_hpte[2];

476 477 478
	struct list_head run_list;
	struct task_struct *run_task;
	struct kvm_run *kvm_run;
479
	pgd_t *pgdir;
480
#endif
481 482
};

483 484 485
/* Values for vcpu->arch.state */
#define KVMPPC_VCPU_STOPPED		0
#define KVMPPC_VCPU_BUSY_IN_HOST	1
#define KVMPPC_VCPU_RUNNABLE		2

488
#endif /* __POWERPC_KVM_HOST_H__ */