/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License, version 2, as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
 *
 * Copyright IBM Corp. 2007
 *
 * Authors: Hollis Blanchard <hollisb@us.ibm.com>
 */

#ifndef __POWERPC_KVM_HOST_H__
#define __POWERPC_KVM_HOST_H__

#include <linux/mutex.h>
#include <linux/hrtimer.h>
#include <linux/interrupt.h>
#include <linux/types.h>
#include <linux/kvm_types.h>
#include <linux/threads.h>
#include <linux/spinlock.h>
#include <linux/kvm_para.h>
#include <linux/list.h>
#include <linux/atomic.h>
#include <asm/kvm_asm.h>
#include <asm/processor.h>
#include <asm/page.h>

/* Sizing limits.  The vcpu and vcore limits both expand to NR_CPUS. */
#define KVM_MAX_VCPUS		NR_CPUS
#define KVM_MAX_VCORES		NR_CPUS
#define KVM_MEMORY_SLOTS 32
/* memory slots that are not exposed to userspace */
#define KVM_PRIVATE_MEM_SLOTS 4
/* Total slot count: the regular slots plus the private ones. */
#define KVM_MEM_SLOTS_NUM (KVM_MEMORY_SLOTS + KVM_PRIVATE_MEM_SLOTS)

#ifdef CONFIG_KVM_MMIO
#define KVM_COALESCED_MMIO_PAGE_OFFSET 1
#endif

#ifdef CONFIG_KVM_BOOK3S_64_HV
#include <linux/mmu_notifier.h>

#define KVM_ARCH_WANT_MMU_NOTIFIER

/*
 * Host-virtual-address (hva) hooks.  They are only declared here, and
 * only when CONFIG_KVM_BOOK3S_64_HV is set; the definitions live
 * outside this header.
 */
struct kvm;
extern int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
extern int kvm_age_hva(struct kvm *kvm, unsigned long hva);
extern int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
extern void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);

#endif

/*
 * We don't currently support large pages.
 * The argument x is ignored by both function-like macros below.
 */
#define KVM_HPAGE_GFN_SHIFT(x)	0
#define KVM_NR_PAGE_SIZES	1
#define KVM_PAGES_PER_HPAGE(x)	(1UL<<31)

/*
 * HPTEG cache and hash sizing.  Each HPTEG_HASH_NUM_* value is two to
 * the power of the matching HPTEG_HASH_BITS_* value.
 */
#define HPTEG_CACHE_NUM			(1 << 15)
#define HPTEG_HASH_BITS_PTE		13
#define HPTEG_HASH_BITS_PTE_LONG	12
#define HPTEG_HASH_BITS_VPTE		13
#define HPTEG_HASH_BITS_VPTE_LONG	5
#define HPTEG_HASH_NUM_PTE		(1 << HPTEG_HASH_BITS_PTE)
#define HPTEG_HASH_NUM_PTE_LONG		(1 << HPTEG_HASH_BITS_PTE_LONG)
#define HPTEG_HASH_NUM_VPTE		(1 << HPTEG_HASH_BITS_VPTE)
#define HPTEG_HASH_NUM_VPTE_LONG	(1 << HPTEG_HASH_BITS_VPTE_LONG)

/* Physical Address Mask - allowed range of real mode RAM access */
#define KVM_PAM			0x0fffffffffffffffULL

/* Forward declarations: these types are used below only through pointers. */
struct kvm;
struct kvm_run;
struct kvm_vcpu;

struct lppaca;
struct slb_shadow;
struct dtl;

87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107
struct kvm_vm_stat {
	u32 remote_tlb_flush;
};

/*
 * Per-vcpu statistics fields, all u32.  The trailing group exists only
 * when CONFIG_PPC_BOOK3S is set.
 */
struct kvm_vcpu_stat {
	u32 sum_exits;
	u32 mmio_exits;
	u32 dcr_exits;
	u32 signal_exits;
	u32 light_exits;
	/* Account for special types of light exits: */
	u32 itlb_real_miss_exits;
	u32 itlb_virt_miss_exits;
	u32 dtlb_real_miss_exits;
	u32 dtlb_virt_miss_exits;
	u32 syscall_exits;
	u32 isi_exits;
	u32 dsi_exits;
	u32 emulated_inst_exits;
	u32 dec_exits;
	u32 ext_intr_exits;
	u32 halt_wakeup;
#ifdef CONFIG_PPC_BOOK3S
	u32 pf_storage;
	u32 pf_instruc;
	u32 sp_storage;
	u32 sp_instruc;
	u32 queue_intr;
	u32 ld;
	u32 ld_slow;
	u32 st;
	u32 st_slow;
#endif
};

/*
 * Exit-type indices.  __NUMBER_OF_KVM_EXIT_TYPES must stay the last
 * enumerator: it equals the number of real entries and sizes the
 * per-exit-type timing arrays in struct kvm_vcpu_arch.
 */
enum kvm_exit_types {
	MMIO_EXITS,
	DCR_EXITS,
	SIGNAL_EXITS,
	ITLB_REAL_MISS_EXITS,
	ITLB_VIRT_MISS_EXITS,
	DTLB_REAL_MISS_EXITS,
	DTLB_VIRT_MISS_EXITS,
	SYSCALL_EXITS,
	ISI_EXITS,
	DSI_EXITS,
	EMULATED_INST_EXITS,
	EMULATED_MTMSRWE_EXITS,
	EMULATED_WRTEE_EXITS,
	EMULATED_MTSPR_EXITS,
	EMULATED_MFSPR_EXITS,
	EMULATED_MTMSR_EXITS,
	EMULATED_MFMSR_EXITS,
	EMULATED_TLBSX_EXITS,
	EMULATED_TLBWE_EXITS,
	EMULATED_RFI_EXITS,
	DEC_EXITS,
	EXT_INTR_EXITS,
	HALT_WAKEUP,
	USR_PR_INST,
	FP_UNAVAIL,
	DEBUG_EXITS,
	TIMEINGUEST,
	__NUMBER_OF_KVM_EXIT_TYPES
};

/* allow access to big endian 32bit upper/lower parts and 64bit var */
154
struct kvmppc_exit_timing {
155 156 157 158 159 160 161 162
	union {
		u64 tv64;
		struct {
			u32 tbu, tbl;
		} tv32;
	};
};

163 164 165 166 167
struct kvmppc_pginfo {
	unsigned long pfn;
	atomic_t refcnt;
};

168 169 170 171 172 173 174 175
struct kvmppc_spapr_tce_table {
	struct list_head list;
	struct kvm *kvm;
	u64 liobn;
	u32 window_size;
	struct page *pages[0];
};

176 177 178 179 180 181 182 183
struct kvmppc_rma_info {
	void		*base_virt;
	unsigned long	 base_pfn;
	unsigned long	 npages;
	struct list_head list;
	atomic_t 	 use_count;
};

/*
 * The reverse mapping array has one entry for each HPTE,
 * which stores the guest's view of the second word of the HPTE
 * (including the guest physical address of the mapping),
 * plus forward and backward pointers in a doubly-linked ring
 * of HPTEs that map the same host page.  The pointers in this
 * ring are 32-bit HPTE indexes, to save space.
 */
struct revmap_entry {
	unsigned long guest_rpte;
	unsigned int forw, back;
};

/*
 * We use the top bit of each memslot->rmap entry as a lock bit,
 * bit 32 as a present flag and bit 33 (KVMPPC_RMAP_REFERENCED) as a
 * referenced flag.  The bottom 32 bits are the index in the guest
 * HPT of a HPTE that points to the page.
 */
#define KVMPPC_RMAP_LOCK_BIT	63
#define KVMPPC_RMAP_REF_BIT	33
#define KVMPPC_RMAP_REFERENCED	(1ul << KVMPPC_RMAP_REF_BIT)
#define KVMPPC_RMAP_PRESENT	0x100000000ul
#define KVMPPC_RMAP_INDEX	0xfffffffful

/* Low-order bits in kvm->arch.slot_phys[][] */
#define KVMPPC_PAGE_ORDER_MASK	0x1f
#define KVMPPC_PAGE_NO_CACHE	HPTE_R_I	/* 0x20 */
#define KVMPPC_PAGE_WRITETHRU	HPTE_R_W	/* 0x40 */
#define KVMPPC_GOT_PAGE		0x80

/*
 * Architecture-specific per-VM state.  Every member is guarded by
 * CONFIG_KVM_BOOK3S_64_HV; without that option the structure has no
 * members.
 */
struct kvm_arch {
#ifdef CONFIG_KVM_BOOK3S_64_HV
	unsigned long hpt_virt;
	struct revmap_entry *revmap;
	unsigned int lpid;
	unsigned int host_lpid;
	unsigned long host_lpcr;
	unsigned long sdr1;
	unsigned long host_sdr1;
	int tlbie_lock;
	unsigned long lpcr;
	unsigned long rmor;
	struct kvmppc_rma_info *rma;
	unsigned long vrma_slb_v;
	int rma_setup_done;
	int using_mmu_notifiers;
	struct list_head spapr_tce_tables;
	spinlock_t slot_phys_lock;
	/* One entry per memory slot, private slots included. */
	unsigned long *slot_phys[KVM_MEM_SLOTS_NUM];
	int slot_npages[KVM_MEM_SLOTS_NUM];
	unsigned short last_vcpu[NR_CPUS];
	struct kvmppc_vcore *vcores[KVM_MAX_VCORES];
#endif /* CONFIG_KVM_BOOK3S_64_HV */
};

239 240 241 242 243 244 245 246 247
/*
 * Struct for a virtual core.
 * Note: entry_exit_count combines an entry count in the bottom 8 bits
 * and an exit count in the next 8 bits.  This is so that we can
 * atomically increment the entry count iff the exit count is 0
 * without taking the lock.
 */
struct kvmppc_vcore {
	int n_runnable;
248
	int n_busy;
249 250 251 252
	int num_threads;
	int entry_exit_count;
	int n_woken;
	int nap_count;
253
	int napping_threads;
254
	u16 pcpu;
255
	u8 vcore_state;
256 257 258
	u8 in_guest;
	struct list_head runnable_threads;
	spinlock_t lock;
259
	wait_queue_head_t wq;
260 261 262 263 264
};

/*
 * Accessors for the two counts packed into entry_exit_count:
 * the entry count is the low 8 bits, the exit count is everything
 * above them.  vc is a pointer to a structure with that member.
 */
#define VCORE_ENTRY_COUNT(vc)	((vc)->entry_exit_count & 0xff)
#define VCORE_EXIT_COUNT(vc)	((vc)->entry_exit_count >> 8)

/* Values for vcore_state */
#define VCORE_INACTIVE	0
#define VCORE_RUNNING	1
#define VCORE_EXITING	2
#define VCORE_SLEEPING	3

A
Alexander Graf 已提交
271
struct kvmppc_pte {
A
Alexander Graf 已提交
272
	ulong eaddr;
A
Alexander Graf 已提交
273
	u64 vpage;
A
Alexander Graf 已提交
274
	ulong raddr;
A
Alexander Graf 已提交
275 276 277
	bool may_read		: 1;
	bool may_write		: 1;
	bool may_execute	: 1;
A
Alexander Graf 已提交
278 279 280 281 282 283 284 285 286 287 288 289 290 291 292
};

/*
 * Table of MMU operation hooks.  Every hook takes the vcpu it operates
 * on as its first argument.
 */
struct kvmppc_mmu {
	/* book3s_64 only */
	void (*slbmte)(struct kvm_vcpu *vcpu, u64 rb, u64 rs);
	u64  (*slbmfee)(struct kvm_vcpu *vcpu, u64 slb_nr);
	u64  (*slbmfev)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbie)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbia)(struct kvm_vcpu *vcpu);
	/* book3s */
	void (*mtsrin)(struct kvm_vcpu *vcpu, u32 srnum, ulong value);
	u32  (*mfsrin)(struct kvm_vcpu *vcpu, u32 srnum);
	int  (*xlate)(struct kvm_vcpu *vcpu, gva_t eaddr, struct kvmppc_pte *pte, bool data);
	void (*reset_msr)(struct kvm_vcpu *vcpu);
	void (*tlbie)(struct kvm_vcpu *vcpu, ulong addr, bool large);
	int  (*esid_to_vsid)(struct kvm_vcpu *vcpu, ulong esid, u64 *vsid);
	u64  (*ea_to_vp)(struct kvm_vcpu *vcpu, gva_t eaddr, bool data);
	bool (*is_dcbz32)(struct kvm_vcpu *vcpu);
};

298 299 300 301 302 303 304 305 306 307 308 309
struct kvmppc_slb {
	u64 esid;
	u64 vsid;
	u64 orige;
	u64 origv;
	bool valid	: 1;
	bool Ks		: 1;
	bool Kp		: 1;
	bool nx		: 1;
	bool large	: 1;	/* PTEs are 16MB */
	bool tb		: 1;	/* 1TB segment */
	bool class	: 1;
A
Alexander Graf 已提交
310 311
};

312
struct kvm_vcpu_arch {
A
Alexander Graf 已提交
313
	ulong host_stack;
314
	u32 host_pid;
315
#ifdef CONFIG_PPC_BOOK3S
316
	struct kvmppc_slb slb[64];
317
	int slb_max;		/* 1 + index of last valid entry in slb[] */
318
	int slb_nr;		/* total number of entries in SLB */
A
Alexander Graf 已提交
319 320
	struct kvmppc_mmu mmu;
#endif
321

322
	ulong gpr[32];
323

324
	u64 fpr[32];
A
Alexander Graf 已提交
325
	u64 fpscr;
326

327 328 329 330 331 332
#ifdef CONFIG_SPE
	ulong evr[32];
	ulong spefscr;
	ulong host_spefscr;
	u64 acc;
#endif
333 334 335 336 337 338
#ifdef CONFIG_ALTIVEC
	vector128 vr[32];
	vector128 vscr;
#endif

#ifdef CONFIG_VSX
339
	u64 vsr[64];
340 341
#endif

A
Alexander Graf 已提交
342 343 344 345 346
#ifdef CONFIG_PPC_BOOK3S
	/* For Gekko paired singles */
	u32 qpr[32];
#endif

347 348 349
	ulong pc;
	ulong ctr;
	ulong lr;
350

351
	ulong xer;
352
	u32 cr;
353

354
#ifdef CONFIG_PPC_BOOK3S
A
Alexander Graf 已提交
355
	ulong hflags;
356
	ulong guest_owned_ext;
357 358 359 360 361 362 363
	ulong purr;
	ulong spurr;
	ulong dscr;
	ulong amr;
	ulong uamor;
	u32 ctrl;
	ulong dabr;
A
Alexander Graf 已提交
364
#endif
365
	u32 vrsave; /* also USPRG0 */
366
	u32 mmucr;
S
Scott Wood 已提交
367
	ulong shadow_msr;
368 369 370 371
	ulong csrr0;
	ulong csrr1;
	ulong dsrr0;
	ulong dsrr1;
S
Scott Wood 已提交
372 373 374
	ulong mcsrr0;
	ulong mcsrr1;
	ulong mcsr;
375 376 377 378 379
	u32 dec;
	u32 decar;
	u32 tbl;
	u32 tbu;
	u32 tcr;
380
	ulong tsr; /* we need to perform set/clr_bits() which requires ulong */
381
	u32 ivor[64];
382
	ulong ivpr;
A
Alexander Graf 已提交
383
	u32 pvr;
384 385

	u32 shadow_pid;
L
Liu Yu 已提交
386
	u32 shadow_pid1;
387
	u32 pid;
388 389
	u32 swap_pid;

390 391 392 393
	u32 ccr0;
	u32 ccr1;
	u32 dbcr0;
	u32 dbcr1;
394
	u32 dbsr;
395

396
	u64 mmcr[3];
397
	u32 pmc[8];
398

399
#ifdef CONFIG_KVM_EXIT_TIMING
400
	struct mutex exit_timing_lock;
401 402
	struct kvmppc_exit_timing timing_exit;
	struct kvmppc_exit_timing timing_last_enter;
403 404 405 406 407 408 409 410 411 412
	u32 last_exit_type;
	u32 timing_count_type[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_quad_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_min_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_max_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_last_exit;
	struct dentry *debugfs_exit_timing;
#endif

413 414 415 416 417
#ifdef CONFIG_PPC_BOOK3S
	ulong fault_dar;
	u32 fault_dsisr;
#endif

418
#ifdef CONFIG_BOOKE
419 420
	ulong fault_dear;
	ulong fault_esr;
421 422
	ulong queued_dear;
	ulong queued_esr;
423
#endif
424 425 426 427
	gpa_t paddr_accessed;

	u8 io_gpr; /* GPR used as IO source/target */
	u8 mmio_is_bigendian;
A
Alexander Graf 已提交
428
	u8 mmio_sign_extend;
429 430
	u8 dcr_needed;
	u8 dcr_is_write;
431 432
	u8 osi_needed;
	u8 osi_enabled;
A
Alexander Graf 已提交
433
	u8 papr_enabled;
434 435
	u8 sane;
	u8 cpu_type;
436
	u8 hcall_needed;
437 438 439

	u32 cpr0_cfgaddr; /* holds the last set cpr0_cfgaddr */

A
Alexander Graf 已提交
440 441
	struct hrtimer dec_timer;
	struct tasklet_struct tasklet;
A
Alexander Graf 已提交
442
	u64 dec_jiffies;
443
	u64 dec_expires;
444
	unsigned long pending_exceptions;
445
	u16 last_cpu;
446 447
	u8 ceded;
	u8 prodded;
448
	u32 last_inst;
449 450 451 452 453

	struct lppaca *vpa;
	struct slb_shadow *slb_shadow;
	struct dtl *dtl;
	struct dtl *dtl_end;
454

455
	wait_queue_head_t *wqp;
456 457
	struct kvmppc_vcore *vcore;
	int ret;
458
	int trap;
459 460
	int state;
	int ptid;
461
	bool timer_running;
462 463
	wait_queue_head_t cpu_run;

A
Alexander Graf 已提交
464
	struct kvm_vcpu_arch_shared *shared;
A
Alexander Graf 已提交
465 466
	unsigned long magic_page_pa; /* phys addr to map the magic page to */
	unsigned long magic_page_ea; /* effect. addr to map the magic page to */
467 468 469

#ifdef CONFIG_KVM_BOOK3S_64_HV
	struct kvm_vcpu_arch_shared shregs;
470

471 472 473 474
	unsigned long pgfault_addr;
	long pgfault_index;
	unsigned long pgfault_hpte[2];

475 476 477
	struct list_head run_list;
	struct task_struct *run_task;
	struct kvm_run *kvm_run;
478
	pgd_t *pgdir;
479
#endif
480 481
};

/* Values for vcpu->arch.state */
#define KVMPPC_VCPU_STOPPED		0
#define KVMPPC_VCPU_BUSY_IN_HOST	1
#define KVMPPC_VCPU_RUNNABLE		2

#endif /* __POWERPC_KVM_HOST_H__ */