kvm_host.h 11.4 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License, version 2, as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
 *
 * Copyright IBM Corp. 2007
 *
 * Authors: Hollis Blanchard <hollisb@us.ibm.com>
 */

#ifndef __POWERPC_KVM_HOST_H__
#define __POWERPC_KVM_HOST_H__

#include <linux/mutex.h>
A
Alexander Graf 已提交
24 25
#include <linux/hrtimer.h>
#include <linux/interrupt.h>
26 27
#include <linux/types.h>
#include <linux/kvm_types.h>
28 29
#include <linux/threads.h>
#include <linux/spinlock.h>
A
Alexander Graf 已提交
30
#include <linux/kvm_para.h>
31 32
#include <linux/list.h>
#include <linux/atomic.h>
33
#include <asm/kvm_asm.h>
34
#include <asm/processor.h>
35
#include <asm/page.h>
36

37 38
/* Upper bounds on virtual CPUs and virtual cores; both equal NR_CPUS. */
#define KVM_MAX_VCPUS		NR_CPUS
#define KVM_MAX_VCORES		NR_CPUS

/* Memory slots other than the private ones below. */
#define KVM_MEMORY_SLOTS 32
/* Memory slots that are not exposed to userspace. */
#define KVM_PRIVATE_MEM_SLOTS 4
/* Total slot count: regular slots plus private slots. */
#define KVM_MEM_SLOTS_NUM (KVM_MEMORY_SLOTS + KVM_PRIVATE_MEM_SLOTS)

/* Only defined when MMIO support is configured. */
#ifdef CONFIG_KVM_MMIO
#define KVM_COALESCED_MMIO_PAGE_OFFSET 1
#endif
47

48 49 50 51 52 53 54 55 56 57 58 59 60
#ifdef CONFIG_KVM_BOOK3S_64_HV
#include <linux/mmu_notifier.h>

/* Set only for CONFIG_KVM_BOOK3S_64_HV builds. */
#define KVM_ARCH_WANT_MMU_NOTIFIER

struct kvm;

/*
 * Host-virtual-address (hva) hooks.  They are only declared here; the
 * definitions live outside this header.
 */
int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
int kvm_age_hva(struct kvm *kvm, unsigned long hva);
int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);

#endif /* CONFIG_KVM_BOOK3S_64_HV */

61
/*
 * We don't currently support large pages: a single page size is
 * reported and the huge-page GFN shift is 0 for every level.
 * Both function-like macros ignore their argument.
 */
#define KVM_HPAGE_GFN_SHIFT(x)	0
#define KVM_NR_PAGE_SIZES	1
#define KVM_PAGES_PER_HPAGE(x)	(1UL<<31)
65

66 67
/*
 * HPTEG sizing constants.  Each HPTEG_HASH_NUM_* value is
 * 1 << the matching HPTEG_HASH_BITS_* value.
 */
#define HPTEG_CACHE_NUM			(1 << 15)
#define HPTEG_HASH_BITS_PTE		13
#define HPTEG_HASH_BITS_PTE_LONG	12
#define HPTEG_HASH_BITS_VPTE		13
#define HPTEG_HASH_BITS_VPTE_LONG	5
#define HPTEG_HASH_NUM_PTE		(1 << HPTEG_HASH_BITS_PTE)
#define HPTEG_HASH_NUM_PTE_LONG		(1 << HPTEG_HASH_BITS_PTE_LONG)
#define HPTEG_HASH_NUM_VPTE		(1 << HPTEG_HASH_BITS_VPTE)
#define HPTEG_HASH_NUM_VPTE_LONG	(1 << HPTEG_HASH_BITS_VPTE_LONG)
A
Alexander Graf 已提交
75

A
Alexander Graf 已提交
76 77 78
/*
 * Physical Address Mask - allowed range of real mode RAM access.
 * The low 60 bits are set; the top four bits are clear.
 */
#define KVM_PAM			0x0fffffffffffffffULL

79 80 81 82
/* Forward declarations; this header only uses pointers to these types. */
struct kvm;
struct kvm_run;
struct kvm_vcpu;

struct lppaca;
struct slb_shadow;
struct dtl;

87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107
/* VM-wide statistics; currently a single 32-bit counter. */
struct kvm_vm_stat {
	u32 remote_tlb_flush;
};

/*
 * Per-vcpu statistics counters.  The trailing group of counters is
 * only present when CONFIG_PPC_BOOK3S is set.
 */
struct kvm_vcpu_stat {
	u32 sum_exits;
	u32 mmio_exits;
	u32 dcr_exits;
	u32 signal_exits;
	u32 light_exits;
	/* Account for special types of light exits: */
	u32 itlb_real_miss_exits;
	u32 itlb_virt_miss_exits;
	u32 dtlb_real_miss_exits;
	u32 dtlb_virt_miss_exits;
	u32 syscall_exits;
	u32 isi_exits;
	u32 dsi_exits;
	u32 emulated_inst_exits;
	u32 dec_exits;
	u32 ext_intr_exits;
	u32 halt_wakeup;
#ifdef CONFIG_PPC_BOOK3S
	u32 pf_storage;
	u32 pf_instruc;
	u32 sp_storage;
	u32 sp_instruc;
	u32 queue_intr;
	u32 ld;
	u32 ld_slow;
	u32 st;
	u32 st_slow;
#endif
};

122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153
/*
 * Exit categories.  __NUMBER_OF_KVM_EXIT_TYPES sizes the per-type
 * timing arrays in struct kvm_vcpu_arch, so the enumerators must stay
 * contiguous and the count must stay last.
 */
enum kvm_exit_types {
	MMIO_EXITS = 0,
	DCR_EXITS,
	SIGNAL_EXITS,

	/* TLB misses */
	ITLB_REAL_MISS_EXITS,
	ITLB_VIRT_MISS_EXITS,
	DTLB_REAL_MISS_EXITS,
	DTLB_VIRT_MISS_EXITS,

	SYSCALL_EXITS,
	ISI_EXITS,
	DSI_EXITS,

	/* Emulated instructions */
	EMULATED_INST_EXITS,
	EMULATED_MTMSRWE_EXITS,
	EMULATED_WRTEE_EXITS,
	EMULATED_MTSPR_EXITS,
	EMULATED_MFSPR_EXITS,
	EMULATED_MTMSR_EXITS,
	EMULATED_MFMSR_EXITS,
	EMULATED_TLBSX_EXITS,
	EMULATED_TLBWE_EXITS,
	EMULATED_RFI_EXITS,

	DEC_EXITS,
	EXT_INTR_EXITS,
	HALT_WAKEUP,
	USR_PR_INST,
	FP_UNAVAIL,
	DEBUG_EXITS,
	TIMEINGUEST,

	/* Not an exit type: the number of enumerators above. */
	__NUMBER_OF_KVM_EXIT_TYPES
};

/* allow access to big endian 32bit upper/lower parts and 64bit var */
154
struct kvmppc_exit_timing {
155 156 157 158 159 160 161 162
	union {
		u64 tv64;
		struct {
			u32 tbu, tbl;
		} tv32;
	};
};

163 164 165 166 167
/* Pairs a pfn value with an atomic reference count. */
struct kvmppc_pginfo {
	unsigned long pfn;
	atomic_t refcnt;
};

168 169 170 171 172 173 174 175
/*
 * One sPAPR TCE table, linked into a list through @list and tied to
 * its owning VM through @kvm.
 *
 * @pages is a C99 flexible array member (previously the GNU
 * zero-length form "pages[0]"); sizeof(struct kvmppc_spapr_tce_table)
 * is unchanged, so existing "sizeof(*t) + n * sizeof(struct page *)"
 * allocations remain correct.
 */
struct kvmppc_spapr_tce_table {
	struct list_head list;
	struct kvm *kvm;
	u64 liobn;
	u32 window_size;
	struct page *pages[];	/* trailing variable-length array */
};

176
struct kvmppc_linear_info {
177 178 179 180
	void		*base_virt;
	unsigned long	 base_pfn;
	unsigned long	 npages;
	struct list_head list;
181 182
	atomic_t	 use_count;
	int		 type;
183 184
};

185 186 187
/*
 * The reverse mapping array has one entry for each HPTE,
 * which stores the guest's view of the second word of the HPTE
 * (including the guest physical address of the mapping),
 * plus forward and backward pointers in a doubly-linked ring
 * of HPTEs that map the same host page.  The pointers in this
 * ring are 32-bit HPTE indexes, to save space.
 */
struct revmap_entry {
	unsigned long guest_rpte;
	unsigned int forw, back;
};

198 199 200 201 202 203
/*
 * We use the top bit of each memslot->rmap entry as a lock bit,
 * and bit 32 as a present flag.  The bottom 32 bits are the
 * index in the guest HPT of a HPTE that points to the page.
 * The referenced/changed flags are HPTE_R_R / HPTE_R_C shifted
 * left by KVMPPC_RMAP_RC_SHIFT.
 */
#define KVMPPC_RMAP_LOCK_BIT	63
#define KVMPPC_RMAP_RC_SHIFT	32
#define KVMPPC_RMAP_REFERENCED	(HPTE_R_R << KVMPPC_RMAP_RC_SHIFT)
#define KVMPPC_RMAP_CHANGED	(HPTE_R_C << KVMPPC_RMAP_RC_SHIFT)
#define KVMPPC_RMAP_PRESENT	0x100000000ul
#define KVMPPC_RMAP_INDEX	0xfffffffful

210
/*
 * Low-order bits in kvm->arch.slot_phys[][]:
 * a 5-bit order field followed by three flag bits.
 */
#define KVMPPC_PAGE_ORDER_MASK	0x1f
#define KVMPPC_PAGE_NO_CACHE	HPTE_R_I	/* 0x20 */
#define KVMPPC_PAGE_WRITETHRU	HPTE_R_W	/* 0x40 */
#define KVMPPC_GOT_PAGE		0x80

216 217 218
/* Arch-specific memory slot data; declares no members at present. */
struct kvm_arch_memory_slot {
};

219
/*
 * Architecture-specific VM state.  Every member is conditional on
 * CONFIG_KVM_BOOK3S_64_HV; without it the struct has no members.
 */
struct kvm_arch {
#ifdef CONFIG_KVM_BOOK3S_64_HV
	unsigned long hpt_virt;
	struct revmap_entry *revmap;
	unsigned int lpid;
	unsigned int host_lpid;
	unsigned long host_lpcr;
	unsigned long sdr1;
	unsigned long host_sdr1;
	int tlbie_lock;
	unsigned long lpcr;
	unsigned long rmor;
	struct kvmppc_linear_info *rma;
	unsigned long vrma_slb_v;
	int rma_setup_done;
	int using_mmu_notifiers;
	struct list_head spapr_tce_tables;
	spinlock_t slot_phys_lock;
	/* Per-memslot arrays, one element per slot (KVM_MEM_SLOTS_NUM). */
	unsigned long *slot_phys[KVM_MEM_SLOTS_NUM];
	int slot_npages[KVM_MEM_SLOTS_NUM];
	unsigned short last_vcpu[NR_CPUS];
	struct kvmppc_vcore *vcores[KVM_MAX_VCORES];
	struct kvmppc_linear_info *hpt_li;
#endif /* CONFIG_KVM_BOOK3S_64_HV */
};

245 246 247 248 249 250 251 252 253
/*
 * Struct for a virtual core.
 * Note: entry_exit_count combines an entry count in the bottom 8 bits
 * and an exit count in the next 8 bits.  This is so that we can
 * atomically increment the entry count iff the exit count is 0
 * without taking the lock.
 */
struct kvmppc_vcore {
	int n_runnable;
254
	int n_busy;
255 256 257 258
	int num_threads;
	int entry_exit_count;
	int n_woken;
	int nap_count;
259
	int napping_threads;
260
	u16 pcpu;
261
	u8 vcore_state;
262 263 264
	u8 in_guest;
	struct list_head runnable_threads;
	spinlock_t lock;
265
	wait_queue_head_t wq;
266 267 268 269 270
};

/*
 * Unpack the two counters held in a vcore's entry_exit_count:
 * the entry count is the low byte, the exit count is everything
 * above bit 7.  @vc is a pointer to the vcore.
 */
#define VCORE_ENTRY_COUNT(vc)	(0xff & (vc)->entry_exit_count)
#define VCORE_EXIT_COUNT(vc)	((vc)->entry_exit_count >> 8)

271 272 273 274 275 276
/* Values for vcore_state (the u8 member of struct kvmppc_vcore) */
#define VCORE_INACTIVE	0
#define VCORE_RUNNING	1
#define VCORE_EXITING	2
#define VCORE_SLEEPING	3

A
Alexander Graf 已提交
277
struct kvmppc_pte {
A
Alexander Graf 已提交
278
	ulong eaddr;
A
Alexander Graf 已提交
279
	u64 vpage;
A
Alexander Graf 已提交
280
	ulong raddr;
A
Alexander Graf 已提交
281 282 283
	bool may_read		: 1;
	bool may_write		: 1;
	bool may_execute	: 1;
A
Alexander Graf 已提交
284 285 286 287 288 289 290 291 292 293 294 295 296 297 298
};

/*
 * Table of MMU callbacks.  Every callback takes the vcpu it
 * operates on as its first argument.
 */
struct kvmppc_mmu {
	/* book3s_64 only */
	void (*slbmte)(struct kvm_vcpu *vcpu, u64 rb, u64 rs);
	u64  (*slbmfee)(struct kvm_vcpu *vcpu, u64 slb_nr);
	u64  (*slbmfev)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbie)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbia)(struct kvm_vcpu *vcpu);
	/* book3s */
	void (*mtsrin)(struct kvm_vcpu *vcpu, u32 srnum, ulong value);
	u32  (*mfsrin)(struct kvm_vcpu *vcpu, u32 srnum);
	int  (*xlate)(struct kvm_vcpu *vcpu, gva_t eaddr, struct kvmppc_pte *pte, bool data);
	void (*reset_msr)(struct kvm_vcpu *vcpu);
	void (*tlbie)(struct kvm_vcpu *vcpu, ulong addr, bool large);
	int  (*esid_to_vsid)(struct kvm_vcpu *vcpu, ulong esid, u64 *vsid);
	u64  (*ea_to_vp)(struct kvm_vcpu *vcpu, gva_t eaddr, bool data);
	bool (*is_dcbz32)(struct kvm_vcpu *vcpu);
};

304 305 306 307 308 309 310 311 312 313 314 315
/*
 * One SLB entry: four 64-bit words (esid, vsid, orige, origv)
 * followed by one-bit flags.
 */
struct kvmppc_slb {
	u64 esid;
	u64 vsid;
	u64 orige;
	u64 origv;
	bool valid	: 1;
	bool Ks		: 1;
	bool Kp		: 1;
	bool nx		: 1;
	bool large	: 1;	/* PTEs are 16MB */
	bool tb		: 1;	/* 1TB segment */
	bool class	: 1;
};

318
struct kvm_vcpu_arch {
A
Alexander Graf 已提交
319
	ulong host_stack;
320
	u32 host_pid;
321
#ifdef CONFIG_PPC_BOOK3S
322
	struct kvmppc_slb slb[64];
323
	int slb_max;		/* 1 + index of last valid entry in slb[] */
324
	int slb_nr;		/* total number of entries in SLB */
A
Alexander Graf 已提交
325 326
	struct kvmppc_mmu mmu;
#endif
327

328
	ulong gpr[32];
329

330
	u64 fpr[32];
A
Alexander Graf 已提交
331
	u64 fpscr;
332

333 334 335 336 337 338
#ifdef CONFIG_SPE
	ulong evr[32];
	ulong spefscr;
	ulong host_spefscr;
	u64 acc;
#endif
339 340 341 342 343 344
#ifdef CONFIG_ALTIVEC
	vector128 vr[32];
	vector128 vscr;
#endif

#ifdef CONFIG_VSX
345
	u64 vsr[64];
346 347
#endif

A
Alexander Graf 已提交
348 349 350 351 352
#ifdef CONFIG_PPC_BOOK3S
	/* For Gekko paired singles */
	u32 qpr[32];
#endif

353 354 355
	ulong pc;
	ulong ctr;
	ulong lr;
356

357
	ulong xer;
358
	u32 cr;
359

360
#ifdef CONFIG_PPC_BOOK3S
A
Alexander Graf 已提交
361
	ulong hflags;
362
	ulong guest_owned_ext;
363 364 365 366 367 368 369
	ulong purr;
	ulong spurr;
	ulong dscr;
	ulong amr;
	ulong uamor;
	u32 ctrl;
	ulong dabr;
A
Alexander Graf 已提交
370
#endif
371
	u32 vrsave; /* also USPRG0 */
372
	u32 mmucr;
S
Scott Wood 已提交
373
	ulong shadow_msr;
374 375 376 377
	ulong csrr0;
	ulong csrr1;
	ulong dsrr0;
	ulong dsrr1;
S
Scott Wood 已提交
378 379 380
	ulong mcsrr0;
	ulong mcsrr1;
	ulong mcsr;
381 382 383 384 385
	u32 dec;
	u32 decar;
	u32 tbl;
	u32 tbu;
	u32 tcr;
386
	ulong tsr; /* we need to perform set/clr_bits() which requires ulong */
387
	u32 ivor[64];
388
	ulong ivpr;
A
Alexander Graf 已提交
389
	u32 pvr;
390 391

	u32 shadow_pid;
L
Liu Yu 已提交
392
	u32 shadow_pid1;
393
	u32 pid;
394 395
	u32 swap_pid;

396 397 398 399
	u32 ccr0;
	u32 ccr1;
	u32 dbcr0;
	u32 dbcr1;
400
	u32 dbsr;
401

402
	u64 mmcr[3];
403
	u32 pmc[8];
404

405
#ifdef CONFIG_KVM_EXIT_TIMING
406
	struct mutex exit_timing_lock;
407 408
	struct kvmppc_exit_timing timing_exit;
	struct kvmppc_exit_timing timing_last_enter;
409 410 411 412 413 414 415 416 417 418
	u32 last_exit_type;
	u32 timing_count_type[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_quad_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_min_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_max_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_last_exit;
	struct dentry *debugfs_exit_timing;
#endif

419 420 421 422 423
#ifdef CONFIG_PPC_BOOK3S
	ulong fault_dar;
	u32 fault_dsisr;
#endif

424
#ifdef CONFIG_BOOKE
425 426
	ulong fault_dear;
	ulong fault_esr;
427 428
	ulong queued_dear;
	ulong queued_esr;
429 430
	u32 tlbcfg[4];
	u32 mmucfg;
431
#endif
432 433 434 435
	gpa_t paddr_accessed;

	u8 io_gpr; /* GPR used as IO source/target */
	u8 mmio_is_bigendian;
A
Alexander Graf 已提交
436
	u8 mmio_sign_extend;
437 438
	u8 dcr_needed;
	u8 dcr_is_write;
439 440
	u8 osi_needed;
	u8 osi_enabled;
A
Alexander Graf 已提交
441
	u8 papr_enabled;
442 443
	u8 sane;
	u8 cpu_type;
444
	u8 hcall_needed;
445 446 447

	u32 cpr0_cfgaddr; /* holds the last set cpr0_cfgaddr */

A
Alexander Graf 已提交
448 449
	struct hrtimer dec_timer;
	struct tasklet_struct tasklet;
A
Alexander Graf 已提交
450
	u64 dec_jiffies;
451
	u64 dec_expires;
452
	unsigned long pending_exceptions;
453
	u16 last_cpu;
454 455
	u8 ceded;
	u8 prodded;
456
	u32 last_inst;
457 458 459 460 461

	struct lppaca *vpa;
	struct slb_shadow *slb_shadow;
	struct dtl *dtl;
	struct dtl *dtl_end;
462

463
	wait_queue_head_t *wqp;
464 465
	struct kvmppc_vcore *vcore;
	int ret;
466
	int trap;
467 468
	int state;
	int ptid;
469
	bool timer_running;
470 471
	wait_queue_head_t cpu_run;

A
Alexander Graf 已提交
472
	struct kvm_vcpu_arch_shared *shared;
A
Alexander Graf 已提交
473 474
	unsigned long magic_page_pa; /* phys addr to map the magic page to */
	unsigned long magic_page_ea; /* effect. addr to map the magic page to */
475 476 477

#ifdef CONFIG_KVM_BOOK3S_64_HV
	struct kvm_vcpu_arch_shared shregs;
478

479 480 481 482
	unsigned long pgfault_addr;
	long pgfault_index;
	unsigned long pgfault_hpte[2];

483 484 485
	struct list_head run_list;
	struct task_struct *run_task;
	struct kvm_run *kvm_run;
486
	pgd_t *pgdir;
487
#endif
488 489
};

490 491 492
/* Values for vcpu->arch.state */
#define KVMPPC_VCPU_STOPPED		0
#define KVMPPC_VCPU_BUSY_IN_HOST	1
#define KVMPPC_VCPU_RUNNABLE		2

495 496 497 498 499 500 501 502
/*
 * Values for vcpu->arch.io_gpr
 *
 * The low five bits (KVM_MMIO_REG_MASK) hold a register number; the
 * bits above them (KVM_MMIO_REG_EXT_MASK) select the register class
 * via one of the KVM_MMIO_REG_* class values below.
 *
 * NOTE(review): io_gpr is declared u8 in struct kvm_vcpu_arch, so only
 * bits 5-7 of the 16-bit KVM_MMIO_REG_EXT_MASK can be set in it.  All
 * class values currently defined fit in those bits.
 */
#define KVM_MMIO_REG_MASK	0x001f
#define KVM_MMIO_REG_EXT_MASK	0xffe0
#define KVM_MMIO_REG_GPR	0x0000
#define KVM_MMIO_REG_FPR	0x0020
#define KVM_MMIO_REG_QPR	0x0040
#define KVM_MMIO_REG_FQPR	0x0060

503
#define __KVM_HAVE_ARCH_WQP
504

505
#endif /* __POWERPC_KVM_HOST_H__ */