kvm_host.h 11.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License, version 2, as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
 *
 * Copyright IBM Corp. 2007
 *
 * Authors: Hollis Blanchard <hollisb@us.ibm.com>
 */

#ifndef __POWERPC_KVM_HOST_H__
#define __POWERPC_KVM_HOST_H__

#include <linux/mutex.h>
A
Alexander Graf 已提交
24 25
#include <linux/hrtimer.h>
#include <linux/interrupt.h>
26 27
#include <linux/types.h>
#include <linux/kvm_types.h>
28 29
#include <linux/threads.h>
#include <linux/spinlock.h>
A
Alexander Graf 已提交
30
#include <linux/kvm_para.h>
31 32
#include <linux/list.h>
#include <linux/atomic.h>
33
#include <asm/kvm_asm.h>
34
#include <asm/processor.h>
35
#include <asm/page.h>
36

37 38
/* Both the vcpu and the vcore limits are defined as NR_CPUS. */
#define KVM_MAX_VCPUS		NR_CPUS
#define KVM_MAX_VCORES		NR_CPUS
#define KVM_MEMORY_SLOTS 32
/* memory slots that are not exposed to userspace */
#define KVM_PRIVATE_MEM_SLOTS 4
/* Total slot count: the regular slots plus the private ones. */
#define KVM_MEM_SLOTS_NUM (KVM_MEMORY_SLOTS + KVM_PRIVATE_MEM_SLOTS)

/* The coalesced-MMIO page offset is only defined when CONFIG_KVM_MMIO is set. */
#ifdef CONFIG_KVM_MMIO
#define KVM_COALESCED_MMIO_PAGE_OFFSET 1
#endif
47

48 49 50 51 52 53 54 55 56 57 58 59 60
#ifdef CONFIG_KVM_BOOK3S_64_HV
#include <linux/mmu_notifier.h>

/*
 * HV builds only: define KVM_ARCH_WANT_MMU_NOTIFIER and declare the
 * host-virtual-address (hva) hooks that go with it.
 */
#define KVM_ARCH_WANT_MMU_NOTIFIER

struct kvm;

int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
int kvm_age_hva(struct kvm *kvm, unsigned long hva);
int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);

#endif /* CONFIG_KVM_BOOK3S_64_HV */

61
/*
 * We don't currently support large pages.
 *
 * Only one page size is advertised, and the argument x of the two
 * function-like macros is ignored: each expands to a constant.
 */
#define KVM_HPAGE_GFN_SHIFT(x)	0
#define KVM_NR_PAGE_SIZES	1
#define KVM_PAGES_PER_HPAGE(x)	(1UL<<31)
65

66 67
/*
 * HPTEG cache sizing.  Each HPTEG_HASH_NUM_* value is derived from the
 * matching HPTEG_HASH_BITS_* value as 1 << bits.
 */
#define HPTEG_CACHE_NUM			(1 << 15)
#define HPTEG_HASH_BITS_PTE		13
#define HPTEG_HASH_BITS_PTE_LONG	12
#define HPTEG_HASH_BITS_VPTE		13
#define HPTEG_HASH_BITS_VPTE_LONG	5
#define HPTEG_HASH_NUM_PTE		(1 << HPTEG_HASH_BITS_PTE)
#define HPTEG_HASH_NUM_PTE_LONG		(1 << HPTEG_HASH_BITS_PTE_LONG)
#define HPTEG_HASH_NUM_VPTE		(1 << HPTEG_HASH_BITS_VPTE)
#define HPTEG_HASH_NUM_VPTE_LONG	(1 << HPTEG_HASH_BITS_VPTE_LONG)
A
Alexander Graf 已提交
75

A
Alexander Graf 已提交
76 77 78
/*
 * Physical Address Mask - allowed range of real mode RAM access.
 * All ones with the top four bits cleared (the low 60 bits set).
 */
#define KVM_PAM			(~0ULL >> 4)

79 80 81 82
/* Forward declarations: only pointers to these types are used below. */
struct kvm;
struct kvm_run;
struct kvm_vcpu;

83 84 85 86
/* Forward declarations for the vpa, slb_shadow and dtl pointers in kvm_vcpu_arch. */
struct lppaca;
struct slb_shadow;
struct dtl;

87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107
/* VM-wide statistics counters. */
struct kvm_vm_stat {
	u32	remote_tlb_flush;
};

/*
 * Per-vcpu statistics counters.  The trailing group of fields exists
 * only when CONFIG_PPC_BOOK3S is set.
 */
struct kvm_vcpu_stat {
	u32 sum_exits;
	u32 mmio_exits;
	u32 dcr_exits;
	u32 signal_exits;
	u32 light_exits;
	/* Account for special types of light exits: */
	u32 itlb_real_miss_exits;
	u32 itlb_virt_miss_exits;
	u32 dtlb_real_miss_exits;
	u32 dtlb_virt_miss_exits;
	u32 syscall_exits;
	u32 isi_exits;
	u32 dsi_exits;
	u32 emulated_inst_exits;
	u32 dec_exits;
	u32 ext_intr_exits;
	u32 halt_wakeup;
#ifdef CONFIG_PPC_BOOK3S
	u32 pf_storage;
	u32 pf_instruc;
	u32 sp_storage;
	u32 sp_instruc;
	u32 queue_intr;
	u32 ld;
	u32 ld_slow;
	u32 st;
	u32 st_slow;
#endif
};

122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153
/*
 * Exit type identifiers.  Values are consecutive starting at zero, so
 * __NUMBER_OF_KVM_EXIT_TYPES (always last) equals the number of types
 * and can be used to size per-type arrays.
 */
enum kvm_exit_types {
	MMIO_EXITS = 0,
	DCR_EXITS,
	SIGNAL_EXITS,

	ITLB_REAL_MISS_EXITS,
	ITLB_VIRT_MISS_EXITS,
	DTLB_REAL_MISS_EXITS,
	DTLB_VIRT_MISS_EXITS,

	SYSCALL_EXITS,
	ISI_EXITS,
	DSI_EXITS,

	EMULATED_INST_EXITS,
	EMULATED_MTMSRWE_EXITS,
	EMULATED_WRTEE_EXITS,
	EMULATED_MTSPR_EXITS,
	EMULATED_MFSPR_EXITS,
	EMULATED_MTMSR_EXITS,
	EMULATED_MFMSR_EXITS,
	EMULATED_TLBSX_EXITS,
	EMULATED_TLBWE_EXITS,
	EMULATED_RFI_EXITS,

	DEC_EXITS,
	EXT_INTR_EXITS,
	HALT_WAKEUP,
	USR_PR_INST,
	FP_UNAVAIL,
	DEBUG_EXITS,
	TIMEINGUEST,

	__NUMBER_OF_KVM_EXIT_TYPES	/* keep last */
};

/* allow access to big endian 32bit upper/lower parts and 64bit var */
154
struct kvmppc_exit_timing {
155 156 157 158 159 160 161 162
	union {
		u64 tv64;
		struct {
			u32 tbu, tbl;
		} tv32;
	};
};

163 164 165 166 167
/* A page frame number paired with an atomic reference count. */
struct kvmppc_pginfo {
	unsigned long	pfn;
	atomic_t	refcnt;
};

168 169 170 171 172 173 174 175
/*
 * One sPAPR TCE table, linked through 'list' and identified by 'liobn'.
 *
 * 'pages' is a trailing variable-length array, declared as a C99
 * flexible array member rather than a zero-length array; the number of
 * entries is chosen by whoever allocates the structure.
 */
struct kvmppc_spapr_tce_table {
	struct list_head list;
	struct kvm *kvm;
	u64 liobn;
	u32 window_size;
	struct page *pages[];
};

176
struct kvmppc_linear_info {
177 178 179 180
	void		*base_virt;
	unsigned long	 base_pfn;
	unsigned long	 npages;
	struct list_head list;
181 182
	atomic_t	 use_count;
	int		 type;
183 184
};

185 186 187
/*
 * The reverse mapping array has one entry for each HPTE,
 * which stores the guest's view of the second word of the HPTE
 * (including the guest physical address of the mapping),
 * plus forward and backward pointers in a doubly-linked ring
 * of HPTEs that map the same host page.  The pointers in this
 * ring are 32-bit HPTE indexes, to save space.
 */
struct revmap_entry {
	unsigned long guest_rpte;
	unsigned int forw;	/* forward link (HPTE index) */
	unsigned int back;	/* backward link (HPTE index) */
};

198 199 200 201 202 203
/*
 * We use the top bit of each memslot->rmap entry as a lock bit,
 * and bit 32 as a present flag.  The bottom 32 bits are the
 * index in the guest HPT of a HPTE that points to the page.
 *
 * The referenced/changed flags are the HPTE_R_R / HPTE_R_C bits
 * shifted up by KVMPPC_RMAP_RC_SHIFT.
 */
#define KVMPPC_RMAP_LOCK_BIT	63
#define KVMPPC_RMAP_RC_SHIFT	32
#define KVMPPC_RMAP_REFERENCED	(HPTE_R_R << KVMPPC_RMAP_RC_SHIFT)
#define KVMPPC_RMAP_CHANGED	(HPTE_R_C << KVMPPC_RMAP_RC_SHIFT)
#define KVMPPC_RMAP_PRESENT	0x100000000ul
#define KVMPPC_RMAP_INDEX	0xfffffffful

210
/*
 * Low-order bits in kvm->arch.slot_phys[][]
 *
 * The low five bits form the page-order field; the remaining flags
 * occupy single bits above it.
 */
#define KVMPPC_PAGE_ORDER_MASK	0x1f
#define KVMPPC_PAGE_NO_CACHE	HPTE_R_I	/* 0x20 */
#define KVMPPC_PAGE_WRITETHRU	HPTE_R_W	/* 0x40 */
#define KVMPPC_GOT_PAGE		0x80

216
/*
 * Architecture-specific per-VM state.  Every member is guarded by
 * CONFIG_KVM_BOOK3S_64_HV, so the structure has no members in other
 * configurations.
 */
struct kvm_arch {
#ifdef CONFIG_KVM_BOOK3S_64_HV
	unsigned long hpt_virt;
	struct revmap_entry *revmap;
	unsigned int lpid;
	unsigned int host_lpid;
	unsigned long host_lpcr;
	unsigned long sdr1;
	unsigned long host_sdr1;
	int tlbie_lock;
	unsigned long lpcr;
	unsigned long rmor;
	struct kvmppc_linear_info *rma;
	unsigned long vrma_slb_v;
	int rma_setup_done;
	int using_mmu_notifiers;
	struct list_head spapr_tce_tables;
	spinlock_t slot_phys_lock;
	/* Per-memslot arrays, one element for each of KVM_MEM_SLOTS_NUM slots */
	unsigned long *slot_phys[KVM_MEM_SLOTS_NUM];
	int slot_npages[KVM_MEM_SLOTS_NUM];
	unsigned short last_vcpu[NR_CPUS];
	struct kvmppc_vcore *vcores[KVM_MAX_VCORES];
#endif /* CONFIG_KVM_BOOK3S_64_HV */
};

241 242 243 244 245 246 247 248 249
/*
 * Struct for a virtual core.
 * Note: entry_exit_count combines an entry count in the bottom 8 bits
 * and an exit count in the next 8 bits.  This is so that we can
 * atomically increment the entry count iff the exit count is 0
 * without taking the lock.
 */
struct kvmppc_vcore {
	int n_runnable;
250
	int n_busy;
251 252 253 254
	int num_threads;
	int entry_exit_count;
	int n_woken;
	int nap_count;
255
	int napping_threads;
256
	u16 pcpu;
257
	u8 vcore_state;
258 259 260
	u8 in_guest;
	struct list_head runnable_threads;
	spinlock_t lock;
261
	wait_queue_head_t wq;
262 263 264 265 266
};

/*
 * Accessors for the two counters packed into (vc)->entry_exit_count:
 * the entry count is the low 8 bits, the exit count is everything
 * from bit 8 upwards.
 */
#define VCORE_ENTRY_COUNT(vc)	(0xff & (vc)->entry_exit_count)
#define VCORE_EXIT_COUNT(vc)	(((vc)->entry_exit_count) >> 8)

267 268 269 270 271 272
/*
 * Values for vcore_state
 * (stored in the u8 vcore_state member of struct kvmppc_vcore).
 */
#define VCORE_INACTIVE		0
#define VCORE_RUNNING		1
#define VCORE_EXITING		2
#define VCORE_SLEEPING		3

A
Alexander Graf 已提交
273
struct kvmppc_pte {
A
Alexander Graf 已提交
274
	ulong eaddr;
A
Alexander Graf 已提交
275
	u64 vpage;
A
Alexander Graf 已提交
276
	ulong raddr;
A
Alexander Graf 已提交
277 278 279
	bool may_read		: 1;
	bool may_write		: 1;
	bool may_execute	: 1;
A
Alexander Graf 已提交
280 281 282 283 284 285 286 287 288 289 290 291 292 293 294
};

/*
 * Table of MMU callbacks.  Every callback receives the vcpu as its
 * first argument.
 */
struct kvmppc_mmu {
	/* book3s_64 only */
	void (*slbmte)(struct kvm_vcpu *vcpu, u64 rb, u64 rs);
	u64  (*slbmfee)(struct kvm_vcpu *vcpu, u64 slb_nr);
	u64  (*slbmfev)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbie)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbia)(struct kvm_vcpu *vcpu);
	/* book3s */
	void (*mtsrin)(struct kvm_vcpu *vcpu, u32 srnum, ulong value);
	u32  (*mfsrin)(struct kvm_vcpu *vcpu, u32 srnum);
	int  (*xlate)(struct kvm_vcpu *vcpu, gva_t eaddr, struct kvmppc_pte *pte, bool data);
	void (*reset_msr)(struct kvm_vcpu *vcpu);
	void (*tlbie)(struct kvm_vcpu *vcpu, ulong addr, bool large);
	int  (*esid_to_vsid)(struct kvm_vcpu *vcpu, ulong esid, u64 *vsid);
	u64  (*ea_to_vp)(struct kvm_vcpu *vcpu, gva_t eaddr, bool data);
	bool (*is_dcbz32)(struct kvm_vcpu *vcpu);
};

300 301 302 303 304 305 306 307 308 309 310 311
/*
 * One SLB entry: four 64-bit words (esid, vsid, orige, origv)
 * followed by single-bit flags.
 */
struct kvmppc_slb {
	u64 esid;
	u64 vsid;
	u64 orige;
	u64 origv;
	bool valid	: 1;
	bool Ks		: 1;
	bool Kp		: 1;
	bool nx		: 1;
	bool large	: 1;	/* PTEs are 16MB */
	bool tb		: 1;	/* 1TB segment */
	bool class	: 1;
};

314
struct kvm_vcpu_arch {
A
Alexander Graf 已提交
315
	ulong host_stack;
316
	u32 host_pid;
317
#ifdef CONFIG_PPC_BOOK3S
318
	struct kvmppc_slb slb[64];
319
	int slb_max;		/* 1 + index of last valid entry in slb[] */
320
	int slb_nr;		/* total number of entries in SLB */
A
Alexander Graf 已提交
321 322
	struct kvmppc_mmu mmu;
#endif
323

324
	ulong gpr[32];
325

326
	u64 fpr[32];
A
Alexander Graf 已提交
327
	u64 fpscr;
328

329 330 331 332 333 334
#ifdef CONFIG_SPE
	ulong evr[32];
	ulong spefscr;
	ulong host_spefscr;
	u64 acc;
#endif
335 336 337 338 339 340
#ifdef CONFIG_ALTIVEC
	vector128 vr[32];
	vector128 vscr;
#endif

#ifdef CONFIG_VSX
341
	u64 vsr[64];
342 343
#endif

A
Alexander Graf 已提交
344 345 346 347 348
#ifdef CONFIG_PPC_BOOK3S
	/* For Gekko paired singles */
	u32 qpr[32];
#endif

349 350 351
	ulong pc;
	ulong ctr;
	ulong lr;
352

353
	ulong xer;
354
	u32 cr;
355

356
#ifdef CONFIG_PPC_BOOK3S
A
Alexander Graf 已提交
357
	ulong hflags;
358
	ulong guest_owned_ext;
359 360 361 362 363 364 365
	ulong purr;
	ulong spurr;
	ulong dscr;
	ulong amr;
	ulong uamor;
	u32 ctrl;
	ulong dabr;
A
Alexander Graf 已提交
366
#endif
367
	u32 vrsave; /* also USPRG0 */
368
	u32 mmucr;
S
Scott Wood 已提交
369
	ulong shadow_msr;
370 371 372 373
	ulong csrr0;
	ulong csrr1;
	ulong dsrr0;
	ulong dsrr1;
S
Scott Wood 已提交
374 375 376
	ulong mcsrr0;
	ulong mcsrr1;
	ulong mcsr;
377 378 379 380 381
	u32 dec;
	u32 decar;
	u32 tbl;
	u32 tbu;
	u32 tcr;
382
	ulong tsr; /* we need to perform set/clr_bits() which requires ulong */
383
	u32 ivor[64];
384
	ulong ivpr;
A
Alexander Graf 已提交
385
	u32 pvr;
386 387

	u32 shadow_pid;
L
Liu Yu 已提交
388
	u32 shadow_pid1;
389
	u32 pid;
390 391
	u32 swap_pid;

392 393 394 395
	u32 ccr0;
	u32 ccr1;
	u32 dbcr0;
	u32 dbcr1;
396
	u32 dbsr;
397

398
	u64 mmcr[3];
399
	u32 pmc[8];
400

401
#ifdef CONFIG_KVM_EXIT_TIMING
402
	struct mutex exit_timing_lock;
403 404
	struct kvmppc_exit_timing timing_exit;
	struct kvmppc_exit_timing timing_last_enter;
405 406 407 408 409 410 411 412 413 414
	u32 last_exit_type;
	u32 timing_count_type[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_quad_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_min_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_max_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_last_exit;
	struct dentry *debugfs_exit_timing;
#endif

415 416 417 418 419
#ifdef CONFIG_PPC_BOOK3S
	ulong fault_dar;
	u32 fault_dsisr;
#endif

420
#ifdef CONFIG_BOOKE
421 422
	ulong fault_dear;
	ulong fault_esr;
423 424
	ulong queued_dear;
	ulong queued_esr;
425
#endif
426 427 428 429
	gpa_t paddr_accessed;

	u8 io_gpr; /* GPR used as IO source/target */
	u8 mmio_is_bigendian;
A
Alexander Graf 已提交
430
	u8 mmio_sign_extend;
431 432
	u8 dcr_needed;
	u8 dcr_is_write;
433 434
	u8 osi_needed;
	u8 osi_enabled;
A
Alexander Graf 已提交
435
	u8 papr_enabled;
436 437
	u8 sane;
	u8 cpu_type;
438
	u8 hcall_needed;
439 440 441

	u32 cpr0_cfgaddr; /* holds the last set cpr0_cfgaddr */

A
Alexander Graf 已提交
442 443
	struct hrtimer dec_timer;
	struct tasklet_struct tasklet;
A
Alexander Graf 已提交
444
	u64 dec_jiffies;
445
	u64 dec_expires;
446
	unsigned long pending_exceptions;
447
	u16 last_cpu;
448 449
	u8 ceded;
	u8 prodded;
450
	u32 last_inst;
451 452 453 454 455

	struct lppaca *vpa;
	struct slb_shadow *slb_shadow;
	struct dtl *dtl;
	struct dtl *dtl_end;
456

457
	wait_queue_head_t *wqp;
458 459
	struct kvmppc_vcore *vcore;
	int ret;
460
	int trap;
461 462
	int state;
	int ptid;
463
	bool timer_running;
464 465
	wait_queue_head_t cpu_run;

A
Alexander Graf 已提交
466
	struct kvm_vcpu_arch_shared *shared;
A
Alexander Graf 已提交
467 468
	unsigned long magic_page_pa; /* phys addr to map the magic page to */
	unsigned long magic_page_ea; /* effect. addr to map the magic page to */
469 470 471

#ifdef CONFIG_KVM_BOOK3S_64_HV
	struct kvm_vcpu_arch_shared shregs;
472

473 474 475 476
	unsigned long pgfault_addr;
	long pgfault_index;
	unsigned long pgfault_hpte[2];

477 478 479
	struct list_head run_list;
	struct task_struct *run_task;
	struct kvm_run *kvm_run;
480
	pgd_t *pgdir;
481
#endif
482 483
};

484 485 486
/* Values for vcpu->arch.state */
#define KVMPPC_VCPU_STOPPED		0
#define KVMPPC_VCPU_BUSY_IN_HOST	1
#define KVMPPC_VCPU_RUNNABLE		2

489 490 491 492 493 494 495 496
/*
 * Values for vcpu->arch.io_gpr
 *
 * The low five bits (KVM_MMIO_REG_MASK) hold a register number; the
 * bits selected by KVM_MMIO_REG_EXT_MASK hold one of the register-file
 * tags below.
 * NOTE(review): io_gpr is declared u8 in struct kvm_vcpu_arch, so only
 * the low byte of the EXT mask can actually be stored there - confirm
 * this is intended.
 */
#define KVM_MMIO_REG_MASK		0x001f
#define KVM_MMIO_REG_EXT_MASK		0xffe0

#define KVM_MMIO_REG_GPR		0x0000
#define KVM_MMIO_REG_FPR		0x0020
#define KVM_MMIO_REG_QPR		0x0040
#define KVM_MMIO_REG_FQPR		0x0060

497
#endif /* __POWERPC_KVM_HOST_H__ */