kvm_host.h 10.5 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License, version 2, as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
 *
 * Copyright IBM Corp. 2007
 *
 * Authors: Hollis Blanchard <hollisb@us.ibm.com>
 */

#ifndef __POWERPC_KVM_HOST_H__
#define __POWERPC_KVM_HOST_H__

#include <linux/mutex.h>
A
Alexander Graf 已提交
24 25
#include <linux/hrtimer.h>
#include <linux/interrupt.h>
26 27
#include <linux/types.h>
#include <linux/kvm_types.h>
28 29
#include <linux/threads.h>
#include <linux/spinlock.h>
A
Alexander Graf 已提交
30
#include <linux/kvm_para.h>
31 32
#include <linux/list.h>
#include <linux/atomic.h>
33
#include <asm/kvm_asm.h>
34
#include <asm/processor.h>
35

36 37
/* Limits on vcpus and virtual cores; both are defined as NR_CPUS. */
#define KVM_MAX_VCPUS		NR_CPUS
#define KVM_MAX_VCORES		NR_CPUS
#define KVM_MEMORY_SLOTS 32
/* memory slots that are not exposed to userspace */
#define KVM_PRIVATE_MEM_SLOTS 4
/* Total number of memory slots: regular slots plus the private ones. */
#define KVM_MEM_SLOTS_NUM (KVM_MEMORY_SLOTS + KVM_PRIVATE_MEM_SLOTS)
42

43
/* Only defined when MMIO support (CONFIG_KVM_MMIO) is configured. */
#ifdef CONFIG_KVM_MMIO
#define KVM_COALESCED_MMIO_PAGE_OFFSET 1
#endif

/*
 * We don't currently support large pages.
 * Consequently there is a single page size, and the per-level macros
 * ignore their argument and expand to constants.
 */
#define KVM_HPAGE_GFN_SHIFT(x)	0
#define KVM_NR_PAGE_SIZES	1
#define KVM_PAGES_PER_HPAGE(x)	(1UL<<31)
51

52 53
/*
 * HPTEG cache sizing.  Each HPTEG_HASH_NUM_* value is derived from the
 * matching HPTEG_HASH_BITS_* value as a power of two (1 << bits).
 */
#define HPTEG_CACHE_NUM			(1 << 15)
#define HPTEG_HASH_BITS_PTE		13
#define HPTEG_HASH_BITS_PTE_LONG	12
#define HPTEG_HASH_BITS_VPTE		13
#define HPTEG_HASH_BITS_VPTE_LONG	5
#define HPTEG_HASH_NUM_PTE		(1 << HPTEG_HASH_BITS_PTE)
#define HPTEG_HASH_NUM_PTE_LONG		(1 << HPTEG_HASH_BITS_PTE_LONG)
#define HPTEG_HASH_NUM_VPTE		(1 << HPTEG_HASH_BITS_VPTE)
#define HPTEG_HASH_NUM_VPTE_LONG	(1 << HPTEG_HASH_BITS_VPTE_LONG)
A
Alexander Graf 已提交
61

A
Alexander Graf 已提交
62 63 64
/*
 * Physical Address Mask - allowed range of real mode RAM access.
 * Keeps the low 60 bits of a 64-bit address and clears the top four.
 */
#define KVM_PAM			((1ULL << 60) - 1)

65 66 67 68
/*
 * Forward declarations.  This header only uses pointers to these types,
 * so their full definitions are not needed here.
 */
struct kvm;
struct kvm_run;
struct kvm_vcpu;

struct lppaca;
struct slb_shadow;
struct dtl;

73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93
/*
 * Per-VM statistics.
 * NOTE(review): remote_tlb_flush is presumably a count of remote TLB
 * flushes; it is not updated anywhere in this header -- confirm with users.
 */
struct kvm_vm_stat {
	u32 remote_tlb_flush;
};

/*
 * Per-vcpu statistics counters (all 32-bit).
 * The final group of fields exists only when CONFIG_PPC_BOOK3S is set.
 */
struct kvm_vcpu_stat {
	u32 sum_exits;
	u32 mmio_exits;
	u32 dcr_exits;
	u32 signal_exits;
	u32 light_exits;
	/* Account for special types of light exits: */
	u32 itlb_real_miss_exits;
	u32 itlb_virt_miss_exits;
	u32 dtlb_real_miss_exits;
	u32 dtlb_virt_miss_exits;
	u32 syscall_exits;
	u32 isi_exits;
	u32 dsi_exits;
	u32 emulated_inst_exits;
	u32 dec_exits;
	u32 ext_intr_exits;
	u32 halt_wakeup;
#ifdef CONFIG_PPC_BOOK3S
	u32 pf_storage;
	u32 pf_instruc;
	u32 sp_storage;
	u32 sp_instruc;
	u32 queue_intr;
	u32 ld;
	u32 ld_slow;
	u32 st;
	u32 st_slow;
#endif
};

108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139
/*
 * Exit-type indices.  Values run sequentially from zero, so the final
 * enumerator, __NUMBER_OF_KVM_EXIT_TYPES, equals the number of real exit
 * types and is usable as an array dimension.  New types must be added
 * before it.
 */
enum kvm_exit_types {
	MMIO_EXITS = 0,
	DCR_EXITS,
	SIGNAL_EXITS,

	/* TLB misses */
	ITLB_REAL_MISS_EXITS,
	ITLB_VIRT_MISS_EXITS,
	DTLB_REAL_MISS_EXITS,
	DTLB_VIRT_MISS_EXITS,

	SYSCALL_EXITS,
	ISI_EXITS,
	DSI_EXITS,

	/* Instruction emulation, overall and per instruction */
	EMULATED_INST_EXITS,
	EMULATED_MTMSRWE_EXITS,
	EMULATED_WRTEE_EXITS,
	EMULATED_MTSPR_EXITS,
	EMULATED_MFSPR_EXITS,
	EMULATED_MTMSR_EXITS,
	EMULATED_MFMSR_EXITS,
	EMULATED_TLBSX_EXITS,
	EMULATED_TLBWE_EXITS,
	EMULATED_RFI_EXITS,

	DEC_EXITS,
	EXT_INTR_EXITS,
	HALT_WAKEUP,
	USR_PR_INST,
	FP_UNAVAIL,
	DEBUG_EXITS,
	TIMEINGUEST,

	/* Must stay last: count of the entries above. */
	__NUMBER_OF_KVM_EXIT_TYPES
};

/* allow access to big endian 32bit upper/lower parts and 64bit var */
140
struct kvmppc_exit_timing {
141 142 143 144 145 146 147 148
	union {
		u64 tv64;
		struct {
			u32 tbu, tbl;
		} tv32;
	};
};

149 150 151 152 153
/*
 * Pairs a pfn value with an atomic reference count.
 * NOTE(review): pfn is presumably a host page frame number -- confirm
 * against the code that fills it in.
 */
struct kvmppc_pginfo {
	unsigned long pfn;
	atomic_t refcnt;
};

154 155 156 157 158 159 160 161
/*
 * A TCE table, linkable into a list via 'list' (struct kvm_arch has a
 * matching spapr_tce_tables list head).
 *
 * 'pages' is a trailing variable-length array: the structure must be
 * allocated with room for the desired number of page pointers after it.
 * It is declared as a C99 flexible array member rather than a zero-length
 * array, so sizeof(struct kvmppc_spapr_tce_table) is unchanged.
 */
struct kvmppc_spapr_tce_table {
	struct list_head list;
	struct kvm *kvm;
	u64 liobn;
	u32 window_size;
	struct page *pages[];
};

162 163 164 165 166 167 168 169
/*
 * Describes one RMA region: a virtual base pointer, a base pfn, a size in
 * pages, a list linkage and an atomic use counter.
 * NOTE(review): the meaning of "RMA" and who owns the list are not visible
 * in this header -- confirm against the allocator that uses this type.
 */
struct kvmppc_rma_info {
	void		*base_virt;
	unsigned long	 base_pfn;
	unsigned long	 npages;
	struct list_head list;
	atomic_t 	 use_count;
};

170 171 172
/*
 * The reverse mapping array has one entry for each HPTE,
 * which stores the guest's view of the second word of the HPTE
 * (including the guest physical address of the mapping),
 * plus forward and backward pointers in a doubly-linked ring
 * of HPTEs that map the same host page.  The pointers in this
 * ring are 32-bit HPTE indexes, to save space.
 */
struct revmap_entry {
	unsigned long guest_rpte;
	unsigned int forw, back;
};

183 184 185 186 187 188 189 190 191 192 193
/*
 * We use the top bit of each memslot->rmap entry as a lock bit,
 * and bit 32 as a present flag.  The bottom 32 bits are the
 * index in the guest HPT of a HPTE that points to the page.
 *
 * Bit 33 is additionally named here (KVMPPC_RMAP_REF_BIT, with
 * KVMPPC_RMAP_REFERENCED as its mask).  NOTE(review): judging by the
 * name it records that the page was referenced -- confirm with users.
 */
#define KVMPPC_RMAP_LOCK_BIT	63
#define KVMPPC_RMAP_REF_BIT	33
#define KVMPPC_RMAP_REFERENCED	(1ul << KVMPPC_RMAP_REF_BIT)
#define KVMPPC_RMAP_PRESENT	0x100000000ul
#define KVMPPC_RMAP_INDEX	0xfffffffful

194
/*
 * Low-order bits in kvm->arch.slot_phys[][]
 * The low five bits are covered by KVMPPC_PAGE_ORDER_MASK; the remaining
 * values are single-bit flags above that mask.
 */
#define KVMPPC_PAGE_ORDER_MASK	0x1f
#define KVMPPC_PAGE_NO_CACHE	HPTE_R_I	/* 0x20 */
#define KVMPPC_PAGE_WRITETHRU	HPTE_R_W	/* 0x40 */
#define KVMPPC_GOT_PAGE		0x80

200
/*
 * Architecture-specific per-VM state.
 * Every field is compiled in only for CONFIG_KVM_BOOK3S_64_HV; without
 * that option the structure has no members.
 */
struct kvm_arch {
#ifdef CONFIG_KVM_BOOK3S_64_HV
	unsigned long hpt_virt;
	struct revmap_entry *revmap;
	unsigned int lpid;
	unsigned int host_lpid;
	unsigned long host_lpcr;
	unsigned long sdr1;
	unsigned long host_sdr1;
	int tlbie_lock;
	unsigned long lpcr;
	unsigned long rmor;
	struct kvmppc_rma_info *rma;
	unsigned long vrma_slb_v;
	int rma_setup_done;
	struct list_head spapr_tce_tables;
	spinlock_t slot_phys_lock;
	/* One entry per memory slot (regular and private). */
	unsigned long *slot_phys[KVM_MEM_SLOTS_NUM];
	int slot_npages[KVM_MEM_SLOTS_NUM];
	unsigned short last_vcpu[NR_CPUS];
	struct kvmppc_vcore *vcores[KVM_MAX_VCORES];
#endif /* CONFIG_KVM_BOOK3S_64_HV */
};

224 225 226 227 228 229 230 231 232
/*
 * Struct for a virtual core.
 * Note: entry_exit_count combines an entry count in the bottom 8 bits
 * and an exit count in the next 8 bits.  This is so that we can
 * atomically increment the entry count iff the exit count is 0
 * without taking the lock.
 */
struct kvmppc_vcore {
	int n_runnable;
233
	int n_busy;
234 235 236 237
	int num_threads;
	int entry_exit_count;
	int n_woken;
	int nap_count;
238
	int napping_threads;
239
	u16 pcpu;
240
	u8 vcore_state;
241 242 243
	u8 in_guest;
	struct list_head runnable_threads;
	spinlock_t lock;
244
	wait_queue_head_t wq;
245 246 247 248 249
};

/*
 * Accessors for the packed entry_exit_count field of a virtual core:
 * the entry count is the low byte, the exit count is everything above it.
 */
#define VCORE_ENTRY_COUNT(vcore)	(0xff & (vcore)->entry_exit_count)
#define VCORE_EXIT_COUNT(vcore)		((vcore)->entry_exit_count >> 8)

250 251 252 253 254 255
/*
 * Values for vcore_state (the u8 field of struct kvmppc_vcore).
 * All four values fit in that 8-bit field.
 */
#define VCORE_INACTIVE	0
#define VCORE_RUNNING	1
#define VCORE_EXITING	2
#define VCORE_SLEEPING	3

A
Alexander Graf 已提交
256
struct kvmppc_pte {
A
Alexander Graf 已提交
257
	ulong eaddr;
A
Alexander Graf 已提交
258
	u64 vpage;
A
Alexander Graf 已提交
259
	ulong raddr;
A
Alexander Graf 已提交
260 261 262
	bool may_read		: 1;
	bool may_write		: 1;
	bool may_execute	: 1;
A
Alexander Graf 已提交
263 264 265 266 267 268 269 270 271 272 273 274 275 276 277
};

/*
 * Table of MMU operation callbacks.  Every callback takes the vcpu it
 * operates on as its first argument.  The first group is marked as
 * book3s_64 only; the rest apply to book3s in general.
 */
struct kvmppc_mmu {
	/* book3s_64 only */
	void (*slbmte)(struct kvm_vcpu *vcpu, u64 rb, u64 rs);
	u64  (*slbmfee)(struct kvm_vcpu *vcpu, u64 slb_nr);
	u64  (*slbmfev)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbie)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbia)(struct kvm_vcpu *vcpu);
	/* book3s */
	void (*mtsrin)(struct kvm_vcpu *vcpu, u32 srnum, ulong value);
	u32  (*mfsrin)(struct kvm_vcpu *vcpu, u32 srnum);
	int  (*xlate)(struct kvm_vcpu *vcpu, gva_t eaddr, struct kvmppc_pte *pte, bool data);
	void (*reset_msr)(struct kvm_vcpu *vcpu);
	void (*tlbie)(struct kvm_vcpu *vcpu, ulong addr, bool large);
	int  (*esid_to_vsid)(struct kvm_vcpu *vcpu, ulong esid, u64 *vsid);
	u64  (*ea_to_vp)(struct kvm_vcpu *vcpu, gva_t eaddr, bool data);
	bool (*is_dcbz32)(struct kvm_vcpu *vcpu);
};

283 284 285 286 287 288 289 290 291 292 293 294
/*
 * One SLB entry (struct kvm_vcpu_arch holds an array of these): four
 * 64-bit words followed by one-bit attribute flags.
 * NOTE(review): orige/origv presumably keep the original (unmodified)
 * esid/vsid words -- confirm with the code that fills them in.
 */
struct kvmppc_slb {
	u64 esid;
	u64 vsid;
	u64 orige;
	u64 origv;
	bool valid	: 1;
	bool Ks		: 1;
	bool Kp		: 1;
	bool nx		: 1;
	bool large	: 1;	/* PTEs are 16MB */
	bool tb		: 1;	/* 1TB segment */
	bool class	: 1;
};

297
struct kvm_vcpu_arch {
A
Alexander Graf 已提交
298
	ulong host_stack;
299
	u32 host_pid;
300
#ifdef CONFIG_PPC_BOOK3S
301
	struct kvmppc_slb slb[64];
302
	int slb_max;		/* 1 + index of last valid entry in slb[] */
303
	int slb_nr;		/* total number of entries in SLB */
A
Alexander Graf 已提交
304 305
	struct kvmppc_mmu mmu;
#endif
306

307
	ulong gpr[32];
308

309
	u64 fpr[32];
A
Alexander Graf 已提交
310
	u64 fpscr;
311

312 313 314 315 316 317
#ifdef CONFIG_SPE
	ulong evr[32];
	ulong spefscr;
	ulong host_spefscr;
	u64 acc;
#endif
318 319 320 321 322 323
#ifdef CONFIG_ALTIVEC
	vector128 vr[32];
	vector128 vscr;
#endif

#ifdef CONFIG_VSX
324
	u64 vsr[64];
325 326
#endif

A
Alexander Graf 已提交
327 328 329 330 331
#ifdef CONFIG_PPC_BOOK3S
	/* For Gekko paired singles */
	u32 qpr[32];
#endif

332 333 334
	ulong pc;
	ulong ctr;
	ulong lr;
335

336
	ulong xer;
337
	u32 cr;
338

339
#ifdef CONFIG_PPC_BOOK3S
A
Alexander Graf 已提交
340
	ulong hflags;
341
	ulong guest_owned_ext;
342 343 344 345 346 347 348
	ulong purr;
	ulong spurr;
	ulong dscr;
	ulong amr;
	ulong uamor;
	u32 ctrl;
	ulong dabr;
A
Alexander Graf 已提交
349
#endif
350
	u32 vrsave; /* also USPRG0 */
351
	u32 mmucr;
S
Scott Wood 已提交
352
	ulong shadow_msr;
353 354 355 356
	ulong csrr0;
	ulong csrr1;
	ulong dsrr0;
	ulong dsrr1;
S
Scott Wood 已提交
357 358 359
	ulong mcsrr0;
	ulong mcsrr1;
	ulong mcsr;
360 361 362 363 364
	u32 dec;
	u32 decar;
	u32 tbl;
	u32 tbu;
	u32 tcr;
365
	ulong tsr; /* we need to perform set/clr_bits() which requires ulong */
366
	u32 ivor[64];
367
	ulong ivpr;
A
Alexander Graf 已提交
368
	u32 pvr;
369 370

	u32 shadow_pid;
L
Liu Yu 已提交
371
	u32 shadow_pid1;
372
	u32 pid;
373 374
	u32 swap_pid;

375 376 377 378
	u32 ccr0;
	u32 ccr1;
	u32 dbcr0;
	u32 dbcr1;
379
	u32 dbsr;
380

381
	u64 mmcr[3];
382
	u32 pmc[8];
383

384
#ifdef CONFIG_KVM_EXIT_TIMING
385
	struct mutex exit_timing_lock;
386 387
	struct kvmppc_exit_timing timing_exit;
	struct kvmppc_exit_timing timing_last_enter;
388 389 390 391 392 393 394 395 396 397
	u32 last_exit_type;
	u32 timing_count_type[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_quad_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_min_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_max_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_last_exit;
	struct dentry *debugfs_exit_timing;
#endif

398 399 400 401 402
#ifdef CONFIG_PPC_BOOK3S
	ulong fault_dar;
	u32 fault_dsisr;
#endif

403
#ifdef CONFIG_BOOKE
404 405
	ulong fault_dear;
	ulong fault_esr;
406 407
	ulong queued_dear;
	ulong queued_esr;
408
#endif
409 410 411 412
	gpa_t paddr_accessed;

	u8 io_gpr; /* GPR used as IO source/target */
	u8 mmio_is_bigendian;
A
Alexander Graf 已提交
413
	u8 mmio_sign_extend;
414 415
	u8 dcr_needed;
	u8 dcr_is_write;
416 417
	u8 osi_needed;
	u8 osi_enabled;
A
Alexander Graf 已提交
418
	u8 papr_enabled;
419 420
	u8 sane;
	u8 cpu_type;
421
	u8 hcall_needed;
422 423 424

	u32 cpr0_cfgaddr; /* holds the last set cpr0_cfgaddr */

A
Alexander Graf 已提交
425 426
	struct hrtimer dec_timer;
	struct tasklet_struct tasklet;
A
Alexander Graf 已提交
427
	u64 dec_jiffies;
428
	u64 dec_expires;
429
	unsigned long pending_exceptions;
430
	u16 last_cpu;
431 432
	u8 ceded;
	u8 prodded;
433
	u32 last_inst;
434 435 436 437 438

	struct lppaca *vpa;
	struct slb_shadow *slb_shadow;
	struct dtl *dtl;
	struct dtl *dtl_end;
439

440
	wait_queue_head_t *wqp;
441 442
	struct kvmppc_vcore *vcore;
	int ret;
443
	int trap;
444 445
	int state;
	int ptid;
446
	bool timer_running;
447 448
	wait_queue_head_t cpu_run;

A
Alexander Graf 已提交
449
	struct kvm_vcpu_arch_shared *shared;
A
Alexander Graf 已提交
450 451
	unsigned long magic_page_pa; /* phys addr to map the magic page to */
	unsigned long magic_page_ea; /* effect. addr to map the magic page to */
452 453 454

#ifdef CONFIG_KVM_BOOK3S_64_HV
	struct kvm_vcpu_arch_shared shregs;
455

456 457 458 459
	unsigned long pgfault_addr;
	long pgfault_index;
	unsigned long pgfault_hpte[2];

460 461 462
	struct list_head run_list;
	struct task_struct *run_task;
	struct kvm_run *kvm_run;
463
#endif
464 465
};

466 467 468
/* Values for vcpu->arch.state (the 'state' field of struct kvm_vcpu_arch) */
#define KVMPPC_VCPU_STOPPED		0
#define KVMPPC_VCPU_BUSY_IN_HOST	1
#define KVMPPC_VCPU_RUNNABLE		2

471
#endif /* __POWERPC_KVM_HOST_H__ */