kvm_host.h 13.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License, version 2, as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
 *
 * Copyright IBM Corp. 2007
 *
 * Authors: Hollis Blanchard <hollisb@us.ibm.com>
 */

#ifndef __POWERPC_KVM_HOST_H__
#define __POWERPC_KVM_HOST_H__

#include <linux/mutex.h>
A
Alexander Graf 已提交
24 25
#include <linux/hrtimer.h>
#include <linux/interrupt.h>
26 27
#include <linux/types.h>
#include <linux/kvm_types.h>
28 29
#include <linux/threads.h>
#include <linux/spinlock.h>
A
Alexander Graf 已提交
30
#include <linux/kvm_para.h>
31 32
#include <linux/list.h>
#include <linux/atomic.h>
33
#include <asm/kvm_asm.h>
34
#include <asm/processor.h>
35
#include <asm/page.h>
36
#include <asm/cacheflush.h>
37

38 39
/*
 * Compile-time limits on vcpus, virtual cores and memory slots.
 * The vcpu and vcore limits are both defined as NR_CPUS, and the total
 * slot count is defined as the user-visible slot count.
 */
#define KVM_MAX_VCPUS		NR_CPUS
#define KVM_MAX_VCORES		NR_CPUS
#define KVM_USER_MEM_SLOTS 32
#define KVM_MEM_SLOTS_NUM KVM_USER_MEM_SLOTS

/* Only defined when CONFIG_KVM_MMIO is configured. */
#ifdef CONFIG_KVM_MMIO
#define KVM_COALESCED_MMIO_PAGE_OFFSET 1
#endif
46

47
/*
 * MMU notifier support: compiled out when CONFIG_KVM_440 is set.
 * The functions below are only declared here; their definitions live
 * outside this header.
 */
#if !defined(CONFIG_KVM_440)
#include <linux/mmu_notifier.h>

#define KVM_ARCH_WANT_MMU_NOTIFIER

struct kvm;
extern int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
extern int kvm_unmap_hva_range(struct kvm *kvm,
			       unsigned long start, unsigned long end);
extern int kvm_age_hva(struct kvm *kvm, unsigned long hva);
extern int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
extern void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);

#endif

62
/*
 * We don't currently support large pages.
 * Only one page size is advertised; the macro argument is ignored by
 * both function-like macros below.
 */
#define KVM_HPAGE_GFN_SHIFT(x)	0
#define KVM_NR_PAGE_SIZES	1
#define KVM_PAGES_PER_HPAGE(x)	(1UL<<31)
66

67 68
/*
 * HPTEG cache size and hash table geometry.
 * Each HPTEG_HASH_NUM_* value is 1 << the matching HPTEG_HASH_BITS_*
 * value, i.e. the number of buckets for that hash width.
 */
#define HPTEG_CACHE_NUM			(1 << 15)
#define HPTEG_HASH_BITS_PTE		13
#define HPTEG_HASH_BITS_PTE_LONG	12
#define HPTEG_HASH_BITS_VPTE		13
#define HPTEG_HASH_BITS_VPTE_LONG	5
#define HPTEG_HASH_NUM_PTE		(1 << HPTEG_HASH_BITS_PTE)
#define HPTEG_HASH_NUM_PTE_LONG		(1 << HPTEG_HASH_BITS_PTE_LONG)
#define HPTEG_HASH_NUM_VPTE		(1 << HPTEG_HASH_BITS_VPTE)
#define HPTEG_HASH_NUM_VPTE_LONG	(1 << HPTEG_HASH_BITS_VPTE_LONG)
A
Alexander Graf 已提交
76

A
Alexander Graf 已提交
77 78 79
/*
 * Physical Address Mask - allowed range of real mode RAM access.
 * The mask keeps the low 60 bits and clears the top four.
 */
#define KVM_PAM			0x0fffffffffffffffULL

80 81 82 83
/*
 * Forward declarations: the structures below are only referenced
 * through pointers in this header, so incomplete types are enough.
 */
struct kvm;
struct kvm_run;
struct kvm_vcpu;

struct lppaca;
struct slb_shadow;
struct dtl_entry;
87

88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108
/* Per-VM statistics: a single 32-bit counter. */
struct kvm_vm_stat {
	u32 remote_tlb_flush;	/* presumably counts remote TLB flushes - confirm at the update site */
};

/*
 * Per-vcpu statistics: a set of 32-bit counters.
 * The final group of counters exists only when CONFIG_PPC_BOOK3S is set.
 */
struct kvm_vcpu_stat {
	u32 sum_exits;
	u32 mmio_exits;
	u32 dcr_exits;
	u32 signal_exits;
	u32 light_exits;
	/* Account for special types of light exits: */
	u32 itlb_real_miss_exits;
	u32 itlb_virt_miss_exits;
	u32 dtlb_real_miss_exits;
	u32 dtlb_virt_miss_exits;
	u32 syscall_exits;
	u32 isi_exits;
	u32 dsi_exits;
	u32 emulated_inst_exits;
	u32 dec_exits;
	u32 ext_intr_exits;
	u32 halt_wakeup;
	u32 dbell_exits;
	u32 gdbell_exits;
#ifdef CONFIG_PPC_BOOK3S
	u32 pf_storage;
	u32 pf_instruc;
	u32 sp_storage;
	u32 sp_instruc;
	u32 queue_intr;
	u32 ld;
	u32 ld_slow;
	u32 st;
	u32 st_slow;
#endif
};

125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145
/*
 * Exit type identifiers.  Values are assigned implicitly starting at 0,
 * so the order of the enumerators must not change.
 * __NUMBER_OF_KVM_EXIT_TYPES is the count of real entries and is used to
 * size the timing_* arrays in struct kvm_vcpu_arch.
 */
enum kvm_exit_types {
	MMIO_EXITS,
	DCR_EXITS,
	SIGNAL_EXITS,
	ITLB_REAL_MISS_EXITS,
	ITLB_VIRT_MISS_EXITS,
	DTLB_REAL_MISS_EXITS,
	DTLB_VIRT_MISS_EXITS,
	SYSCALL_EXITS,
	ISI_EXITS,
	DSI_EXITS,
	EMULATED_INST_EXITS,
	EMULATED_MTMSRWE_EXITS,
	EMULATED_WRTEE_EXITS,
	EMULATED_MTSPR_EXITS,
	EMULATED_MFSPR_EXITS,
	EMULATED_MTMSR_EXITS,
	EMULATED_MFMSR_EXITS,
	EMULATED_TLBSX_EXITS,
	EMULATED_TLBWE_EXITS,
	EMULATED_RFI_EXITS,
	EMULATED_RFCI_EXITS,
	DEC_EXITS,
	EXT_INTR_EXITS,
	HALT_WAKEUP,
	USR_PR_INST,
	FP_UNAVAIL,
	DEBUG_EXITS,
	TIMEINGUEST,
	DBELL_EXITS,
	GDBELL_EXITS,
	__NUMBER_OF_KVM_EXIT_TYPES
};

/* allow access to big endian 32bit upper/lower parts and 64bit var */
160
struct kvmppc_exit_timing {
161 162 163 164 165 166 167 168
	union {
		u64 tv64;
		struct {
			u32 tbu, tbl;
		} tv32;
	};
};

169 170 171 172 173
/* Pairs a page frame number with an atomic reference count. */
struct kvmppc_pginfo {
	unsigned long pfn;
	atomic_t refcnt;
};

174 175 176 177 178 179 180 181
/*
 * Descriptor for one TCE table; instances are chained through 'list'
 * (struct kvm_arch holds a spapr_tce_tables list head when
 * CONFIG_PPC_BOOK3S_64 is set).
 *
 * 'pages' is a trailing variable-length array, declared as a C99
 * flexible array member rather than a zero-length array.  The structure
 * size and the offset of 'pages' are unchanged; the number of entries
 * is determined by whoever allocates the structure.
 */
struct kvmppc_spapr_tce_table {
	struct list_head list;
	struct kvm *kvm;
	u64 liobn;
	u32 window_size;
	struct page *pages[];
};

182
struct kvmppc_linear_info {
183 184 185 186
	void		*base_virt;
	unsigned long	 base_pfn;
	unsigned long	 npages;
	struct list_head list;
187 188
	atomic_t	 use_count;
	int		 type;
189 190
};

191 192 193
/*
 * The reverse mapping array has one entry for each HPTE,
 * which stores the guest's view of the second word of the HPTE
 * (including the guest physical address of the mapping),
 * plus forward and backward pointers in a doubly-linked ring
 * of HPTEs that map the same host page.  The pointers in this
 * ring are 32-bit HPTE indexes, to save space.
 */
struct revmap_entry {
	unsigned long guest_rpte;
	unsigned int forw, back;
};

204
/*
 * We use the top bit of each memslot->arch.rmap entry as a lock bit,
 * and bit 32 as a present flag.  The bottom 32 bits are the
 * index in the guest HPT of a HPTE that points to the page.
 *
 * The referenced/changed flags are the HPTE_R_R / HPTE_R_C bits shifted
 * up by KVMPPC_RMAP_RC_SHIFT; those HPTE_R_* constants are defined
 * outside this header.
 */
#define KVMPPC_RMAP_LOCK_BIT	63
#define KVMPPC_RMAP_RC_SHIFT	32
#define KVMPPC_RMAP_REFERENCED	(HPTE_R_R << KVMPPC_RMAP_RC_SHIFT)
#define KVMPPC_RMAP_CHANGED	(HPTE_R_C << KVMPPC_RMAP_RC_SHIFT)
#define KVMPPC_RMAP_PRESENT	0x100000000ul
#define KVMPPC_RMAP_INDEX	0xfffffffful

216
/*
 * Low-order bits in memslot->arch.slot_phys[]
 *
 * The low five bits (mask 0x1f) hold a page order; the remaining flags
 * occupy the bits above that.  HPTE_R_I and HPTE_R_W are defined
 * outside this header.
 */
#define KVMPPC_PAGE_ORDER_MASK	0x1f
#define KVMPPC_PAGE_NO_CACHE	HPTE_R_I	/* 0x20 */
#define KVMPPC_PAGE_WRITETHRU	HPTE_R_W	/* 0x40 */
#define KVMPPC_GOT_PAGE		0x80

222
/*
 * Architecture-specific part of a memory slot.
 * Both members exist only when CONFIG_KVM_BOOK3S_64_HV is set; the
 * layout of their entries is described by the KVMPPC_RMAP_* and
 * KVMPPC_PAGE_* / KVMPPC_GOT_PAGE definitions in this header.
 */
struct kvm_arch_memory_slot {
#ifdef CONFIG_KVM_BOOK3S_64_HV
	unsigned long *rmap;
	unsigned long *slot_phys;
#endif /* CONFIG_KVM_BOOK3S_64_HV */
};

229
/*
 * Architecture-specific per-VM state.
 * Only 'lpid' is unconditional.  The large middle section exists when
 * CONFIG_KVM_BOOK3S_64_HV is set, and the TCE table list when
 * CONFIG_PPC_BOOK3S_64 is set.
 */
struct kvm_arch {
	unsigned int lpid;
#ifdef CONFIG_KVM_BOOK3S_64_HV
	unsigned long hpt_virt;
	struct revmap_entry *revmap;
	unsigned int host_lpid;
	unsigned long host_lpcr;
	unsigned long sdr1;
	unsigned long host_sdr1;
	int tlbie_lock;
	unsigned long lpcr;
	unsigned long rmor;
	struct kvmppc_linear_info *rma;
	unsigned long vrma_slb_v;
	int rma_setup_done;
	int using_mmu_notifiers;
	u32 hpt_order;
	atomic_t vcpus_running;
	u32 online_vcores;
	unsigned long hpt_npte;
	unsigned long hpt_mask;
	atomic_t hpte_mod_interest;
	spinlock_t slot_phys_lock;
	cpumask_t need_tlb_flush;
	/* One slot per possible virtual core, sized by KVM_MAX_VCORES. */
	struct kvmppc_vcore *vcores[KVM_MAX_VCORES];
	struct kvmppc_linear_info *hpt_li;
#endif /* CONFIG_KVM_BOOK3S_64_HV */
#ifdef CONFIG_PPC_BOOK3S_64
	struct list_head spapr_tce_tables;
#endif
};

261 262 263 264 265 266 267 268 269
/*
 * Struct for a virtual core.
 * Note: entry_exit_count combines an entry count in the bottom 8 bits
 * and an exit count in the next 8 bits.  This is so that we can
 * atomically increment the entry count iff the exit count is 0
 * without taking the lock.
 */
struct kvmppc_vcore {
	int n_runnable;
270
	int n_busy;
271 272 273 274
	int num_threads;
	int entry_exit_count;
	int n_woken;
	int nap_count;
275
	int napping_threads;
276
	u16 pcpu;
277
	u16 last_cpu;
278
	u8 vcore_state;
279 280 281
	u8 in_guest;
	struct list_head runnable_threads;
	spinlock_t lock;
282
	wait_queue_head_t wq;
283 284 285
	u64 stolen_tb;
	u64 preempt_tb;
	struct kvm_vcpu *runner;
286 287 288 289 290
};

/*
 * Accessors for the two counts packed into vc->entry_exit_count:
 * the entry count is the low 8 bits, the exit count is everything
 * from bit 8 upwards (the shift is not masked).
 */
#define VCORE_ENTRY_COUNT(vc)	((vc)->entry_exit_count & 0xff)
#define VCORE_EXIT_COUNT(vc)	((vc)->entry_exit_count >> 8)

291 292
/* Values for vcore_state (the u8 field in struct kvmppc_vcore) */
#define VCORE_INACTIVE	0
#define VCORE_SLEEPING	1
#define VCORE_STARTING	2
#define VCORE_RUNNING	3
#define VCORE_EXITING	4
297

298 299 300 301 302 303 304 305 306 307 308 309 310
/*
 * Struct used to manage memory for a virtual processor area
 * registered by a PAPR guest.  There are three types of area
 * that a guest can register.
 *
 * struct kvm_vcpu_arch embeds three of these (vpa, dtl and slb_shadow)
 * when CONFIG_KVM_BOOK3S_64_HV is set.
 */
struct kvmppc_vpa {
	void *pinned_addr;	/* Address in kernel linear mapping */
	void *pinned_end;	/* End of region */
	unsigned long next_gpa;	/* Guest phys addr for update */
	unsigned long len;	/* Number of bytes required */
	u8 update_pending;	/* 1 => update pinned_addr from next_gpa */
};

A
Alexander Graf 已提交
311
struct kvmppc_pte {
A
Alexander Graf 已提交
312
	ulong eaddr;
A
Alexander Graf 已提交
313
	u64 vpage;
A
Alexander Graf 已提交
314
	ulong raddr;
A
Alexander Graf 已提交
315 316 317
	bool may_read		: 1;
	bool may_write		: 1;
	bool may_execute	: 1;
A
Alexander Graf 已提交
318 319 320 321 322 323 324 325 326 327 328 329 330 331 332
};

/*
 * Table of MMU operation callbacks.  Every callback takes the vcpu it
 * operates on as its first argument.  The first group is marked as
 * book3s_64 only; the rest applies to book3s in general.
 */
struct kvmppc_mmu {
	/* book3s_64 only */
	void (*slbmte)(struct kvm_vcpu *vcpu, u64 rb, u64 rs);
	u64  (*slbmfee)(struct kvm_vcpu *vcpu, u64 slb_nr);
	u64  (*slbmfev)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbie)(struct kvm_vcpu *vcpu, u64 slb_nr);
	void (*slbia)(struct kvm_vcpu *vcpu);
	/* book3s */
	void (*mtsrin)(struct kvm_vcpu *vcpu, u32 srnum, ulong value);
	u32  (*mfsrin)(struct kvm_vcpu *vcpu, u32 srnum);
	int  (*xlate)(struct kvm_vcpu *vcpu, gva_t eaddr, struct kvmppc_pte *pte, bool data);
	void (*reset_msr)(struct kvm_vcpu *vcpu);
	void (*tlbie)(struct kvm_vcpu *vcpu, ulong addr, bool large);
	int  (*esid_to_vsid)(struct kvm_vcpu *vcpu, ulong esid, u64 *vsid);
	u64  (*ea_to_vp)(struct kvm_vcpu *vcpu, gva_t eaddr, bool data);
	bool (*is_dcbz32)(struct kvm_vcpu *vcpu);
};

338 339 340 341 342 343 344 345 346 347 348 349
/*
 * One SLB entry: four 64-bit words followed by single-bit flags.
 * struct kvm_vcpu_arch holds an array of 64 of these when
 * CONFIG_PPC_BOOK3S is set.
 */
struct kvmppc_slb {
	u64 esid;
	u64 vsid;
	u64 orige;
	u64 origv;
	bool valid	: 1;
	bool Ks		: 1;
	bool Kp		: 1;
	bool nx		: 1;
	bool large	: 1;	/* PTEs are 16MB */
	bool tb		: 1;	/* 1TB segment */
	bool class	: 1;
};

352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372
/*
 * Number of IAC/DAC entries in use: CONFIG_PPC_FSL_BOOK3E selects 2 IAC
 * entries, every other configuration selects 4; DAC is 2 in both cases.
 * The *_MAX values are configuration independent and size the iac[] and
 * dac[] arrays in struct kvmppc_booke_debug_reg.
 */
# ifdef CONFIG_PPC_FSL_BOOK3E
#define KVMPPC_BOOKE_IAC_NUM	2
#define KVMPPC_BOOKE_DAC_NUM	2
# else
#define KVMPPC_BOOKE_IAC_NUM	4
#define KVMPPC_BOOKE_DAC_NUM	2
# endif
#define KVMPPC_BOOKE_MAX_IAC	4
#define KVMPPC_BOOKE_MAX_DAC	2

/*
 * BookE debug register block: the dbcr* control words plus the iac[]
 * and dac[] arrays.  dbcr4 exists only when CONFIG_KVM_E500MC is set.
 * The arrays are always sized by the *_MAX constants, not the
 * configuration-dependent *_NUM ones.
 */
struct kvmppc_booke_debug_reg {
	u32 dbcr0;
	u32 dbcr1;
	u32 dbcr2;
#ifdef CONFIG_KVM_E500MC
	u32 dbcr4;
#endif
	u64 iac[KVMPPC_BOOKE_MAX_IAC];
	u64 dac[KVMPPC_BOOKE_MAX_DAC];
};

373
struct kvm_vcpu_arch {
A
Alexander Graf 已提交
374
	ulong host_stack;
375
	u32 host_pid;
376
#ifdef CONFIG_PPC_BOOK3S
377
	struct kvmppc_slb slb[64];
378
	int slb_max;		/* 1 + index of last valid entry in slb[] */
379
	int slb_nr;		/* total number of entries in SLB */
A
Alexander Graf 已提交
380 381
	struct kvmppc_mmu mmu;
#endif
382

383
	ulong gpr[32];
384

385
	u64 fpr[32];
A
Alexander Graf 已提交
386
	u64 fpscr;
387

388 389 390 391 392 393
#ifdef CONFIG_SPE
	ulong evr[32];
	ulong spefscr;
	ulong host_spefscr;
	u64 acc;
#endif
394 395 396 397 398 399
#ifdef CONFIG_ALTIVEC
	vector128 vr[32];
	vector128 vscr;
#endif

#ifdef CONFIG_VSX
400
	u64 vsr[64];
401 402
#endif

403 404 405 406 407 408 409 410 411 412
#ifdef CONFIG_KVM_BOOKE_HV
	u32 host_mas4;
	u32 host_mas6;
	u32 shadow_epcr;
	u32 shadow_msrp;
	u32 eplc;
	u32 epsc;
	u32 oldpir;
#endif

413 414 415 416 417 418
#if defined(CONFIG_BOOKE)
#if defined(CONFIG_KVM_BOOKE_HV) || defined(CONFIG_64BIT)
	u32 epcr;
#endif
#endif

A
Alexander Graf 已提交
419 420 421 422 423
#ifdef CONFIG_PPC_BOOK3S
	/* For Gekko paired singles */
	u32 qpr[32];
#endif

424 425 426
	ulong pc;
	ulong ctr;
	ulong lr;
427

428
	ulong xer;
429
	u32 cr;
430

431
#ifdef CONFIG_PPC_BOOK3S
A
Alexander Graf 已提交
432
	ulong hflags;
433
	ulong guest_owned_ext;
434 435 436 437 438 439 440
	ulong purr;
	ulong spurr;
	ulong dscr;
	ulong amr;
	ulong uamor;
	u32 ctrl;
	ulong dabr;
441
	ulong cfar;
A
Alexander Graf 已提交
442
#endif
443
	u32 vrsave; /* also USPRG0 */
444
	u32 mmucr;
445
	/* shadow_msr is unused for BookE HV */
S
Scott Wood 已提交
446
	ulong shadow_msr;
447 448 449 450
	ulong csrr0;
	ulong csrr1;
	ulong dsrr0;
	ulong dsrr1;
S
Scott Wood 已提交
451 452 453
	ulong mcsrr0;
	ulong mcsrr1;
	ulong mcsr;
454
	u32 dec;
455
#ifdef CONFIG_BOOKE
456
	u32 decar;
457
#endif
458 459 460
	u32 tbl;
	u32 tbu;
	u32 tcr;
461
	ulong tsr; /* we need to perform set/clr_bits() which requires ulong */
462
	u32 ivor[64];
463
	ulong ivpr;
A
Alexander Graf 已提交
464
	u32 pvr;
465 466

	u32 shadow_pid;
L
Liu Yu 已提交
467
	u32 shadow_pid1;
468
	u32 pid;
469 470
	u32 swap_pid;

471 472
	u32 ccr0;
	u32 ccr1;
473
	u32 dbsr;
474

475
	u64 mmcr[3];
476
	u32 pmc[8];
477

478
#ifdef CONFIG_KVM_EXIT_TIMING
479
	struct mutex exit_timing_lock;
480 481
	struct kvmppc_exit_timing timing_exit;
	struct kvmppc_exit_timing timing_last_enter;
482 483 484 485 486 487 488 489 490 491
	u32 last_exit_type;
	u32 timing_count_type[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_sum_quad_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_min_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_max_duration[__NUMBER_OF_KVM_EXIT_TYPES];
	u64 timing_last_exit;
	struct dentry *debugfs_exit_timing;
#endif

492 493 494 495 496
#ifdef CONFIG_PPC_BOOK3S
	ulong fault_dar;
	u32 fault_dsisr;
#endif

497
#ifdef CONFIG_BOOKE
498 499
	ulong fault_dear;
	ulong fault_esr;
500 501
	ulong queued_dear;
	ulong queued_esr;
502 503
	spinlock_t wdt_lock;
	struct timer_list wdt_timer;
504 505
	u32 tlbcfg[4];
	u32 mmucfg;
506
	u32 epr;
507
	u32 crit_save;
508
	struct kvmppc_booke_debug_reg dbg_reg;
509
#endif
510
	gpa_t paddr_accessed;
511
	gva_t vaddr_accessed;
512 513 514

	u8 io_gpr; /* GPR used as IO source/target */
	u8 mmio_is_bigendian;
A
Alexander Graf 已提交
515
	u8 mmio_sign_extend;
516 517
	u8 dcr_needed;
	u8 dcr_is_write;
518 519
	u8 osi_needed;
	u8 osi_enabled;
A
Alexander Graf 已提交
520
	u8 papr_enabled;
521
	u8 watchdog_enabled;
522 523
	u8 sane;
	u8 cpu_type;
524
	u8 hcall_needed;
525 526
	u8 epr_enabled;
	u8 epr_needed;
527 528 529

	u32 cpr0_cfgaddr; /* holds the last set cpr0_cfgaddr */

A
Alexander Graf 已提交
530 531
	struct hrtimer dec_timer;
	struct tasklet_struct tasklet;
A
Alexander Graf 已提交
532
	u64 dec_jiffies;
533
	u64 dec_expires;
534
	unsigned long pending_exceptions;
535 536
	u8 ceded;
	u8 prodded;
537
	u32 last_inst;
538

539
	wait_queue_head_t *wqp;
540 541
	struct kvmppc_vcore *vcore;
	int ret;
542
	int trap;
543 544
	int state;
	int ptid;
545
	bool timer_running;
546 547
	wait_queue_head_t cpu_run;

A
Alexander Graf 已提交
548
	struct kvm_vcpu_arch_shared *shared;
A
Alexander Graf 已提交
549 550
	unsigned long magic_page_pa; /* phys addr to map the magic page to */
	unsigned long magic_page_ea; /* effect. addr to map the magic page to */
551 552 553

#ifdef CONFIG_KVM_BOOK3S_64_HV
	struct kvm_vcpu_arch_shared shregs;
554

555 556 557 558
	unsigned long pgfault_addr;
	long pgfault_index;
	unsigned long pgfault_hpte[2];

559 560 561
	struct list_head run_list;
	struct task_struct *run_task;
	struct kvm_run *kvm_run;
562
	pgd_t *pgdir;
563 564 565 566 567 568

	spinlock_t vpa_update_lock;
	struct kvmppc_vpa vpa;
	struct kvmppc_vpa dtl;
	struct dtl_entry *dtl_ptr;
	unsigned long dtl_index;
569
	u64 stolen_logged;
570
	struct kvmppc_vpa slb_shadow;
571 572 573 574

	spinlock_t tbacct_lock;
	u64 busy_stolen;
	u64 busy_preempt;
575
#endif
576 577
};

578
/* Values for vcpu->arch.state */
#define KVMPPC_VCPU_NOTREADY		0
#define KVMPPC_VCPU_RUNNABLE		1
#define KVMPPC_VCPU_BUSY_IN_HOST	2
582

583 584 585 586 587 588 589 590
/*
 * Values for vcpu->arch.io_gpr
 *
 * The low five bits (KVM_MMIO_REG_MASK) select a register number; the
 * bits above them (KVM_MMIO_REG_EXT_MASK) select the register class,
 * one of the GPR/FPR/QPR/FQPR codes below.
 *
 * NOTE(review): io_gpr is declared as u8 in struct kvm_vcpu_arch, while
 * KVM_MMIO_REG_EXT_MASK spans bits 5-15.  All class codes defined here
 * fit in 8 bits, but confirm the intended field width before adding
 * codes above 0x00e0.
 */
#define KVM_MMIO_REG_MASK	0x001f
#define KVM_MMIO_REG_EXT_MASK	0xffe0
#define KVM_MMIO_REG_GPR	0x0000
#define KVM_MMIO_REG_FPR	0x0020
#define KVM_MMIO_REG_QPR	0x0040
#define KVM_MMIO_REG_FQPR	0x0060

591
/*
 * NOTE(review): presumably tells generic KVM code that this
 * architecture supplies its own vcpu wait-queue pointer (see 'wqp' in
 * struct kvm_vcpu_arch) - confirm against the code that tests this macro.
 */
#define __KVM_HAVE_ARCH_WQP
592

593
#endif /* __POWERPC_KVM_HOST_H__ */