book3s.c 26.9 KB
Newer Older
A
Alexander Graf 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18
/*
 * Copyright (C) 2009. SUSE Linux Products GmbH. All rights reserved.
 *
 * Authors:
 *    Alexander Graf <agraf@suse.de>
 *    Kevin Wolf <mail@kevin-wolf.de>
 *
 * Description:
 * This file is derived from arch/powerpc/kvm/44x.c,
 * by Hollis Blanchard <hollisb@us.ibm.com>.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License, version 2, as
 * published by the Free Software Foundation.
 */

#include <linux/kvm_host.h>
#include <linux/err.h>
19
#include <linux/export.h>
20
#include <linux/slab.h>
21 22
#include <linux/module.h>
#include <linux/miscdevice.h>
23 24 25 26
#include <linux/gfp.h>
#include <linux/sched.h>
#include <linux/vmalloc.h>
#include <linux/highmem.h>
A
Alexander Graf 已提交
27 28 29 30

#include <asm/reg.h>
#include <asm/cputable.h>
#include <asm/cacheflush.h>
31
#include <linux/uaccess.h>
A
Alexander Graf 已提交
32 33 34 35
#include <asm/io.h>
#include <asm/kvm_ppc.h>
#include <asm/kvm_book3s.h>
#include <asm/mmu_context.h>
36
#include <asm/page.h>
37
#include <asm/xive.h>
A
Alexander Graf 已提交
38

39
#include "book3s.h"
40 41
#include "trace.h"

A
Alexander Graf 已提交
42 43 44
/*
 * Expands to two comma-separated initializer values for a debugfs_entries[]
 * row: the byte offset of stat.x within struct kvm_vcpu, followed by the
 * KVM_STAT_VCPU constant.
 */
#define VCPU_STAT(x) offsetof(struct kvm_vcpu, stat.x), KVM_STAT_VCPU

/* #define EXIT_DEBUG */
45

A
Alexander Graf 已提交
46 47 48 49 50 51 52 53 54
struct kvm_stats_debugfs_item debugfs_entries[] = {
	{ "exits",       VCPU_STAT(sum_exits) },
	{ "mmio",        VCPU_STAT(mmio_exits) },
	{ "sig",         VCPU_STAT(signal_exits) },
	{ "sysc",        VCPU_STAT(syscall_exits) },
	{ "inst_emu",    VCPU_STAT(emulated_inst_exits) },
	{ "dec",         VCPU_STAT(dec_exits) },
	{ "ext_intr",    VCPU_STAT(ext_intr_exits) },
	{ "queue_intr",  VCPU_STAT(queue_intr) },
55 56 57
	{ "halt_poll_success_ns",	VCPU_STAT(halt_poll_success_ns) },
	{ "halt_poll_fail_ns",		VCPU_STAT(halt_poll_fail_ns) },
	{ "halt_wait_ns",		VCPU_STAT(halt_wait_ns) },
58
	{ "halt_successful_poll", VCPU_STAT(halt_successful_poll), },
59
	{ "halt_attempted_poll", VCPU_STAT(halt_attempted_poll), },
60
	{ "halt_successful_wait",	VCPU_STAT(halt_successful_wait) },
61
	{ "halt_poll_invalid", VCPU_STAT(halt_poll_invalid) },
A
Alexander Graf 已提交
62 63 64 65 66 67 68 69 70
	{ "halt_wakeup", VCPU_STAT(halt_wakeup) },
	{ "pf_storage",  VCPU_STAT(pf_storage) },
	{ "sp_storage",  VCPU_STAT(sp_storage) },
	{ "pf_instruc",  VCPU_STAT(pf_instruc) },
	{ "sp_instruc",  VCPU_STAT(sp_instruc) },
	{ "ld",          VCPU_STAT(ld) },
	{ "ld_slow",     VCPU_STAT(ld_slow) },
	{ "st",          VCPU_STAT(st) },
	{ "st_slow",     VCPU_STAT(st_slow) },
71 72 73
	{ "pthru_all",       VCPU_STAT(pthru_all) },
	{ "pthru_host",      VCPU_STAT(pthru_host) },
	{ "pthru_bad_aff",   VCPU_STAT(pthru_bad_aff) },
A
Alexander Graf 已提交
74 75 76
	{ NULL }
};

77 78 79 80
void kvmppc_unfixup_split_real(struct kvm_vcpu *vcpu)
{
	if (vcpu->arch.hflags & BOOK3S_HFLAG_SPLIT_HACK) {
		ulong pc = kvmppc_get_pc(vcpu);
81
		ulong lr = kvmppc_get_lr(vcpu);
82 83
		if ((pc & SPLIT_HACK_MASK) == SPLIT_HACK_OFFS)
			kvmppc_set_pc(vcpu, pc & ~SPLIT_HACK_MASK);
84 85
		if ((lr & SPLIT_HACK_MASK) == SPLIT_HACK_OFFS)
			kvmppc_set_lr(vcpu, lr & ~SPLIT_HACK_MASK);
86 87 88 89 90
		vcpu->arch.hflags &= ~BOOK3S_HFLAG_SPLIT_HACK;
	}
}
EXPORT_SYMBOL_GPL(kvmppc_unfixup_split_real);

91 92
static inline unsigned long kvmppc_interrupt_offset(struct kvm_vcpu *vcpu)
{
93
	if (!is_kvmppc_hv_enabled(vcpu->kvm))
94 95 96 97 98 99 100
		return to_book3s(vcpu)->hior;
	return 0;
}

static inline void kvmppc_update_int_pending(struct kvm_vcpu *vcpu,
			unsigned long pending_now, unsigned long old_pending)
{
101
	if (is_kvmppc_hv_enabled(vcpu->kvm))
102 103
		return;
	if (pending_now)
104
		kvmppc_set_int_pending(vcpu, 1);
105
	else if (old_pending)
106
		kvmppc_set_int_pending(vcpu, 0);
107 108 109 110 111 112 113 114
}

static inline bool kvmppc_critical_section(struct kvm_vcpu *vcpu)
{
	ulong crit_raw;
	ulong crit_r1;
	bool crit;

115
	if (is_kvmppc_hv_enabled(vcpu->kvm))
116 117
		return false;

118
	crit_raw = kvmppc_get_critical(vcpu);
119 120 121
	crit_r1 = kvmppc_get_gpr(vcpu, 1);

	/* Truncate crit indicators in 32 bit mode */
122
	if (!(kvmppc_get_msr(vcpu) & MSR_SF)) {
123 124 125 126 127 128 129
		crit_raw &= 0xffffffff;
		crit_r1 &= 0xffffffff;
	}

	/* Critical section when crit == r1 */
	crit = (crit_raw == crit_r1);
	/* ... and we're in supervisor mode */
130
	crit = crit && !(kvmppc_get_msr(vcpu) & MSR_PR);
131 132 133 134

	return crit;
}

A
Alexander Graf 已提交
135 136
/*
 * Redirect the guest to interrupt vector @vec.
 *
 * After undoing any SPLIT_HACK fixup, the current PC is saved to SRR0 and
 * the current MSR, with the bits in 0x783f0000 cleared and @flags OR-ed in,
 * is saved to SRR1.  PC then becomes the interrupt offset plus @vec and the
 * MMU's reset_msr() hook is invoked.
 */
void kvmppc_inject_interrupt(struct kvm_vcpu *vcpu, int vec, u64 flags)
{
	u64 saved_msr;
	unsigned long target;

	kvmppc_unfixup_split_real(vcpu);

	kvmppc_set_srr0(vcpu, kvmppc_get_pc(vcpu));

	saved_msr = (kvmppc_get_msr(vcpu) & ~0x783f0000ul) | flags;
	kvmppc_set_srr1(vcpu, saved_msr);

	target = kvmppc_interrupt_offset(vcpu) + vec;
	kvmppc_set_pc(vcpu, target);

	vcpu->arch.mmu.reset_msr(vcpu);
}

144
static int kvmppc_book3s_vec2irqprio(unsigned int vec)
A
Alexander Graf 已提交
145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163
{
	unsigned int prio;

	switch (vec) {
	case 0x100: prio = BOOK3S_IRQPRIO_SYSTEM_RESET;		break;
	case 0x200: prio = BOOK3S_IRQPRIO_MACHINE_CHECK;	break;
	case 0x300: prio = BOOK3S_IRQPRIO_DATA_STORAGE;		break;
	case 0x380: prio = BOOK3S_IRQPRIO_DATA_SEGMENT;		break;
	case 0x400: prio = BOOK3S_IRQPRIO_INST_STORAGE;		break;
	case 0x480: prio = BOOK3S_IRQPRIO_INST_SEGMENT;		break;
	case 0x500: prio = BOOK3S_IRQPRIO_EXTERNAL;		break;
	case 0x600: prio = BOOK3S_IRQPRIO_ALIGNMENT;		break;
	case 0x700: prio = BOOK3S_IRQPRIO_PROGRAM;		break;
	case 0x800: prio = BOOK3S_IRQPRIO_FP_UNAVAIL;		break;
	case 0x900: prio = BOOK3S_IRQPRIO_DECREMENTER;		break;
	case 0xc00: prio = BOOK3S_IRQPRIO_SYSCALL;		break;
	case 0xd00: prio = BOOK3S_IRQPRIO_DEBUG;		break;
	case 0xf20: prio = BOOK3S_IRQPRIO_ALTIVEC;		break;
	case 0xf40: prio = BOOK3S_IRQPRIO_VSX;			break;
164
	case 0xf60: prio = BOOK3S_IRQPRIO_FAC_UNAVAIL;		break;
A
Alexander Graf 已提交
165 166 167
	default:    prio = BOOK3S_IRQPRIO_MAX;			break;
	}

168 169 170
	return prio;
}

171
void kvmppc_book3s_dequeue_irqprio(struct kvm_vcpu *vcpu,
172 173
					  unsigned int vec)
{
174 175
	unsigned long old_pending = vcpu->arch.pending_exceptions;

176 177
	clear_bit(kvmppc_book3s_vec2irqprio(vec),
		  &vcpu->arch.pending_exceptions);
178

179 180
	kvmppc_update_int_pending(vcpu, vcpu->arch.pending_exceptions,
				  old_pending);
181 182
}

183 184 185 186 187 188
/*
 * Mark the interrupt for vector @vec as pending on @vcpu and bump the
 * queue_intr statistic.
 */
void kvmppc_book3s_queue_irqprio(struct kvm_vcpu *vcpu, unsigned int vec)
{
	int prio = kvmppc_book3s_vec2irqprio(vec);

	vcpu->stat.queue_intr++;
	set_bit(prio, &vcpu->arch.pending_exceptions);

#ifdef EXIT_DEBUG
	printk(KERN_INFO "Queueing interrupt %x\n", vec);
#endif
}
193
EXPORT_SYMBOL_GPL(kvmppc_book3s_queue_irqprio);
A
Alexander Graf 已提交
194

195
/*
 * Raise a program interrupt on @vcpu with @flags.  The interrupt is
 * injected immediately rather than being queued as pending.
 */
void kvmppc_core_queue_program(struct kvm_vcpu *vcpu, ulong flags)
{
	const int vec = BOOK3S_INTERRUPT_PROGRAM;

	kvmppc_inject_interrupt(vcpu, vec, flags);
}
200
EXPORT_SYMBOL_GPL(kvmppc_core_queue_program);
A
Alexander Graf 已提交
201

202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219
/* Inject an FP-unavailable interrupt into @vcpu with no extra SRR1 flags. */
void kvmppc_core_queue_fpunavail(struct kvm_vcpu *vcpu)
{
	/* might as well deliver this straight away */
	kvmppc_inject_interrupt(vcpu, BOOK3S_INTERRUPT_FP_UNAVAIL, 0);
}

/* Inject an Altivec-unavailable interrupt into @vcpu with no extra SRR1 flags. */
void kvmppc_core_queue_vec_unavail(struct kvm_vcpu *vcpu)
{
	/* might as well deliver this straight away */
	kvmppc_inject_interrupt(vcpu, BOOK3S_INTERRUPT_ALTIVEC, 0);
}

/* Inject a VSX-unavailable interrupt into @vcpu with no extra SRR1 flags. */
void kvmppc_core_queue_vsx_unavail(struct kvm_vcpu *vcpu)
{
	/* might as well deliver this straight away */
	kvmppc_inject_interrupt(vcpu, BOOK3S_INTERRUPT_VSX, 0);
}

A
Alexander Graf 已提交
220 221 222 223
/* Mark the decrementer interrupt as pending on @vcpu. */
void kvmppc_core_queue_dec(struct kvm_vcpu *vcpu)
{
	kvmppc_book3s_queue_irqprio(vcpu, BOOK3S_INTERRUPT_DECREMENTER);
}
224
EXPORT_SYMBOL_GPL(kvmppc_core_queue_dec);
A
Alexander Graf 已提交
225 226 227

int kvmppc_core_pending_dec(struct kvm_vcpu *vcpu)
{
228
	return test_bit(BOOK3S_IRQPRIO_DECREMENTER, &vcpu->arch.pending_exceptions);
A
Alexander Graf 已提交
229
}
230
EXPORT_SYMBOL_GPL(kvmppc_core_pending_dec);
A
Alexander Graf 已提交
231

232 233 234 235
/* Clear a pending decrementer interrupt on @vcpu. */
void kvmppc_core_dequeue_dec(struct kvm_vcpu *vcpu)
{
	kvmppc_book3s_dequeue_irqprio(vcpu, BOOK3S_INTERRUPT_DECREMENTER);
}
236
EXPORT_SYMBOL_GPL(kvmppc_core_dequeue_dec);
237

A
Alexander Graf 已提交
238 239 240
void kvmppc_core_queue_external(struct kvm_vcpu *vcpu,
                                struct kvm_interrupt *irq)
{
241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264
	/*
	 * This case (KVM_INTERRUPT_SET) should never actually arise for
	 * a pseries guest (because pseries guests expect their interrupt
	 * controllers to continue asserting an external interrupt request
	 * until it is acknowledged at the interrupt controller), but is
	 * included to avoid ABI breakage and potentially for other
	 * sorts of guest.
	 *
	 * There is a subtlety here: HV KVM does not test the
	 * external_oneshot flag in the code that synthesizes
	 * external interrupts for the guest just before entering
	 * the guest.  That is OK even if userspace did do a
	 * KVM_INTERRUPT_SET on a pseries guest vcpu, because the
	 * caller (kvm_vcpu_ioctl_interrupt) does a kvm_vcpu_kick()
	 * which ends up doing a smp_send_reschedule(), which will
	 * pull the guest all the way out to the host, meaning that
	 * we will call kvmppc_core_prepare_to_enter() before entering
	 * the guest again, and that will handle the external_oneshot
	 * flag correctly.
	 */
	if (irq->irq == KVM_INTERRUPT_SET)
		vcpu->arch.external_oneshot = 1;

	kvmppc_book3s_queue_irqprio(vcpu, BOOK3S_INTERRUPT_EXTERNAL);
A
Alexander Graf 已提交
265 266
}

267
void kvmppc_core_dequeue_external(struct kvm_vcpu *vcpu)
268 269 270 271
{
	kvmppc_book3s_dequeue_irqprio(vcpu, BOOK3S_INTERRUPT_EXTERNAL);
}

272 273 274 275 276
/*
 * Raise a data storage interrupt on @vcpu.
 *
 * @dar is written to the guest's DAR and @flags to its DSISR before the
 * interrupt is injected (immediately, with no extra SRR1 flags).
 */
void kvmppc_core_queue_data_storage(struct kvm_vcpu *vcpu, ulong dar,
				    ulong flags)
{
	/* Fault details first, so the guest handler can see them */
	kvmppc_set_dar(vcpu, dar);
	kvmppc_set_dsisr(vcpu, flags);

	kvmppc_inject_interrupt(vcpu, BOOK3S_INTERRUPT_DATA_STORAGE, 0);
}
279
EXPORT_SYMBOL_GPL(kvmppc_core_queue_data_storage);
280 281 282

/*
 * Raise an instruction storage interrupt on @vcpu, injected immediately
 * with @flags passed through to kvmppc_inject_interrupt().
 */
void kvmppc_core_queue_inst_storage(struct kvm_vcpu *vcpu, ulong flags)
{
	const int vec = BOOK3S_INTERRUPT_INST_STORAGE;

	kvmppc_inject_interrupt(vcpu, vec, flags);
}
285
EXPORT_SYMBOL_GPL(kvmppc_core_queue_inst_storage);
286

T
Thomas Huth 已提交
287 288
static int kvmppc_book3s_irqprio_deliver(struct kvm_vcpu *vcpu,
					 unsigned int priority)
A
Alexander Graf 已提交
289 290 291
{
	int deliver = 1;
	int vec = 0;
292
	bool crit = kvmppc_critical_section(vcpu);
A
Alexander Graf 已提交
293 294 295

	switch (priority) {
	case BOOK3S_IRQPRIO_DECREMENTER:
296
		deliver = (kvmppc_get_msr(vcpu) & MSR_EE) && !crit;
A
Alexander Graf 已提交
297 298 299
		vec = BOOK3S_INTERRUPT_DECREMENTER;
		break;
	case BOOK3S_IRQPRIO_EXTERNAL:
300
		deliver = (kvmppc_get_msr(vcpu) & MSR_EE) && !crit;
A
Alexander Graf 已提交
301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344
		vec = BOOK3S_INTERRUPT_EXTERNAL;
		break;
	case BOOK3S_IRQPRIO_SYSTEM_RESET:
		vec = BOOK3S_INTERRUPT_SYSTEM_RESET;
		break;
	case BOOK3S_IRQPRIO_MACHINE_CHECK:
		vec = BOOK3S_INTERRUPT_MACHINE_CHECK;
		break;
	case BOOK3S_IRQPRIO_DATA_STORAGE:
		vec = BOOK3S_INTERRUPT_DATA_STORAGE;
		break;
	case BOOK3S_IRQPRIO_INST_STORAGE:
		vec = BOOK3S_INTERRUPT_INST_STORAGE;
		break;
	case BOOK3S_IRQPRIO_DATA_SEGMENT:
		vec = BOOK3S_INTERRUPT_DATA_SEGMENT;
		break;
	case BOOK3S_IRQPRIO_INST_SEGMENT:
		vec = BOOK3S_INTERRUPT_INST_SEGMENT;
		break;
	case BOOK3S_IRQPRIO_ALIGNMENT:
		vec = BOOK3S_INTERRUPT_ALIGNMENT;
		break;
	case BOOK3S_IRQPRIO_PROGRAM:
		vec = BOOK3S_INTERRUPT_PROGRAM;
		break;
	case BOOK3S_IRQPRIO_VSX:
		vec = BOOK3S_INTERRUPT_VSX;
		break;
	case BOOK3S_IRQPRIO_ALTIVEC:
		vec = BOOK3S_INTERRUPT_ALTIVEC;
		break;
	case BOOK3S_IRQPRIO_FP_UNAVAIL:
		vec = BOOK3S_INTERRUPT_FP_UNAVAIL;
		break;
	case BOOK3S_IRQPRIO_SYSCALL:
		vec = BOOK3S_INTERRUPT_SYSCALL;
		break;
	case BOOK3S_IRQPRIO_DEBUG:
		vec = BOOK3S_INTERRUPT_TRACE;
		break;
	case BOOK3S_IRQPRIO_PERFORMANCE_MONITOR:
		vec = BOOK3S_INTERRUPT_PERFMON;
		break;
345 346 347
	case BOOK3S_IRQPRIO_FAC_UNAVAIL:
		vec = BOOK3S_INTERRUPT_FAC_UNAVAIL;
		break;
A
Alexander Graf 已提交
348 349 350 351 352 353 354 355 356 357 358
	default:
		deliver = 0;
		printk(KERN_ERR "KVM: Unknown interrupt: 0x%x\n", priority);
		break;
	}

#if 0
	printk(KERN_INFO "Deliver interrupt 0x%x? %x\n", vec, deliver);
#endif

	if (deliver)
359
		kvmppc_inject_interrupt(vcpu, vec, 0);
A
Alexander Graf 已提交
360 361 362 363

	return deliver;
}

364 365 366 367 368 369 370 371 372
/*
 * This function determines if an irqprio should be cleared once issued.
 */
static bool clear_irqprio(struct kvm_vcpu *vcpu, unsigned int priority)
{
	switch (priority) {
		case BOOK3S_IRQPRIO_DECREMENTER:
			/* DEC interrupts get cleared by mtdec */
			return false;
373 374 375 376 377 378 379 380 381 382
		case BOOK3S_IRQPRIO_EXTERNAL:
			/*
			 * External interrupts get cleared by userspace
			 * except when set by the KVM_INTERRUPT ioctl with
			 * KVM_INTERRUPT_SET (not KVM_INTERRUPT_SET_LEVEL).
			 */
			if (vcpu->arch.external_oneshot) {
				vcpu->arch.external_oneshot = 0;
				return true;
			}
383 384 385 386 387 388
			return false;
	}

	return true;
}

389
int kvmppc_core_prepare_to_enter(struct kvm_vcpu *vcpu)
A
Alexander Graf 已提交
390 391
{
	unsigned long *pending = &vcpu->arch.pending_exceptions;
392
	unsigned long old_pending = vcpu->arch.pending_exceptions;
A
Alexander Graf 已提交
393 394 395 396 397 398 399
	unsigned int priority;

#ifdef EXIT_DEBUG
	if (vcpu->arch.pending_exceptions)
		printk(KERN_EMERG "KVM: Check pending: %lx\n", vcpu->arch.pending_exceptions);
#endif
	priority = __ffs(*pending);
A
Alexander Graf 已提交
400
	while (priority < BOOK3S_IRQPRIO_MAX) {
401
		if (kvmppc_book3s_irqprio_deliver(vcpu, priority) &&
402
		    clear_irqprio(vcpu, priority)) {
A
Alexander Graf 已提交
403 404 405 406 407 408 409 410
			clear_bit(priority, &vcpu->arch.pending_exceptions);
			break;
		}

		priority = find_next_bit(pending,
					 BITS_PER_BYTE * sizeof(*pending),
					 priority + 1);
	}
411 412

	/* Tell the guest about our interrupt status */
413
	kvmppc_update_int_pending(vcpu, *pending, old_pending);
414 415

	return 0;
A
Alexander Graf 已提交
416
}
417
EXPORT_SYMBOL_GPL(kvmppc_core_prepare_to_enter);
A
Alexander Graf 已提交
418

D
Dan Williams 已提交
419
/*
 * Translate guest physical address @gpa into a host pfn.
 *
 * If a magic page address is configured and the page-aligned @gpa matches
 * it, the pfn of the vcpu's shared page is returned with a page reference
 * taken, and *@writable (when @writable is non-NULL) is set to true.
 * Otherwise the lookup is delegated to gfn_to_pfn_prot().
 */
kvm_pfn_t kvmppc_gpa_to_pfn(struct kvm_vcpu *vcpu, gpa_t gpa, bool writing,
			bool *writable)
{
	ulong magic_pa = vcpu->arch.magic_page_pa & KVM_PAM;
	gfn_t gfn = gpa >> PAGE_SHIFT;

	/* Only the low 32 bits of the magic address count in 32 bit mode */
	if (!(kvmppc_get_msr(vcpu) & MSR_SF))
		magic_pa = (uint32_t)magic_pa;

	/* Magic page override */
	gpa &= ~0xFFFULL;
	if (unlikely(magic_pa) && unlikely((gpa & KVM_PAM) == magic_pa)) {
		ulong shared_va = ((ulong)vcpu->arch.shared) & PAGE_MASK;
		kvm_pfn_t shared_pfn;

		shared_pfn = (kvm_pfn_t)virt_to_phys((void *)shared_va) >> PAGE_SHIFT;
		get_page(pfn_to_page(shared_pfn));

		if (writable)
			*writable = true;

		return shared_pfn;
	}

	return gfn_to_pfn_prot(vcpu->kvm, gfn, writing, writable);
}
443
EXPORT_SYMBOL_GPL(kvmppc_gpa_to_pfn);
444

445 446
/*
 * Translate effective address @eaddr for @vcpu into @pte.
 *
 * With relocation enabled for the access type (MSR_DR for data, MSR_IR for
 * instructions) the vcpu MMU's xlate() hook does the work and its result is
 * returned.  Otherwise @pte is filled with a real-mode mapping granting
 * read, write and execute, and 0 is returned.  For an instruction access
 * with only MSR_DR set, the SPLIT_HACK_MASK bits are removed from the real
 * address when the SPLIT_HACK hflag is active and @eaddr carries
 * SPLIT_HACK_OFFS.
 */
int kvmppc_xlate(struct kvm_vcpu *vcpu, ulong eaddr, enum xlate_instdata xlid,
		 enum xlate_readwrite xlrw, struct kvmppc_pte *pte)
{
	bool data = (xlid == XLATE_DATA);
	bool iswrite = (xlrw == XLATE_WRITE);
	int relocated = (kvmppc_get_msr(vcpu) & (data ? MSR_DR : MSR_IR));

	if (relocated)
		return vcpu->arch.mmu.xlate(vcpu, eaddr, pte, data, iswrite);

	/* Real mode: effective address maps straight to a real address */
	pte->eaddr = eaddr;
	pte->raddr = eaddr & KVM_PAM;
	pte->vpage = VSID_REAL | eaddr >> 12;
	pte->may_read = true;
	pte->may_write = true;
	pte->may_execute = true;

	if ((kvmppc_get_msr(vcpu) & (MSR_IR | MSR_DR)) == MSR_DR &&
	    !data &&
	    (vcpu->arch.hflags & BOOK3S_HFLAG_SPLIT_HACK) &&
	    ((eaddr & SPLIT_HACK_MASK) == SPLIT_HACK_OFFS)) {
		pte->raddr &= ~SPLIT_HACK_MASK;
	}

	return 0;
}

475 476
/*
 * Load a 32-bit instruction from guest memory into *@inst.
 *
 * The instruction is read at the vcpu's current PC, or 4 bytes before it
 * when @type is INST_SC.  Returns EMULATE_DONE if kvmppc_ld() reported
 * EMULATE_DONE, and EMULATE_AGAIN for any other result.
 */
int kvmppc_load_last_inst(struct kvm_vcpu *vcpu,
		enum instruction_fetch_type type, u32 *inst)
{
	ulong fetch_addr = kvmppc_get_pc(vcpu);

	if (type == INST_SC)
		fetch_addr -= 4;

	if (kvmppc_ld(vcpu, &fetch_addr, sizeof(u32), inst, false) != EMULATE_DONE)
		return EMULATE_AGAIN;

	return EMULATE_DONE;
}
EXPORT_SYMBOL_GPL(kvmppc_load_last_inst);

A
Alexander Graf 已提交
492 493 494 495 496
/* No setup work is done here; always returns 0. */
int kvm_arch_vcpu_setup(struct kvm_vcpu *vcpu)
{
	return 0;
}

497 498 499 500 501 502 503 504 505
/* No sub-architecture vcpu initialisation is done here; always returns 0. */
int kvmppc_subarch_vcpu_init(struct kvm_vcpu *vcpu)
{
	return 0;
}

/* Counterpart of kvmppc_subarch_vcpu_init(); intentionally empty. */
void kvmppc_subarch_vcpu_uninit(struct kvm_vcpu *vcpu)
{
}

506 507 508
/*
 * Fetch the special registers of @vcpu into @sregs via the VM's
 * kvm_ops->get_sregs() hook, bracketed by vcpu_load()/vcpu_put().
 * Returns the hook's result.
 */
int kvm_arch_vcpu_ioctl_get_sregs(struct kvm_vcpu *vcpu,
				  struct kvm_sregs *sregs)
{
	int rc;

	vcpu_load(vcpu);
	rc = vcpu->kvm->arch.kvm_ops->get_sregs(vcpu, sregs);
	vcpu_put(vcpu);

	return rc;
}

/*
 * Apply the special registers in @sregs to @vcpu via the VM's
 * kvm_ops->set_sregs() hook, bracketed by vcpu_load()/vcpu_put().
 * Returns the hook's result.
 */
int kvm_arch_vcpu_ioctl_set_sregs(struct kvm_vcpu *vcpu,
				  struct kvm_sregs *sregs)
{
	int rc;

	vcpu_load(vcpu);
	rc = vcpu->kvm->arch.kvm_ops->set_sregs(vcpu, sregs);
	vcpu_put(vcpu);

	return rc;
}

A
Alexander Graf 已提交
530 531 532 533
int kvm_arch_vcpu_ioctl_get_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs)
{
	int i;

534
	regs->pc = kvmppc_get_pc(vcpu);
535
	regs->cr = kvmppc_get_cr(vcpu);
536 537
	regs->ctr = kvmppc_get_ctr(vcpu);
	regs->lr = kvmppc_get_lr(vcpu);
538
	regs->xer = kvmppc_get_xer(vcpu);
539 540 541
	regs->msr = kvmppc_get_msr(vcpu);
	regs->srr0 = kvmppc_get_srr0(vcpu);
	regs->srr1 = kvmppc_get_srr1(vcpu);
A
Alexander Graf 已提交
542
	regs->pid = vcpu->arch.pid;
543 544 545 546 547 548 549 550
	regs->sprg0 = kvmppc_get_sprg0(vcpu);
	regs->sprg1 = kvmppc_get_sprg1(vcpu);
	regs->sprg2 = kvmppc_get_sprg2(vcpu);
	regs->sprg3 = kvmppc_get_sprg3(vcpu);
	regs->sprg4 = kvmppc_get_sprg4(vcpu);
	regs->sprg5 = kvmppc_get_sprg5(vcpu);
	regs->sprg6 = kvmppc_get_sprg6(vcpu);
	regs->sprg7 = kvmppc_get_sprg7(vcpu);
A
Alexander Graf 已提交
551 552

	for (i = 0; i < ARRAY_SIZE(regs->gpr); i++)
553
		regs->gpr[i] = kvmppc_get_gpr(vcpu, i);
A
Alexander Graf 已提交
554 555 556 557 558 559 560 561

	return 0;
}

/*
 * Load the general register state in @regs into @vcpu: pc, cr, ctr, lr,
 * xer, msr, srr0/srr1, sprg0-sprg7 and finally all GPRs.  regs->pid is not
 * consumed.  Always returns 0.
 */
int kvm_arch_vcpu_ioctl_set_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs)
{
	int n;

	kvmppc_set_pc(vcpu, regs->pc);
	kvmppc_set_cr(vcpu, regs->cr);
	kvmppc_set_ctr(vcpu, regs->ctr);
	kvmppc_set_lr(vcpu, regs->lr);
	kvmppc_set_xer(vcpu, regs->xer);
	kvmppc_set_msr(vcpu, regs->msr);

	kvmppc_set_srr0(vcpu, regs->srr0);
	kvmppc_set_srr1(vcpu, regs->srr1);

	kvmppc_set_sprg0(vcpu, regs->sprg0);
	kvmppc_set_sprg1(vcpu, regs->sprg1);
	kvmppc_set_sprg2(vcpu, regs->sprg2);
	kvmppc_set_sprg3(vcpu, regs->sprg3);
	kvmppc_set_sprg4(vcpu, regs->sprg4);
	kvmppc_set_sprg5(vcpu, regs->sprg5);
	kvmppc_set_sprg6(vcpu, regs->sprg6);
	kvmppc_set_sprg7(vcpu, regs->sprg7);

	for (n = 0; n < ARRAY_SIZE(regs->gpr); n++)
		kvmppc_set_gpr(vcpu, n, regs->gpr[n]);

	return 0;
}

/* Not implemented here; always returns -ENOTSUPP. */
int kvm_arch_vcpu_ioctl_get_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu)
{
	return -ENOTSUPP;
}

/* Not implemented here; always returns -ENOTSUPP. */
int kvm_arch_vcpu_ioctl_set_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu)
{
	return -ENOTSUPP;
}

595 596
/*
 * Read the register identified by @id from @vcpu into @val.
 *
 * The request is first offered to the VM's kvm_ops->get_one_reg() hook.
 * Any result other than -EINVAL is returned as-is.  On -EINVAL the
 * registers handled in this function are tried.
 *
 * For the registers handled here the return value is 0 on success, -ENXIO
 * when the backing facility is missing (no VSX CPU feature, or neither ICP
 * nor XIVE vcpu state), and -EINVAL when @id is not recognised.
 */
int kvmppc_get_one_reg(struct kvm_vcpu *vcpu, u64 id,
			union kvmppc_one_reg *val)
{
	long int idx;
	int r;

	r = vcpu->kvm->arch.kvm_ops->get_one_reg(vcpu, id, val);
	if (r != -EINVAL)
		return r;

	/* The backend did not recognise @id; try the common registers */
	r = 0;
	switch (id) {
	case KVM_REG_PPC_DAR:
		*val = get_reg_val(id, kvmppc_get_dar(vcpu));
		break;
	case KVM_REG_PPC_DSISR:
		*val = get_reg_val(id, kvmppc_get_dsisr(vcpu));
		break;
	case KVM_REG_PPC_FPR0 ... KVM_REG_PPC_FPR31:
		idx = id - KVM_REG_PPC_FPR0;
		*val = get_reg_val(id, VCPU_FPR(vcpu, idx));
		break;
	case KVM_REG_PPC_FPSCR:
		*val = get_reg_val(id, vcpu->arch.fp.fpscr);
		break;
#ifdef CONFIG_VSX
	case KVM_REG_PPC_VSR0 ... KVM_REG_PPC_VSR31:
		if (!cpu_has_feature(CPU_FTR_VSX)) {
			r = -ENXIO;
			break;
		}
		idx = id - KVM_REG_PPC_VSR0;
		val->vsxval[0] = vcpu->arch.fp.fpr[idx][0];
		val->vsxval[1] = vcpu->arch.fp.fpr[idx][1];
		break;
#endif /* CONFIG_VSX */
	case KVM_REG_PPC_DEBUG_INST:
		*val = get_reg_val(id, INS_TW);
		break;
#ifdef CONFIG_KVM_XICS
	case KVM_REG_PPC_ICP_STATE:
		if (!vcpu->arch.icp && !vcpu->arch.xive_vcpu)
			r = -ENXIO;
		else if (xics_on_xive())
			*val = get_reg_val(id, kvmppc_xive_get_icp(vcpu));
		else
			*val = get_reg_val(id, kvmppc_xics_get_icp(vcpu));
		break;
#endif /* CONFIG_KVM_XICS */
	case KVM_REG_PPC_FSCR:
		*val = get_reg_val(id, vcpu->arch.fscr);
		break;
	case KVM_REG_PPC_TAR:
		*val = get_reg_val(id, vcpu->arch.tar);
		break;
	case KVM_REG_PPC_EBBHR:
		*val = get_reg_val(id, vcpu->arch.ebbhr);
		break;
	case KVM_REG_PPC_EBBRR:
		*val = get_reg_val(id, vcpu->arch.ebbrr);
		break;
	case KVM_REG_PPC_BESCR:
		*val = get_reg_val(id, vcpu->arch.bescr);
		break;
	case KVM_REG_PPC_IC:
		*val = get_reg_val(id, vcpu->arch.ic);
		break;
	default:
		r = -EINVAL;
		break;
	}

	return r;
}

671 672
/*
 * Write the value in @val to the register identified by @id on @vcpu.
 *
 * The request is first offered to the VM's kvm_ops->set_one_reg() hook.
 * Any result other than -EINVAL is returned as-is.  On -EINVAL the
 * registers handled in this function are tried.
 *
 * For the registers handled here the return value is 0 on success, -ENXIO
 * when the backing facility is missing (no VSX CPU feature, or neither ICP
 * nor XIVE vcpu state), the ICP setter's result for KVM_REG_PPC_ICP_STATE,
 * and -EINVAL when @id is not recognised.
 */
int kvmppc_set_one_reg(struct kvm_vcpu *vcpu, u64 id,
			union kvmppc_one_reg *val)
{
	long int idx;
	int r;

	r = vcpu->kvm->arch.kvm_ops->set_one_reg(vcpu, id, val);
	if (r != -EINVAL)
		return r;

	/* The backend did not recognise @id; try the common registers */
	r = 0;
	switch (id) {
	case KVM_REG_PPC_DAR:
		kvmppc_set_dar(vcpu, set_reg_val(id, *val));
		break;
	case KVM_REG_PPC_DSISR:
		kvmppc_set_dsisr(vcpu, set_reg_val(id, *val));
		break;
	case KVM_REG_PPC_FPR0 ... KVM_REG_PPC_FPR31:
		idx = id - KVM_REG_PPC_FPR0;
		VCPU_FPR(vcpu, idx) = set_reg_val(id, *val);
		break;
	case KVM_REG_PPC_FPSCR:
		vcpu->arch.fp.fpscr = set_reg_val(id, *val);
		break;
#ifdef CONFIG_VSX
	case KVM_REG_PPC_VSR0 ... KVM_REG_PPC_VSR31:
		if (!cpu_has_feature(CPU_FTR_VSX)) {
			r = -ENXIO;
			break;
		}
		idx = id - KVM_REG_PPC_VSR0;
		vcpu->arch.fp.fpr[idx][0] = val->vsxval[0];
		vcpu->arch.fp.fpr[idx][1] = val->vsxval[1];
		break;
#endif /* CONFIG_VSX */
#ifdef CONFIG_KVM_XICS
	case KVM_REG_PPC_ICP_STATE:
		if (!vcpu->arch.icp && !vcpu->arch.xive_vcpu)
			r = -ENXIO;
		else if (xics_on_xive())
			r = kvmppc_xive_set_icp(vcpu, set_reg_val(id, *val));
		else
			r = kvmppc_xics_set_icp(vcpu, set_reg_val(id, *val));
		break;
#endif /* CONFIG_KVM_XICS */
	case KVM_REG_PPC_FSCR:
		vcpu->arch.fscr = set_reg_val(id, *val);
		break;
	case KVM_REG_PPC_TAR:
		vcpu->arch.tar = set_reg_val(id, *val);
		break;
	case KVM_REG_PPC_EBBHR:
		vcpu->arch.ebbhr = set_reg_val(id, *val);
		break;
	case KVM_REG_PPC_EBBRR:
		vcpu->arch.ebbrr = set_reg_val(id, *val);
		break;
	case KVM_REG_PPC_BESCR:
		vcpu->arch.bescr = set_reg_val(id, *val);
		break;
	case KVM_REG_PPC_IC:
		vcpu->arch.ic = set_reg_val(id, *val);
		break;
	default:
		r = -EINVAL;
		break;
	}

	return r;
}

744 745
void kvmppc_core_vcpu_load(struct kvm_vcpu *vcpu, int cpu)
{
746
	vcpu->kvm->arch.kvm_ops->vcpu_load(vcpu, cpu);
747 748 749 750
}

void kvmppc_core_vcpu_put(struct kvm_vcpu *vcpu)
{
751
	vcpu->kvm->arch.kvm_ops->vcpu_put(vcpu);
752 753 754 755
}

/*
 * Set the guest MSR to @msr through the set_msr() hook of the kvm_ops
 * installed for this VM.
 */
void kvmppc_set_msr(struct kvm_vcpu *vcpu, u64 msr)
{
	struct kvm *kvm = vcpu->kvm;

	kvm->arch.kvm_ops->set_msr(vcpu, msr);
}
758
EXPORT_SYMBOL_GPL(kvmppc_set_msr);
759 760 761

int kvmppc_vcpu_run(struct kvm_run *kvm_run, struct kvm_vcpu *vcpu)
{
762
	return vcpu->kvm->arch.kvm_ops->vcpu_run(kvm_run, vcpu);
763 764
}

A
Alexander Graf 已提交
765 766 767 768 769 770
/* No translation is performed here; @tr is left untouched and 0 is returned. */
int kvm_arch_vcpu_ioctl_translate(struct kvm_vcpu *vcpu,
                                  struct kvm_translation *tr)
{
	return 0;
}

771 772 773
int kvm_arch_vcpu_ioctl_set_guest_debug(struct kvm_vcpu *vcpu,
					struct kvm_guest_debug *dbg)
{
774
	vcpu_load(vcpu);
775
	vcpu->guest_debug = dbg->control;
776
	vcpu_put(vcpu);
777
	return 0;
778 779
}

780
/* Queue a decrementer interrupt for @vcpu, then kick the vcpu. */
void kvmppc_decrementer_func(struct kvm_vcpu *vcpu)
{
	/* Make the interrupt pending before the vcpu gets kicked */
	kvmppc_core_queue_dec(vcpu);

	kvm_vcpu_kick(vcpu);
}
785 786 787

struct kvm_vcpu *kvmppc_core_vcpu_create(struct kvm *kvm, unsigned int id)
{
788
	return kvm->arch.kvm_ops->vcpu_create(kvm, id);
789 790 791 792
}

void kvmppc_core_vcpu_free(struct kvm_vcpu *vcpu)
{
793
	vcpu->kvm->arch.kvm_ops->vcpu_free(vcpu);
794 795 796 797
}

int kvmppc_core_check_requests(struct kvm_vcpu *vcpu)
{
798
	return vcpu->kvm->arch.kvm_ops->check_requests(vcpu);
799 800 801 802
}

int kvm_vm_ioctl_get_dirty_log(struct kvm *kvm, struct kvm_dirty_log *log)
{
803
	return kvm->arch.kvm_ops->get_dirty_log(kvm, log);
804 805
}

806
void kvmppc_core_free_memslot(struct kvm *kvm, struct kvm_memory_slot *free,
807 808
			      struct kvm_memory_slot *dont)
{
809
	kvm->arch.kvm_ops->free_memslot(free, dont);
810 811
}

812
int kvmppc_core_create_memslot(struct kvm *kvm, struct kvm_memory_slot *slot,
813 814
			       unsigned long npages)
{
815
	return kvm->arch.kvm_ops->create_memslot(slot, npages);
816 817 818 819
}

void kvmppc_core_flush_memslot(struct kvm *kvm, struct kvm_memory_slot *memslot)
{
820
	kvm->arch.kvm_ops->flush_memslot(kvm, memslot);
821 822 823 824
}

int kvmppc_core_prepare_memory_region(struct kvm *kvm,
				struct kvm_memory_slot *memslot,
825
				const struct kvm_userspace_memory_region *mem)
826
{
827
	return kvm->arch.kvm_ops->prepare_memory_region(kvm, memslot, mem);
828 829 830
}

void kvmppc_core_commit_memory_region(struct kvm *kvm,
831
				const struct kvm_userspace_memory_region *mem,
832
				const struct kvm_memory_slot *old,
833 834
				const struct kvm_memory_slot *new,
				enum kvm_mr_change change)
835
{
836
	kvm->arch.kvm_ops->commit_memory_region(kvm, mem, old, new, change);
837 838 839 840
}

int kvm_unmap_hva_range(struct kvm *kvm, unsigned long start, unsigned long end)
{
841
	return kvm->arch.kvm_ops->unmap_hva_range(kvm, start, end);
842 843
}

A
Andres Lagar-Cavilla 已提交
844
int kvm_age_hva(struct kvm *kvm, unsigned long start, unsigned long end)
845
{
A
Andres Lagar-Cavilla 已提交
846
	return kvm->arch.kvm_ops->age_hva(kvm, start, end);
847 848 849 850
}

int kvm_test_age_hva(struct kvm *kvm, unsigned long hva)
{
851
	return kvm->arch.kvm_ops->test_age_hva(kvm, hva);
852 853
}

854
/*
 * Forward to the set_spte_hva() hook of the kvm_ops installed for @kvm.
 * The hook's outcome is not propagated; this function always returns 0.
 */
int kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte)
{
	(kvm->arch.kvm_ops->set_spte_hva)(kvm, hva, pte);

	return 0;
}

void kvmppc_mmu_destroy(struct kvm_vcpu *vcpu)
{
862
	vcpu->kvm->arch.kvm_ops->mmu_destroy(vcpu);
863 864 865 866 867 868
}

int kvmppc_core_init_vm(struct kvm *kvm)
{

#ifdef CONFIG_PPC64
869
	INIT_LIST_HEAD_RCU(&kvm->arch.spapr_tce_tables);
870 871 872
	INIT_LIST_HEAD(&kvm->arch.rtas_tokens);
#endif

873
	return kvm->arch.kvm_ops->init_vm(kvm);
874 875 876 877
}

void kvmppc_core_destroy_vm(struct kvm *kvm)
{
878
	kvm->arch.kvm_ops->destroy_vm(kvm);
879 880 881 882 883 884 885

#ifdef CONFIG_PPC64
	kvmppc_rtas_tokens_free(kvm);
	WARN_ON(!list_empty(&kvm->arch.spapr_tce_tables));
#endif
}

886 887 888 889 890
int kvmppc_h_logical_ci_load(struct kvm_vcpu *vcpu)
{
	unsigned long size = kvmppc_get_gpr(vcpu, 4);
	unsigned long addr = kvmppc_get_gpr(vcpu, 5);
	u64 buf;
891
	int srcu_idx;
892 893 894 895 896
	int ret;

	if (!is_power_of_2(size) || (size > sizeof(buf)))
		return H_TOO_HARD;

897
	srcu_idx = srcu_read_lock(&vcpu->kvm->srcu);
898
	ret = kvm_io_bus_read(vcpu, KVM_MMIO_BUS, addr, size, &buf);
899
	srcu_read_unlock(&vcpu->kvm->srcu, srcu_idx);
900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929 930 931 932 933
	if (ret != 0)
		return H_TOO_HARD;

	switch (size) {
	case 1:
		kvmppc_set_gpr(vcpu, 4, *(u8 *)&buf);
		break;

	case 2:
		kvmppc_set_gpr(vcpu, 4, be16_to_cpu(*(__be16 *)&buf));
		break;

	case 4:
		kvmppc_set_gpr(vcpu, 4, be32_to_cpu(*(__be32 *)&buf));
		break;

	case 8:
		kvmppc_set_gpr(vcpu, 4, be64_to_cpu(*(__be64 *)&buf));
		break;

	default:
		BUG();
	}

	return H_SUCCESS;
}
EXPORT_SYMBOL_GPL(kvmppc_h_logical_ci_load);

int kvmppc_h_logical_ci_store(struct kvm_vcpu *vcpu)
{
	unsigned long size = kvmppc_get_gpr(vcpu, 4);
	unsigned long addr = kvmppc_get_gpr(vcpu, 5);
	unsigned long val = kvmppc_get_gpr(vcpu, 6);
	u64 buf;
934
	int srcu_idx;
935 936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957
	int ret;

	switch (size) {
	case 1:
		*(u8 *)&buf = val;
		break;

	case 2:
		*(__be16 *)&buf = cpu_to_be16(val);
		break;

	case 4:
		*(__be32 *)&buf = cpu_to_be32(val);
		break;

	case 8:
		*(__be64 *)&buf = cpu_to_be64(val);
		break;

	default:
		return H_TOO_HARD;
	}

958
	srcu_idx = srcu_read_lock(&vcpu->kvm->srcu);
959
	ret = kvm_io_bus_write(vcpu, KVM_MMIO_BUS, addr, size, &buf);
960
	srcu_read_unlock(&vcpu->kvm->srcu, srcu_idx);
961 962 963 964 965 966 967
	if (ret != 0)
		return H_TOO_HARD;

	return H_SUCCESS;
}
EXPORT_SYMBOL_GPL(kvmppc_h_logical_ci_store);

968 969
/*
 * Processor compatibility check for book3s.
 *
 * Always reports success (0): compatibility is checked when the HV or PR
 * module is loaded instead.
 */
int kvmppc_core_check_processor_compat(void)
{
	return 0;
}

978 979 980 981 982
/*
 * Ask the kvm_ops installed for @kvm whether hypercall @hcall is
 * implemented, and return the hook's answer.
 */
int kvmppc_book3s_hcall_implemented(struct kvm *kvm, unsigned long hcall)
{
	return kvm->arch.kvm_ops->hcall_implemented(hcall);
}

983 984 985 986
#ifdef CONFIG_KVM_XICS
/*
 * Set the level of interrupt @irq for @kvm.  The request goes to the XIVE
 * implementation when xics_on_xive() is true and to the XICS implementation
 * otherwise; the chosen implementation's result is returned.
 */
int kvm_set_irq(struct kvm *kvm, int irq_source_id, u32 irq, int level,
		bool line_status)
{
	if (!xics_on_xive())
		return kvmppc_xics_set_irq(kvm, irq_source_id, irq, level,
					   line_status);

	return kvmppc_xive_set_irq(kvm, irq_source_id, irq, level,
				   line_status);
}

/*
 * Deliver the interrupt described by @irq_entry by calling kvm_set_irq()
 * with the entry's gsi, and return its result.
 */
int kvm_arch_set_irq_inatomic(struct kvm_kernel_irq_routing_entry *irq_entry,
			      struct kvm *kvm, int irq_source_id,
			      int level, bool line_status)
{
	return kvm_set_irq(kvm, irq_source_id, irq_entry->gsi,
			   level, line_status);
}
/*
 * Routing-entry "set" callback (installed by kvm_irq_map_gsi()): forwards
 * the entry's gsi to kvm_set_irq() and returns its result.
 */
static int kvmppc_book3s_set_irq(struct kvm_kernel_irq_routing_entry *e,
				 struct kvm *kvm, int irq_source_id, int level,
				 bool line_status)
{
	return kvm_set_irq(kvm, irq_source_id, e->gsi, level, line_status);
}

/*
 * Fill @entries[0] with the single routing entry for @gsi: an irqchip-type
 * entry on irqchip 0 whose pin equals @gsi and whose set callback is
 * kvmppc_book3s_set_irq().  Returns 1, the number of entries written.
 */
int kvm_irq_map_gsi(struct kvm *kvm,
		    struct kvm_kernel_irq_routing_entry *entries, int gsi)
{
	struct kvm_kernel_irq_routing_entry *e = entries;

	e->gsi = gsi;
	e->type = KVM_IRQ_ROUTING_IRQCHIP;
	e->set = kvmppc_book3s_set_irq;
	e->irqchip.irqchip = 0;
	e->irqchip.pin = gsi;

	return 1;
}

/* Identity mapping: returns @pin unchanged; @kvm and @irqchip are not used. */
int kvm_irq_map_chip_pin(struct kvm *kvm, unsigned irqchip, unsigned pin)
{
	return pin;
}

#endif /* CONFIG_KVM_XICS */

1027 1028 1029 1030 1031 1032 1033
/*
 * Module init: bring up the generic KVM core, then (when built with
 * CONFIG_KVM_BOOK3S_32_HANDLER) the PR backend, and finally register the
 * XICS device ops, backed by XIVE when xics_on_xive() is true.
 *
 * Returns 0 on success or the error from kvm_init() or
 * kvmppc_book3s_init_pr().
 */
static int kvmppc_book3s_init(void)
{
	int r;

	r = kvm_init(NULL, sizeof(struct kvm_vcpu), 0, THIS_MODULE);
	if (r)
		return r;
#ifdef CONFIG_KVM_BOOK3S_32_HANDLER
	r = kvmppc_book3s_init_pr();
	if (r) {
		/*
		 * A failing init function means the exit function is never
		 * run, so undo kvm_init() here instead of leaving the KVM
		 * core set up (and going on to register device ops).
		 */
		kvm_exit();
		return r;
	}
#endif

#ifdef CONFIG_KVM_XICS
#ifdef CONFIG_KVM_XIVE
	if (xics_on_xive()) {
		kvmppc_xive_init_module();
		kvm_register_device_ops(&kvm_xive_ops, KVM_DEV_TYPE_XICS);
	} else
#endif
		kvm_register_device_ops(&kvm_xics_ops, KVM_DEV_TYPE_XICS);
#endif
	return r;
}

/*
 * Module exit: shut down the XIVE module when it is in use, then the PR
 * backend (when built with CONFIG_KVM_BOOK3S_32_HANDLER), and finally the
 * generic KVM core.
 */
static void kvmppc_book3s_exit(void)
{
#ifdef CONFIG_KVM_XICS
	if (xics_on_xive()) {
		kvmppc_xive_exit_module();
	}
#endif

#ifdef CONFIG_KVM_BOOK3S_32_HANDLER
	kvmppc_book3s_exit_pr();
#endif

	kvm_exit();
}
1061 1062 1063

/* Register kvmppc_book3s_init/kvmppc_book3s_exit as the module's entry and exit hooks. */
module_init(kvmppc_book3s_init);
module_exit(kvmppc_book3s_exit);
1064 1065

/* On 32bit this is our one and only kernel module */
1066
#ifdef CONFIG_KVM_BOOK3S_32_HANDLER
1067 1068 1069
MODULE_ALIAS_MISCDEV(KVM_MINOR);
MODULE_ALIAS("devname:kvm");
#endif