ioapic.c 10.6 KB
Newer Older
E
Eddie Dong 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 *  Copyright (C) 2001  MandrakeSoft S.A.
 *
 *    MandrakeSoft S.A.
 *    43, rue d'Aboukir
 *    75002 Paris - France
 *    http://www.linux-mandrake.com/
 *    http://www.mandrakesoft.com/
 *
 *  This library is free software; you can redistribute it and/or
 *  modify it under the terms of the GNU Lesser General Public
 *  License as published by the Free Software Foundation; either
 *  version 2 of the License, or (at your option) any later version.
 *
 *  This library is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 *  Lesser General Public License for more details.
 *
 *  You should have received a copy of the GNU Lesser General Public
 *  License along with this library; if not, write to the Free Software
 *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
 *
 *  Yunhong Jiang <yunhong.jiang@intel.com>
 *  Yaozu (Eddie) Dong <eddie.dong@intel.com>
 *  Based on Xen 3.1 code.
 */

29
#include <linux/kvm_host.h>
E
Eddie Dong 已提交
30 31 32 33 34 35
#include <linux/kvm.h>
#include <linux/mm.h>
#include <linux/highmem.h>
#include <linux/smp.h>
#include <linux/hrtimer.h>
#include <linux/io.h>
36
#include <linux/slab.h>
E
Eddie Dong 已提交
37 38 39
#include <asm/processor.h>
#include <asm/page.h>
#include <asm/current.h>
40
#include <trace/events/kvm.h>
41 42 43

#include "ioapic.h"
#include "lapic.h"
M
Marcelo Tosatti 已提交
44
#include "irq.h"
45

46 47 48
/*
 * Debug tracing for the virtual I/O APIC.  Change "#if 0" to "#if 1" to
 * send the messages to printk() at KERN_WARNING level.  When disabled,
 * ioapic_debug() expands to an empty statement that evaluates none of its
 * arguments, so it is safe as the sole body of an if/else branch.
 */
#if 0
#define ioapic_debug(fmt, arg...) printk(KERN_WARNING fmt, ##arg)
#else
#define ioapic_debug(fmt, arg...) do { } while (0)
#endif
51
/* Forward declaration: ioapic_service() calls this before its definition. */
static int ioapic_deliver(struct kvm_ioapic *vioapic, int irq);
E
Eddie Dong 已提交
52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87

/*
 * Read the register currently selected by ioapic->ioregsel.
 *
 * @ioapic: virtual I/O APIC whose state is read.
 * @addr:   unused here; the caller passes the MMIO offset.
 * @length: unused here; the caller passes the access width.
 *
 * Returns the 32-bit register value:
 *  - IOAPIC_REG_VERSION: (IOAPIC_NUM_PINS - 1) in bits 23:16 and
 *    IOAPIC_VERSION_ID in bits 7:0;
 *  - IOAPIC_REG_APIC_ID / IOAPIC_REG_ARB_ID: the low four bits of
 *    ioapic->id placed in bits 27:24;
 *  - anything else: one half of a redirection table entry, the upper half
 *    when ioregsel is odd and the lower half when it is even.
 *
 * ioregsel is written by the guest, so the derived table index must be
 * range-checked for real and not merely with ASSERT().  A selector that
 * does not map to a pin reads back as all ones instead of touching memory
 * beyond redirtbl[].
 */
static unsigned long ioapic_read_indirect(struct kvm_ioapic *ioapic,
					  unsigned long addr,
					  unsigned long length)
{
	unsigned long result = 0;

	switch (ioapic->ioregsel) {
	case IOAPIC_REG_VERSION:
		result = ((((IOAPIC_NUM_PINS - 1) & 0xff) << 16)
			  | (IOAPIC_VERSION_ID & 0xff));
		break;

	case IOAPIC_REG_APIC_ID:
	case IOAPIC_REG_ARB_ID:
		result = ((ioapic->id & 0xf) << 24);
		break;

	default:
		{
			/* Two consecutive selectors address one 64-bit entry. */
			u32 redir_index = (ioapic->ioregsel - 0x10) >> 1;
			u64 redir_content;

			if (redir_index < IOAPIC_NUM_PINS)
				redir_content =
					ioapic->redirtbl[redir_index].bits;
			else
				redir_content = ~0ULL;

			result = (ioapic->ioregsel & 0x1) ?
			    (redir_content >> 32) & 0xffffffff :
			    redir_content & 0xffffffff;
			break;
		}
	}

	return result;
}

88
static int ioapic_service(struct kvm_ioapic *ioapic, unsigned int idx)
E
Eddie Dong 已提交
89
{
S
Sheng Yang 已提交
90
	union kvm_ioapic_redirect_entry *pent;
91
	int injected = -1;
E
Eddie Dong 已提交
92 93 94 95

	pent = &ioapic->redirtbl[idx];

	if (!pent->fields.mask) {
96
		injected = ioapic_deliver(ioapic, idx);
97
		if (injected && pent->fields.trig_mode == IOAPIC_LEVEL_TRIG)
E
Eddie Dong 已提交
98 99
			pent->fields.remote_irr = 1;
	}
100 101

	return injected;
E
Eddie Dong 已提交
102 103
}

104 105 106 107 108 109 110 111 112 113 114 115 116
static void update_handled_vectors(struct kvm_ioapic *ioapic)
{
	DECLARE_BITMAP(handled_vectors, 256);
	int i;

	memset(handled_vectors, 0, sizeof(handled_vectors));
	for (i = 0; i < IOAPIC_NUM_PINS; ++i)
		__set_bit(ioapic->redirtbl[i].fields.vector, handled_vectors);
	memcpy(ioapic->handled_vectors, handled_vectors,
	       sizeof(handled_vectors));
	smp_wmb();
}

E
Eddie Dong 已提交
117 118 119
/*
 * Write @val to the register currently selected by ioapic->ioregsel.
 *
 *  - IOAPIC_REG_VERSION and IOAPIC_REG_ARB_ID: the write is ignored.
 *  - IOAPIC_REG_APIC_ID: bits 27:24 of @val become ioapic->id.
 *  - anything else: the selector is mapped to a redirection table entry;
 *    selectors that map outside the table are dropped.  An odd selector
 *    replaces the upper 32 bits of the entry, an even selector replaces the
 *    lower 32 bits and clears remote_irr.
 *
 * After a redirection entry changes, the handled-vector bitmap is rebuilt,
 * mask notifiers are fired if the mask bit flipped, and a level-triggered
 * pin whose bit is set in ioapic->irr is serviced.
 */
static void ioapic_write_indirect(struct kvm_ioapic *ioapic, u32 val)
{
	unsigned index;
	bool mask_before, mask_after;
	union kvm_ioapic_redirect_entry *e;

	switch (ioapic->ioregsel) {
	case IOAPIC_REG_VERSION:
		/* Writes are ignored. */
		break;

	case IOAPIC_REG_APIC_ID:
		ioapic->id = (val >> 24) & 0xf;
		break;

	case IOAPIC_REG_ARB_ID:
		break;

	default:
		/* Two consecutive selectors address one 64-bit entry. */
		index = (ioapic->ioregsel - 0x10) >> 1;

		ioapic_debug("change redir index %x val %x\n", index, val);
		if (index >= IOAPIC_NUM_PINS)
			return;
		e = &ioapic->redirtbl[index];
		mask_before = e->fields.mask;
		if (ioapic->ioregsel & 1) {
			e->bits &= 0xffffffff;
			e->bits |= (u64) val << 32;
		} else {
			e->bits &= ~0xffffffffULL;
			e->bits |= (u32) val;
			e->fields.remote_irr = 0;
		}
		update_handled_vectors(ioapic);
		mask_after = e->fields.mask;
		if (mask_before != mask_after)
			kvm_fire_mask_notifiers(ioapic->kvm, index, mask_after);
		if (e->fields.trig_mode == IOAPIC_LEVEL_TRIG
		    && ioapic->irr & (1 << index))
			ioapic_service(ioapic, index);
		break;
	}
}

162 163
static int ioapic_deliver(struct kvm_ioapic *ioapic, int irq)
{
164 165
	union kvm_ioapic_redirect_entry *entry = &ioapic->redirtbl[irq];
	struct kvm_lapic_irq irqe;
166 167 168

	ioapic_debug("dest=%x dest_mode=%x delivery_mode=%x "
		     "vector=%x trig_mode=%x\n",
169 170 171 172 173 174 175 176 177 178 179
		     entry->fields.dest, entry->fields.dest_mode,
		     entry->fields.delivery_mode, entry->fields.vector,
		     entry->fields.trig_mode);

	irqe.dest_id = entry->fields.dest_id;
	irqe.vector = entry->fields.vector;
	irqe.dest_mode = entry->fields.dest_mode;
	irqe.trig_mode = entry->fields.trig_mode;
	irqe.delivery_mode = entry->fields.delivery_mode << 8;
	irqe.level = 1;
	irqe.shorthand = 0;
180 181 182 183

#ifdef CONFIG_X86
	/* Always delivery PIT interrupt to vcpu 0 */
	if (irq == 0) {
184
		irqe.dest_mode = 0; /* Physical mode. */
185 186 187
		/* need to read apic_id from apic regiest since
		 * it can be rewritten */
		irqe.dest_id = ioapic->kvm->bsp_vcpu->vcpu_id;
188 189
	}
#endif
190
	return kvm_irq_delivery_to_apic(ioapic->kvm, NULL, &irqe);
191 192
}

193
int kvm_ioapic_set_irq(struct kvm_ioapic *ioapic, int irq, int level)
E
Eddie Dong 已提交
194
{
195
	u32 old_irr;
E
Eddie Dong 已提交
196
	u32 mask = 1 << irq;
S
Sheng Yang 已提交
197
	union kvm_ioapic_redirect_entry entry;
198
	int ret = 1;
E
Eddie Dong 已提交
199

200
	spin_lock(&ioapic->lock);
201
	old_irr = ioapic->irr;
E
Eddie Dong 已提交
202 203 204 205 206 207
	if (irq >= 0 && irq < IOAPIC_NUM_PINS) {
		entry = ioapic->redirtbl[irq];
		level ^= entry.fields.polarity;
		if (!level)
			ioapic->irr &= ~mask;
		else {
208
			int edge = (entry.fields.trig_mode == IOAPIC_EDGE_TRIG);
E
Eddie Dong 已提交
209
			ioapic->irr |= mask;
210 211
			if ((edge && old_irr != ioapic->irr) ||
			    (!edge && !entry.fields.remote_irr))
212
				ret = ioapic_service(ioapic, irq);
213 214
			else
				ret = 0; /* report coalesced interrupt */
E
Eddie Dong 已提交
215
		}
216
		trace_kvm_ioapic_set_irq(entry.bits, irq, ret == 0);
E
Eddie Dong 已提交
217
	}
218
	spin_unlock(&ioapic->lock);
G
Gleb Natapov 已提交
219

220
	return ret;
E
Eddie Dong 已提交
221 222
}

G
Gleb Natapov 已提交
223 224
static void __kvm_ioapic_update_eoi(struct kvm_ioapic *ioapic, int vector,
				     int trigger_mode)
E
Eddie Dong 已提交
225
{
G
Gleb Natapov 已提交
226 227 228 229
	int i;

	for (i = 0; i < IOAPIC_NUM_PINS; i++) {
		union kvm_ioapic_redirect_entry *ent = &ioapic->redirtbl[i];
E
Eddie Dong 已提交
230

G
Gleb Natapov 已提交
231 232
		if (ent->fields.vector != vector)
			continue;
E
Eddie Dong 已提交
233

G
Gleb Natapov 已提交
234 235 236 237 238 239 240 241
		/*
		 * We are dropping lock while calling ack notifiers because ack
		 * notifier callbacks for assigned devices call into IOAPIC
		 * recursively. Since remote_irr is cleared only after call
		 * to notifiers if the same vector will be delivered while lock
		 * is dropped it will be put into irr and will be delivered
		 * after ack notifier returns.
		 */
242
		spin_unlock(&ioapic->lock);
G
Gleb Natapov 已提交
243
		kvm_notify_acked_irq(ioapic->kvm, KVM_IRQCHIP_IOAPIC, i);
244
		spin_lock(&ioapic->lock);
G
Gleb Natapov 已提交
245 246 247

		if (trigger_mode != IOAPIC_LEVEL_TRIG)
			continue;
M
Marcelo Tosatti 已提交
248 249 250

		ASSERT(ent->fields.trig_mode == IOAPIC_LEVEL_TRIG);
		ent->fields.remote_irr = 0;
G
Gleb Natapov 已提交
251 252
		if (!ent->fields.mask && (ioapic->irr & (1 << i)))
			ioapic_service(ioapic, i);
M
Marcelo Tosatti 已提交
253
	}
E
Eddie Dong 已提交
254 255
}

M
Marcelo Tosatti 已提交
256
void kvm_ioapic_update_eoi(struct kvm *kvm, int vector, int trigger_mode)
257 258 259
{
	struct kvm_ioapic *ioapic = kvm->arch.vioapic;

260 261 262
	smp_rmb();
	if (!test_bit(vector, ioapic->handled_vectors))
		return;
263
	spin_lock(&ioapic->lock);
G
Gleb Natapov 已提交
264
	__kvm_ioapic_update_eoi(ioapic, vector, trigger_mode);
265
	spin_unlock(&ioapic->lock);
266 267
}

G
Gregory Haskins 已提交
268 269 270 271 272
/* Map an embedded kvm_io_device back to the kvm_ioapic that contains it. */
static inline struct kvm_ioapic *to_ioapic(struct kvm_io_device *dev)
{
	struct kvm_ioapic *owner = container_of(dev, struct kvm_ioapic, dev);

	return owner;
}

273
/*
 * Return non-zero when @addr lies inside the I/O APIC MMIO window
 * [base_address, base_address + IOAPIC_MEM_LENGTH).
 */
static inline int ioapic_in_range(struct kvm_ioapic *ioapic, gpa_t addr)
{
	return addr >= ioapic->base_address &&
	       addr < ioapic->base_address + IOAPIC_MEM_LENGTH;
}

279 280
/*
 * MMIO read handler for the I/O APIC window.
 *
 * @this: io device embedded in the kvm_ioapic.
 * @addr: guest physical address being read.
 * @len:  access width in bytes; 1, 2, 4 and 8 are handled.
 * @val:  destination buffer of at least @len bytes.
 *
 * Returns -EOPNOTSUPP when @addr is outside the window, 0 otherwise.
 * IOAPIC_REG_SELECT reads back ioregsel, IOAPIC_REG_WINDOW reads the
 * selected register and every other offset reads as 0.  For an unsupported
 * @len a warning is logged and @val is left untouched.
 */
static int ioapic_mmio_read(struct kvm_io_device *this, gpa_t addr, int len,
			    void *val)
{
	struct kvm_ioapic *ioapic = to_ioapic(this);
	u32 result;

	if (!ioapic_in_range(ioapic, addr))
		return -EOPNOTSUPP;

	ioapic_debug("addr %lx\n", (unsigned long)addr);
	ASSERT(!(addr & 0xf));	/* check alignment */

	/* Keep only the offset within the window. */
	addr &= 0xff;
	spin_lock(&ioapic->lock);
	switch (addr) {
	case IOAPIC_REG_SELECT:
		result = ioapic->ioregsel;
		break;

	case IOAPIC_REG_WINDOW:
		result = ioapic_read_indirect(ioapic, addr, len);
		break;

	default:
		result = 0;
		break;
	}
	spin_unlock(&ioapic->lock);

	switch (len) {
	case 8:
		*(u64 *) val = result;
		break;
	case 1:
	case 2:
	case 4:
		memcpy(val, (char *)&result, len);
		break;
	default:
		printk(KERN_WARNING "ioapic: wrong length %d\n", len);
	}
	return 0;
}

322 323
/*
 * MMIO write handler for the I/O APIC window.
 *
 * @this: io device embedded in the kvm_ioapic.
 * @addr: guest physical address being written.
 * @len:  access width in bytes; only 4 and 8 are accepted.
 * @val:  source buffer; its first 32 bits are used.
 *
 * Returns -EOPNOTSUPP when @addr is outside the window, 0 otherwise.  A
 * write of any other width is logged and dropped.  IOAPIC_REG_SELECT
 * updates ioregsel and IOAPIC_REG_WINDOW writes the selected register;
 * with CONFIG_IA64, IOAPIC_REG_EOI is processed as a level-triggered EOI.
 * Other offsets are ignored.
 */
static int ioapic_mmio_write(struct kvm_io_device *this, gpa_t addr, int len,
			     const void *val)
{
	struct kvm_ioapic *ioapic = to_ioapic(this);
	u32 data;

	if (!ioapic_in_range(ioapic, addr))
		return -EOPNOTSUPP;

	ioapic_debug("ioapic_mmio_write addr=%p len=%d val=%p\n",
		     (void *)addr, len, val);
	ASSERT(!(addr & 0xf));	/* check alignment */

	if (len == 4 || len == 8)
		data = *(u32 *) val;
	else {
		printk(KERN_WARNING "ioapic: Unsupported size %d\n", len);
		return 0;
	}

	/* Keep only the offset within the window. */
	addr &= 0xff;
	spin_lock(&ioapic->lock);
	switch (addr) {
	case IOAPIC_REG_SELECT:
		ioapic->ioregsel = data;
		break;

	case IOAPIC_REG_WINDOW:
		ioapic_write_indirect(ioapic, data);
		break;
#ifdef	CONFIG_IA64
	case IOAPIC_REG_EOI:
		__kvm_ioapic_update_eoi(ioapic, data, IOAPIC_LEVEL_TRIG);
		break;
#endif

	default:
		break;
	}
	spin_unlock(&ioapic->lock);
	return 0;
}

364 365 366 367 368 369 370 371 372 373
/*
 * Put the virtual I/O APIC into its reset state: every pin is masked, the
 * MMIO base returns to IOAPIC_DEFAULT_BASE_ADDRESS, and ioregsel, irr and
 * id are zeroed.  The handled-vector bitmap is then rebuilt from the
 * redirection table.  No lock is taken here.
 */
void kvm_ioapic_reset(struct kvm_ioapic *ioapic)
{
	int i;

	for (i = 0; i < IOAPIC_NUM_PINS; i++)
		ioapic->redirtbl[i].fields.mask = 1;
	ioapic->base_address = IOAPIC_DEFAULT_BASE_ADDRESS;
	ioapic->ioregsel = 0;
	ioapic->irr = 0;
	ioapic->id = 0;
	update_handled_vectors(ioapic);
}

G
Gregory Haskins 已提交
377 378 379 380 381
/* MMIO callbacks installed on the I/O APIC device by kvm_ioapic_init(). */
static const struct kvm_io_device_ops ioapic_mmio_ops = {
	.write = ioapic_mmio_write,
	.read  = ioapic_mmio_read,
};

E
Eddie Dong 已提交
382 383 384
int kvm_ioapic_init(struct kvm *kvm)
{
	struct kvm_ioapic *ioapic;
385
	int ret;
E
Eddie Dong 已提交
386 387 388 389

	ioapic = kzalloc(sizeof(struct kvm_ioapic), GFP_KERNEL);
	if (!ioapic)
		return -ENOMEM;
390
	spin_lock_init(&ioapic->lock);
391
	kvm->arch.vioapic = ioapic;
392
	kvm_ioapic_reset(ioapic);
G
Gregory Haskins 已提交
393
	kvm_iodevice_init(&ioapic->dev, &ioapic_mmio_ops);
E
Eddie Dong 已提交
394
	ioapic->kvm = kvm;
395
	mutex_lock(&kvm->slots_lock);
M
Marcelo Tosatti 已提交
396
	ret = kvm_io_bus_register_dev(kvm, KVM_MMIO_BUS, &ioapic->dev);
397
	mutex_unlock(&kvm->slots_lock);
398 399
	if (ret < 0) {
		kvm->arch.vioapic = NULL;
400
		kfree(ioapic);
401
	}
402 403

	return ret;
E
Eddie Dong 已提交
404
}
405

406 407 408 409 410 411 412 413 414 415 416
/*
 * Tear down the virtual I/O APIC of @kvm, if there is one: unregister its
 * MMIO device from KVM_MMIO_BUS, clear kvm->arch.vioapic and free it.
 */
void kvm_ioapic_destroy(struct kvm *kvm)
{
	struct kvm_ioapic *victim = kvm->arch.vioapic;

	if (!victim)
		return;

	kvm_io_bus_unregister_dev(kvm, KVM_MMIO_BUS, &victim->dev);
	kvm->arch.vioapic = NULL;
	kfree(victim);
}

G
Gleb Natapov 已提交
417 418 419 420 421 422
int kvm_get_ioapic(struct kvm *kvm, struct kvm_ioapic_state *state)
{
	struct kvm_ioapic *ioapic = ioapic_irqchip(kvm);
	if (!ioapic)
		return -EINVAL;

423
	spin_lock(&ioapic->lock);
G
Gleb Natapov 已提交
424
	memcpy(state, ioapic, sizeof(struct kvm_ioapic_state));
425
	spin_unlock(&ioapic->lock);
G
Gleb Natapov 已提交
426 427 428 429 430 431 432 433 434
	return 0;
}

int kvm_set_ioapic(struct kvm *kvm, struct kvm_ioapic_state *state)
{
	struct kvm_ioapic *ioapic = ioapic_irqchip(kvm);
	if (!ioapic)
		return -EINVAL;

435
	spin_lock(&ioapic->lock);
G
Gleb Natapov 已提交
436
	memcpy(ioapic, state, sizeof(struct kvm_ioapic_state));
437
	update_handled_vectors(ioapic);
438
	spin_unlock(&ioapic->lock);
G
Gleb Natapov 已提交
439 440
	return 0;
}