ioapic.c 10.6 KB
Newer Older
E
Eddie Dong 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
/*
 *  Copyright (C) 2001  MandrakeSoft S.A.
 *
 *    MandrakeSoft S.A.
 *    43, rue d'Aboukir
 *    75002 Paris - France
 *    http://www.linux-mandrake.com/
 *    http://www.mandrakesoft.com/
 *
 *  This library is free software; you can redistribute it and/or
 *  modify it under the terms of the GNU Lesser General Public
 *  License as published by the Free Software Foundation; either
 *  version 2 of the License, or (at your option) any later version.
 *
 *  This library is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 *  Lesser General Public License for more details.
 *
 *  You should have received a copy of the GNU Lesser General Public
 *  License along with this library; if not, write to the Free Software
 *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
 *
 *  Yunhong Jiang <yunhong.jiang@intel.com>
 *  Yaozu (Eddie) Dong <eddie.dong@intel.com>
 *  Based on Xen 3.1 code.
 */

29
#include <linux/kvm_host.h>
E
Eddie Dong 已提交
30 31 32 33 34 35
#include <linux/kvm.h>
#include <linux/mm.h>
#include <linux/highmem.h>
#include <linux/smp.h>
#include <linux/hrtimer.h>
#include <linux/io.h>
36
#include <linux/slab.h>
E
Eddie Dong 已提交
37 38 39
#include <asm/processor.h>
#include <asm/page.h>
#include <asm/current.h>
40
#include <trace/events/kvm.h>
41 42 43

#include "ioapic.h"
#include "lapic.h"
M
Marcelo Tosatti 已提交
44
#include "irq.h"
45

46 47 48
/*
 * Debug logging for the IOAPIC emulation.  Change "#if 0" to "#if 1" to
 * route ioapic_debug() to printk(); by default the macro expands to nothing,
 * so its arguments are never evaluated.
 */
#if 0
#define ioapic_debug(fmt, arg...) printk(KERN_WARNING fmt, ##arg)
#else
#define ioapic_debug(fmt, arg...)
#endif
51
static int ioapic_deliver(struct kvm_ioapic *vioapic, int irq);
E
Eddie Dong 已提交
52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87

/*
 * Read the register currently selected by ioapic->ioregsel.
 *
 * @ioapic: IOAPIC state to read from.
 * @addr:   not used by this function.
 * @length: not used by this function.
 *
 * Returns the 32-bit register value.  For the version register this packs
 * (IOAPIC_NUM_PINS - 1) into bits 16-23 and IOAPIC_VERSION_ID into bits 0-7;
 * for the ID and arbitration registers it is the 4-bit id in bits 24-27.
 * Any other selector addresses the redirection table: an even selector
 * yields the low 32 bits of the entry, an odd one the high 32 bits.  A
 * selector that does not map onto a table entry reads as all ones.
 */
static unsigned long ioapic_read_indirect(struct kvm_ioapic *ioapic,
					  unsigned long addr,
					  unsigned long length)
{
	unsigned long result = 0;

	switch (ioapic->ioregsel) {
	case IOAPIC_REG_VERSION:
		result = ((((IOAPIC_NUM_PINS - 1) & 0xff) << 16)
			  | (IOAPIC_VERSION_ID & 0xff));
		break;

	case IOAPIC_REG_APIC_ID:
	case IOAPIC_REG_ARB_ID:
		result = ((ioapic->id & 0xf) << 24);
		break;

	default:
		{
			u32 redir_index = (ioapic->ioregsel - 0x10) >> 1;
			u64 redir_content;

			/*
			 * ioregsel is stored verbatim by ioapic_mmio_write(),
			 * so the index must be range-checked here instead of
			 * merely asserted; otherwise an arbitrary selector
			 * would read beyond redirtbl[].
			 */
			if (redir_index < IOAPIC_NUM_PINS)
				redir_content =
					ioapic->redirtbl[redir_index].bits;
			else
				redir_content = ~0ULL;

			result = (ioapic->ioregsel & 0x1) ?
			    (redir_content >> 32) & 0xffffffff :
			    redir_content & 0xffffffff;
			break;
		}
	}

	return result;
}

88
static int ioapic_service(struct kvm_ioapic *ioapic, unsigned int idx)
E
Eddie Dong 已提交
89
{
S
Sheng Yang 已提交
90
	union kvm_ioapic_redirect_entry *pent;
91
	int injected = -1;
E
Eddie Dong 已提交
92 93 94 95

	pent = &ioapic->redirtbl[idx];

	if (!pent->fields.mask) {
96
		injected = ioapic_deliver(ioapic, idx);
97
		if (injected && pent->fields.trig_mode == IOAPIC_LEVEL_TRIG)
E
Eddie Dong 已提交
98 99
			pent->fields.remote_irr = 1;
	}
100 101

	return injected;
E
Eddie Dong 已提交
102 103
}

104 105 106 107 108 109 110 111 112 113 114 115 116
static void update_handled_vectors(struct kvm_ioapic *ioapic)
{
	DECLARE_BITMAP(handled_vectors, 256);
	int i;

	memset(handled_vectors, 0, sizeof(handled_vectors));
	for (i = 0; i < IOAPIC_NUM_PINS; ++i)
		__set_bit(ioapic->redirtbl[i].fields.vector, handled_vectors);
	memcpy(ioapic->handled_vectors, handled_vectors,
	       sizeof(handled_vectors));
	smp_wmb();
}

E
Eddie Dong 已提交
117 118 119
/*
 * Write @val to the register currently selected by ioapic->ioregsel.
 *
 * @ioapic: IOAPIC state to modify.
 * @val:    32-bit value written through the window register.
 *
 * Writes to the version and arbitration registers are ignored; a write to
 * the ID register stores bits 24-27 of @val.  Any other selector addresses
 * one 32-bit half of a redirection-table entry (odd selector: high half,
 * even selector: low half).  Selectors that do not map onto a table entry
 * are dropped.
 */
static void ioapic_write_indirect(struct kvm_ioapic *ioapic, u32 val)
{
	unsigned index;
	bool mask_before, mask_after;
	union kvm_ioapic_redirect_entry *e;

	switch (ioapic->ioregsel) {
	case IOAPIC_REG_VERSION:
		/* Writes are ignored. */
		break;

	case IOAPIC_REG_APIC_ID:
		ioapic->id = (val >> 24) & 0xf;
		break;

	case IOAPIC_REG_ARB_ID:
		break;

	default:
		index = (ioapic->ioregsel - 0x10) >> 1;

		ioapic_debug("change redir index %x val %x\n", index, val);
		if (index >= IOAPIC_NUM_PINS)
			return;
		e = &ioapic->redirtbl[index];
		mask_before = e->fields.mask;
		if (ioapic->ioregsel & 1) {
			/* High half: keep the low 32 bits. */
			e->bits &= 0xffffffff;
			e->bits |= (u64) val << 32;
		} else {
			/* Low half: keep the high 32 bits, clear remote_irr. */
			e->bits &= ~0xffffffffULL;
			e->bits |= (u32) val;
			e->fields.remote_irr = 0;
		}
		/* The entry's vector may have changed. */
		update_handled_vectors(ioapic);
		mask_after = e->fields.mask;
		if (mask_before != mask_after)
			kvm_fire_mask_notifiers(ioapic->kvm, index, mask_after);
		/* Re-service a level-triggered pin whose irr bit is still set. */
		if (e->fields.trig_mode == IOAPIC_LEVEL_TRIG
		    && ioapic->irr & (1 << index))
			ioapic_service(ioapic, index);
		break;
	}
}

162 163
static int ioapic_deliver(struct kvm_ioapic *ioapic, int irq)
{
164 165
	union kvm_ioapic_redirect_entry *entry = &ioapic->redirtbl[irq];
	struct kvm_lapic_irq irqe;
166 167 168

	ioapic_debug("dest=%x dest_mode=%x delivery_mode=%x "
		     "vector=%x trig_mode=%x\n",
169 170 171 172 173 174 175 176 177 178 179
		     entry->fields.dest, entry->fields.dest_mode,
		     entry->fields.delivery_mode, entry->fields.vector,
		     entry->fields.trig_mode);

	irqe.dest_id = entry->fields.dest_id;
	irqe.vector = entry->fields.vector;
	irqe.dest_mode = entry->fields.dest_mode;
	irqe.trig_mode = entry->fields.trig_mode;
	irqe.delivery_mode = entry->fields.delivery_mode << 8;
	irqe.level = 1;
	irqe.shorthand = 0;
180 181 182 183

#ifdef CONFIG_X86
	/* Always delivery PIT interrupt to vcpu 0 */
	if (irq == 0) {
184
		irqe.dest_mode = 0; /* Physical mode. */
185 186 187
		/* need to read apic_id from apic regiest since
		 * it can be rewritten */
		irqe.dest_id = ioapic->kvm->bsp_vcpu->vcpu_id;
188 189
	}
#endif
190
	return kvm_irq_delivery_to_apic(ioapic->kvm, NULL, &irqe);
191 192
}

193
int kvm_ioapic_set_irq(struct kvm_ioapic *ioapic, int irq, int level)
E
Eddie Dong 已提交
194 195 196
{
	u32 old_irr = ioapic->irr;
	u32 mask = 1 << irq;
S
Sheng Yang 已提交
197
	union kvm_ioapic_redirect_entry entry;
198
	int ret = 1;
E
Eddie Dong 已提交
199

G
Gleb Natapov 已提交
200
	mutex_lock(&ioapic->lock);
E
Eddie Dong 已提交
201 202 203 204 205 206
	if (irq >= 0 && irq < IOAPIC_NUM_PINS) {
		entry = ioapic->redirtbl[irq];
		level ^= entry.fields.polarity;
		if (!level)
			ioapic->irr &= ~mask;
		else {
207
			int edge = (entry.fields.trig_mode == IOAPIC_EDGE_TRIG);
E
Eddie Dong 已提交
208
			ioapic->irr |= mask;
209 210
			if ((edge && old_irr != ioapic->irr) ||
			    (!edge && !entry.fields.remote_irr))
211
				ret = ioapic_service(ioapic, irq);
212 213
			else
				ret = 0; /* report coalesced interrupt */
E
Eddie Dong 已提交
214
		}
215
		trace_kvm_ioapic_set_irq(entry.bits, irq, ret == 0);
E
Eddie Dong 已提交
216
	}
G
Gleb Natapov 已提交
217 218
	mutex_unlock(&ioapic->lock);

219
	return ret;
E
Eddie Dong 已提交
220 221
}

G
Gleb Natapov 已提交
222 223
static void __kvm_ioapic_update_eoi(struct kvm_ioapic *ioapic, int vector,
				     int trigger_mode)
E
Eddie Dong 已提交
224
{
G
Gleb Natapov 已提交
225 226 227 228
	int i;

	for (i = 0; i < IOAPIC_NUM_PINS; i++) {
		union kvm_ioapic_redirect_entry *ent = &ioapic->redirtbl[i];
E
Eddie Dong 已提交
229

G
Gleb Natapov 已提交
230 231
		if (ent->fields.vector != vector)
			continue;
E
Eddie Dong 已提交
232

G
Gleb Natapov 已提交
233 234 235 236 237 238 239 240 241 242 243 244 245 246
		/*
		 * We are dropping lock while calling ack notifiers because ack
		 * notifier callbacks for assigned devices call into IOAPIC
		 * recursively. Since remote_irr is cleared only after call
		 * to notifiers if the same vector will be delivered while lock
		 * is dropped it will be put into irr and will be delivered
		 * after ack notifier returns.
		 */
		mutex_unlock(&ioapic->lock);
		kvm_notify_acked_irq(ioapic->kvm, KVM_IRQCHIP_IOAPIC, i);
		mutex_lock(&ioapic->lock);

		if (trigger_mode != IOAPIC_LEVEL_TRIG)
			continue;
M
Marcelo Tosatti 已提交
247 248 249

		ASSERT(ent->fields.trig_mode == IOAPIC_LEVEL_TRIG);
		ent->fields.remote_irr = 0;
G
Gleb Natapov 已提交
250 251
		if (!ent->fields.mask && (ioapic->irr & (1 << i)))
			ioapic_service(ioapic, i);
M
Marcelo Tosatti 已提交
252
	}
E
Eddie Dong 已提交
253 254
}

M
Marcelo Tosatti 已提交
255
void kvm_ioapic_update_eoi(struct kvm *kvm, int vector, int trigger_mode)
256 257 258
{
	struct kvm_ioapic *ioapic = kvm->arch.vioapic;

259 260 261
	smp_rmb();
	if (!test_bit(vector, ioapic->handled_vectors))
		return;
G
Gleb Natapov 已提交
262 263 264
	mutex_lock(&ioapic->lock);
	__kvm_ioapic_update_eoi(ioapic, vector, trigger_mode);
	mutex_unlock(&ioapic->lock);
265 266
}

G
Gregory Haskins 已提交
267 268 269 270 271
/* Map an embedded kvm_io_device back to the kvm_ioapic that contains it. */
static inline struct kvm_ioapic *to_ioapic(struct kvm_io_device *dev)
{
	struct kvm_ioapic *owner = container_of(dev, struct kvm_ioapic, dev);

	return owner;
}

272
/*
 * Return non-zero if @addr lies inside the IOAPIC MMIO window
 * [base_address, base_address + IOAPIC_MEM_LENGTH), zero otherwise.
 */
static inline int ioapic_in_range(struct kvm_ioapic *ioapic, gpa_t addr)
{
	return ((addr >= ioapic->base_address &&
		 (addr < ioapic->base_address + IOAPIC_MEM_LENGTH)));
}

278 279
/*
 * MMIO read handler for the IOAPIC device.
 *
 * @this: I/O device embedded in the kvm_ioapic.
 * @addr: address being read.
 * @len:  access size in bytes.
 * @val:  buffer that receives the value read.
 *
 * Returns -EOPNOTSUPP when @addr is outside the IOAPIC window and 0
 * otherwise.  Only the select and window registers return data; every other
 * offset reads as 0.  For an unsupported @len a warning is logged and @val
 * is left unmodified.
 */
static int ioapic_mmio_read(struct kvm_io_device *this, gpa_t addr, int len,
			    void *val)
{
	struct kvm_ioapic *ioapic = to_ioapic(this);
	u32 result;

	if (!ioapic_in_range(ioapic, addr))
		return -EOPNOTSUPP;

	ioapic_debug("addr %lx\n", (unsigned long)addr);
	ASSERT(!(addr & 0xf));	/* check alignment */

	/* Keep only the offset within the register window. */
	addr &= 0xff;
	mutex_lock(&ioapic->lock);
	switch (addr) {
	case IOAPIC_REG_SELECT:
		result = ioapic->ioregsel;
		break;

	case IOAPIC_REG_WINDOW:
		result = ioapic_read_indirect(ioapic, addr, len);
		break;

	default:
		result = 0;
		break;
	}
	mutex_unlock(&ioapic->lock);

	switch (len) {
	case 8:
		/* The 32-bit result is zero-extended to 64 bits. */
		*(u64 *) val = result;
		break;
	case 1:
	case 2:
	case 4:
		memcpy(val, (char *)&result, len);
		break;
	default:
		printk(KERN_WARNING "ioapic: wrong length %d\n", len);
	}
	return 0;
}

321 322
/*
 * MMIO write handler for the IOAPIC device.
 *
 * @this: I/O device embedded in the kvm_ioapic.
 * @addr: address being written.
 * @len:  access size in bytes; only 4 and 8 are accepted.
 * @val:  buffer holding the data to write; only its first 32 bits are used.
 *
 * Returns -EOPNOTSUPP when @addr is outside the IOAPIC window and 0
 * otherwise.  A write with an unsupported @len is logged and dropped, still
 * returning 0.
 */
static int ioapic_mmio_write(struct kvm_io_device *this, gpa_t addr, int len,
			     const void *val)
{
	struct kvm_ioapic *ioapic = to_ioapic(this);
	u32 data;

	if (!ioapic_in_range(ioapic, addr))
		return -EOPNOTSUPP;

	ioapic_debug("ioapic_mmio_write addr=%p len=%d val=%p\n",
		     (void*)addr, len, val);
	ASSERT(!(addr & 0xf));	/* check alignment */

	if (len == 4 || len == 8)
		data = *(const u32 *) val;
	else {
		printk(KERN_WARNING "ioapic: Unsupported size %d\n", len);
		return 0;
	}

	/* Keep only the offset within the register window. */
	addr &= 0xff;
	mutex_lock(&ioapic->lock);
	switch (addr) {
	case IOAPIC_REG_SELECT:
		ioapic->ioregsel = data;
		break;

	case IOAPIC_REG_WINDOW:
		ioapic_write_indirect(ioapic, data);
		break;
#ifdef	CONFIG_IA64
	case IOAPIC_REG_EOI:
		__kvm_ioapic_update_eoi(ioapic, data, IOAPIC_LEVEL_TRIG);
		break;
#endif

	default:
		break;
	}
	mutex_unlock(&ioapic->lock);
	return 0;
}

363 364 365 366 367 368 369 370 371 372
/*
 * Put the IOAPIC into its reset state: every redirection entry masked,
 * base address set to IOAPIC_DEFAULT_BASE_ADDRESS, and ioregsel, irr and id
 * cleared.  The handled-vector bitmap is rebuilt afterwards.
 */
void kvm_ioapic_reset(struct kvm_ioapic *ioapic)
{
	int i;

	for (i = 0; i < IOAPIC_NUM_PINS; i++)
		ioapic->redirtbl[i].fields.mask = 1;
	ioapic->base_address = IOAPIC_DEFAULT_BASE_ADDRESS;
	ioapic->ioregsel = 0;
	ioapic->irr = 0;
	ioapic->id = 0;
	update_handled_vectors(ioapic);
}

G
Gregory Haskins 已提交
376 377 378 379 380
/*
 * I/O device callbacks for the IOAPIC; passed to kvm_iodevice_init() in
 * kvm_ioapic_init().
 */
static const struct kvm_io_device_ops ioapic_mmio_ops = {
	.read     = ioapic_mmio_read,
	.write    = ioapic_mmio_write,
};

E
Eddie Dong 已提交
381 382 383
int kvm_ioapic_init(struct kvm *kvm)
{
	struct kvm_ioapic *ioapic;
384
	int ret;
E
Eddie Dong 已提交
385 386 387 388

	ioapic = kzalloc(sizeof(struct kvm_ioapic), GFP_KERNEL);
	if (!ioapic)
		return -ENOMEM;
G
Gleb Natapov 已提交
389
	mutex_init(&ioapic->lock);
390
	kvm->arch.vioapic = ioapic;
391
	kvm_ioapic_reset(ioapic);
G
Gregory Haskins 已提交
392
	kvm_iodevice_init(&ioapic->dev, &ioapic_mmio_ops);
E
Eddie Dong 已提交
393
	ioapic->kvm = kvm;
394
	mutex_lock(&kvm->slots_lock);
M
Marcelo Tosatti 已提交
395
	ret = kvm_io_bus_register_dev(kvm, KVM_MMIO_BUS, &ioapic->dev);
396
	mutex_unlock(&kvm->slots_lock);
397 398
	if (ret < 0) {
		kvm->arch.vioapic = NULL;
399
		kfree(ioapic);
400
	}
401 402

	return ret;
E
Eddie Dong 已提交
403
}
404

405 406 407 408 409 410 411 412 413 414 415
/*
 * Tear down the VM's IOAPIC, if one exists: unregister it from the MMIO
 * bus, clear kvm->arch.vioapic and free the structure.
 */
void kvm_ioapic_destroy(struct kvm *kvm)
{
	struct kvm_ioapic *vioapic = kvm->arch.vioapic;

	if (!vioapic)
		return;

	kvm_io_bus_unregister_dev(kvm, KVM_MMIO_BUS, &vioapic->dev);
	kvm->arch.vioapic = NULL;
	kfree(vioapic);
}

G
Gleb Natapov 已提交
416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435
int kvm_get_ioapic(struct kvm *kvm, struct kvm_ioapic_state *state)
{
	struct kvm_ioapic *ioapic = ioapic_irqchip(kvm);
	if (!ioapic)
		return -EINVAL;

	mutex_lock(&ioapic->lock);
	memcpy(state, ioapic, sizeof(struct kvm_ioapic_state));
	mutex_unlock(&ioapic->lock);
	return 0;
}

/*
 * Overwrite the leading sizeof(struct kvm_ioapic_state) bytes of the VM's
 * IOAPIC with @state and rebuild the handled-vector bitmap, all while
 * holding the IOAPIC lock.
 *
 * Returns -EINVAL if ioapic_irqchip() yields no IOAPIC, 0 on success.
 */
int kvm_set_ioapic(struct kvm *kvm, struct kvm_ioapic_state *state)
{
	struct kvm_ioapic *ioapic = ioapic_irqchip(kvm);
	if (!ioapic)
		return -EINVAL;

	mutex_lock(&ioapic->lock);
	memcpy(ioapic, state, sizeof(struct kvm_ioapic_state));
	/* The restored redirection table may use different vectors. */
	update_handled_vectors(ioapic);
	mutex_unlock(&ioapic->lock);
	return 0;
}