ioapic.c 11.3 KB
Newer Older
E
Eddie Dong 已提交
1 2
/*
 *  Copyright (C) 2001  MandrakeSoft S.A.
 *  Copyright 2010 Red Hat, Inc. and/or its affiliates.
 *
 *    MandrakeSoft S.A.
 *    43, rue d'Aboukir
 *    75002 Paris - France
 *    http://www.linux-mandrake.com/
 *    http://www.mandrakesoft.com/
 *
 *  This library is free software; you can redistribute it and/or
 *  modify it under the terms of the GNU Lesser General Public
 *  License as published by the Free Software Foundation; either
 *  version 2 of the License, or (at your option) any later version.
 *
 *  This library is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 *  Lesser General Public License for more details.
 *
 *  You should have received a copy of the GNU Lesser General Public
 *  License along with this library; if not, write to the Free Software
 *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
 *
 *  Yunhong Jiang <yunhong.jiang@intel.com>
 *  Yaozu (Eddie) Dong <eddie.dong@intel.com>
 *  Based on Xen 3.1 code.
 */

30
#include <linux/kvm_host.h>
E
Eddie Dong 已提交
31 32 33 34 35 36
#include <linux/kvm.h>
#include <linux/mm.h>
#include <linux/highmem.h>
#include <linux/smp.h>
#include <linux/hrtimer.h>
#include <linux/io.h>
37
#include <linux/slab.h>
E
Eddie Dong 已提交
38 39 40
#include <asm/processor.h>
#include <asm/page.h>
#include <asm/current.h>
41
#include <trace/events/kvm.h>
42 43 44

#include "ioapic.h"
#include "lapic.h"
M
Marcelo Tosatti 已提交
45
#include "irq.h"
46

47 48 49
/*
 * Debug tracing for the emulated IOAPIC.  Change the condition to 1 to send
 * the messages through printk(); otherwise every call compiles away.
 */
#if 0
#define ioapic_debug(fmt,arg...) printk(KERN_WARNING fmt,##arg)
#else
/*
 * Expand to a complete no-op statement (rather than to nothing) so a call
 * behaves like an ordinary statement inside an unbraced if/else.
 */
#define ioapic_debug(fmt, arg...) do { } while (0)
#endif
52
/* Forward declaration: ioapic_service() calls this before its definition. */
static int ioapic_deliver(struct kvm_ioapic *vioapic, int irq);
E
Eddie Dong 已提交
53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88

/*
 * Read the register currently selected by ioapic->ioregsel.
 *
 * @ioapic: emulated IOAPIC whose ioregsel picks the register
 * @addr:   not used by this function
 * @length: not used by this function
 *
 * Returns the 32-bit register contents:
 *  - VERSION: (number of pins - 1) in bits 16-23, version id in bits 0-7;
 *  - APIC ID / ARB ID: the 4-bit id in bits 24-27;
 *  - anything else is treated as a redirection-table access, where an odd
 *    selector reads the high 32 bits of the entry and an even one the low
 *    32 bits.
 *
 * The selector is written by the guest, so it may not map to an existing
 * pin.  Such reads return all-ones instead of indexing past redirtbl[].
 */
static unsigned long ioapic_read_indirect(struct kvm_ioapic *ioapic,
					  unsigned long addr,
					  unsigned long length)
{
	unsigned long result = 0;

	switch (ioapic->ioregsel) {
	case IOAPIC_REG_VERSION:
		result = ((((IOAPIC_NUM_PINS - 1) & 0xff) << 16)
			  | (IOAPIC_VERSION_ID & 0xff));
		break;

	case IOAPIC_REG_APIC_ID:
	case IOAPIC_REG_ARB_ID:
		result = ((ioapic->id & 0xf) << 24);
		break;

	default:
		{
			u32 redir_index = (ioapic->ioregsel - 0x10) >> 1;
			u64 redir_content;

			/*
			 * A real range check is required here: a debug-only
			 * assertion would let the guest read beyond the table.
			 */
			if (redir_index < IOAPIC_NUM_PINS)
				redir_content =
					ioapic->redirtbl[redir_index].bits;
			else
				redir_content = ~0ULL;

			result = (ioapic->ioregsel & 0x1) ?
			    (redir_content >> 32) & 0xffffffff :
			    redir_content & 0xffffffff;
			break;
		}
	}

	return result;
}

89
static int ioapic_service(struct kvm_ioapic *ioapic, unsigned int idx)
E
Eddie Dong 已提交
90
{
S
Sheng Yang 已提交
91
	union kvm_ioapic_redirect_entry *pent;
92
	int injected = -1;
E
Eddie Dong 已提交
93 94 95 96

	pent = &ioapic->redirtbl[idx];

	if (!pent->fields.mask) {
97
		injected = ioapic_deliver(ioapic, idx);
98
		if (injected && pent->fields.trig_mode == IOAPIC_LEVEL_TRIG)
E
Eddie Dong 已提交
99 100
			pent->fields.remote_irr = 1;
	}
101 102

	return injected;
E
Eddie Dong 已提交
103 104
}

105 106 107 108 109 110 111 112 113 114 115 116 117
static void update_handled_vectors(struct kvm_ioapic *ioapic)
{
	DECLARE_BITMAP(handled_vectors, 256);
	int i;

	memset(handled_vectors, 0, sizeof(handled_vectors));
	for (i = 0; i < IOAPIC_NUM_PINS; ++i)
		__set_bit(ioapic->redirtbl[i].fields.vector, handled_vectors);
	memcpy(ioapic->handled_vectors, handled_vectors,
	       sizeof(handled_vectors));
	smp_wmb();
}

E
Eddie Dong 已提交
118 119 120
/*
 * Write @val to the register currently selected by ioapic->ioregsel.
 *
 * VERSION and ARB ID writes are ignored; an APIC ID write stores bits
 * 24-27 of @val.  Every other selector addresses one 32-bit half of a
 * redirection-table entry (odd selector = high half, even = low half);
 * selectors that do not map to a pin are dropped.
 *
 * After a table write the handled-vector bitmap is rebuilt, mask notifiers
 * fire if the entry's mask bit changed, and a level-triggered entry whose
 * irr bit is set is serviced.
 */
static void ioapic_write_indirect(struct kvm_ioapic *ioapic, u32 val)
{
	union kvm_ioapic_redirect_entry *entry;
	bool was_masked, now_masked;
	unsigned pin;

	switch (ioapic->ioregsel) {
	case IOAPIC_REG_VERSION:
	case IOAPIC_REG_ARB_ID:
		/* Writes are ignored. */
		return;

	case IOAPIC_REG_APIC_ID:
		ioapic->id = (val >> 24) & 0xf;
		return;

	default:
		break;
	}

	pin = (ioapic->ioregsel - 0x10) >> 1;

	ioapic_debug("change redir index %x val %x\n", pin, val);
	if (pin >= IOAPIC_NUM_PINS)
		return;

	entry = &ioapic->redirtbl[pin];
	was_masked = entry->fields.mask;

	if (ioapic->ioregsel & 1) {
		/* High half: keep the low 32 bits, replace the upper ones. */
		entry->bits = (entry->bits & 0xffffffff) | ((u64) val << 32);
	} else {
		/* Low half: keep the high 32 bits, replace the lower ones. */
		entry->bits = (entry->bits & ~0xffffffffULL) | (u32) val;
		/* A low-half write always leaves remote_irr cleared. */
		entry->fields.remote_irr = 0;
	}

	update_handled_vectors(ioapic);

	now_masked = entry->fields.mask;
	if (was_masked != now_masked)
		kvm_fire_mask_notifiers(ioapic->kvm, KVM_IRQCHIP_IOAPIC, pin,
					now_masked);

	if (entry->fields.trig_mode == IOAPIC_LEVEL_TRIG &&
	    (ioapic->irr & (1 << pin)))
		ioapic_service(ioapic, pin);
}

163 164
static int ioapic_deliver(struct kvm_ioapic *ioapic, int irq)
{
165 166
	union kvm_ioapic_redirect_entry *entry = &ioapic->redirtbl[irq];
	struct kvm_lapic_irq irqe;
167 168 169

	ioapic_debug("dest=%x dest_mode=%x delivery_mode=%x "
		     "vector=%x trig_mode=%x\n",
170
		     entry->fields.dest_id, entry->fields.dest_mode,
171 172 173 174 175 176 177 178 179 180
		     entry->fields.delivery_mode, entry->fields.vector,
		     entry->fields.trig_mode);

	irqe.dest_id = entry->fields.dest_id;
	irqe.vector = entry->fields.vector;
	irqe.dest_mode = entry->fields.dest_mode;
	irqe.trig_mode = entry->fields.trig_mode;
	irqe.delivery_mode = entry->fields.delivery_mode << 8;
	irqe.level = 1;
	irqe.shorthand = 0;
181 182 183 184

#ifdef CONFIG_X86
	/* Always delivery PIT interrupt to vcpu 0 */
	if (irq == 0) {
185
		irqe.dest_mode = 0; /* Physical mode. */
186 187
		/* need to read apic_id from apic regiest since
		 * it can be rewritten */
188
		irqe.dest_id = ioapic->kvm->bsp_vcpu_id;
189 190
	}
#endif
191
	return kvm_irq_delivery_to_apic(ioapic->kvm, NULL, &irqe);
192 193
}

194 195
int kvm_ioapic_set_irq(struct kvm_ioapic *ioapic, int irq, int irq_source_id,
		       int level)
E
Eddie Dong 已提交
196
{
197
	u32 old_irr;
E
Eddie Dong 已提交
198
	u32 mask = 1 << irq;
S
Sheng Yang 已提交
199
	union kvm_ioapic_redirect_entry entry;
200
	int ret = 1;
E
Eddie Dong 已提交
201

202
	spin_lock(&ioapic->lock);
203
	old_irr = ioapic->irr;
E
Eddie Dong 已提交
204
	if (irq >= 0 && irq < IOAPIC_NUM_PINS) {
205 206
		int irq_level = __kvm_irq_line_state(&ioapic->irq_states[irq],
						     irq_source_id, level);
E
Eddie Dong 已提交
207
		entry = ioapic->redirtbl[irq];
208 209
		irq_level ^= entry.fields.polarity;
		if (!irq_level)
E
Eddie Dong 已提交
210 211
			ioapic->irr &= ~mask;
		else {
212
			int edge = (entry.fields.trig_mode == IOAPIC_EDGE_TRIG);
E
Eddie Dong 已提交
213
			ioapic->irr |= mask;
214 215
			if ((edge && old_irr != ioapic->irr) ||
			    (!edge && !entry.fields.remote_irr))
216
				ret = ioapic_service(ioapic, irq);
217 218
			else
				ret = 0; /* report coalesced interrupt */
E
Eddie Dong 已提交
219
		}
220
		trace_kvm_ioapic_set_irq(entry.bits, irq, ret == 0);
E
Eddie Dong 已提交
221
	}
222
	spin_unlock(&ioapic->lock);
G
Gleb Natapov 已提交
223

224
	return ret;
E
Eddie Dong 已提交
225 226
}

227 228 229 230 231 232 233 234 235 236
/*
 * Clear bit @irq_source_id in the irq_states word of every pin, under
 * ioapic->lock.
 */
void kvm_ioapic_clear_all(struct kvm_ioapic *ioapic, int irq_source_id)
{
	int pin = 0;

	spin_lock(&ioapic->lock);
	while (pin < KVM_IOAPIC_NUM_PINS) {
		__clear_bit(irq_source_id, &ioapic->irq_states[pin]);
		pin++;
	}
	spin_unlock(&ioapic->lock);
}

G
Gleb Natapov 已提交
237 238
static void __kvm_ioapic_update_eoi(struct kvm_ioapic *ioapic, int vector,
				     int trigger_mode)
E
Eddie Dong 已提交
239
{
G
Gleb Natapov 已提交
240 241 242 243
	int i;

	for (i = 0; i < IOAPIC_NUM_PINS; i++) {
		union kvm_ioapic_redirect_entry *ent = &ioapic->redirtbl[i];
E
Eddie Dong 已提交
244

G
Gleb Natapov 已提交
245 246
		if (ent->fields.vector != vector)
			continue;
E
Eddie Dong 已提交
247

G
Gleb Natapov 已提交
248 249 250 251 252 253 254 255
		/*
		 * We are dropping lock while calling ack notifiers because ack
		 * notifier callbacks for assigned devices call into IOAPIC
		 * recursively. Since remote_irr is cleared only after call
		 * to notifiers if the same vector will be delivered while lock
		 * is dropped it will be put into irr and will be delivered
		 * after ack notifier returns.
		 */
256
		spin_unlock(&ioapic->lock);
G
Gleb Natapov 已提交
257
		kvm_notify_acked_irq(ioapic->kvm, KVM_IRQCHIP_IOAPIC, i);
258
		spin_lock(&ioapic->lock);
G
Gleb Natapov 已提交
259 260 261

		if (trigger_mode != IOAPIC_LEVEL_TRIG)
			continue;
M
Marcelo Tosatti 已提交
262 263 264

		ASSERT(ent->fields.trig_mode == IOAPIC_LEVEL_TRIG);
		ent->fields.remote_irr = 0;
G
Gleb Natapov 已提交
265 266
		if (!ent->fields.mask && (ioapic->irr & (1 << i)))
			ioapic_service(ioapic, i);
M
Marcelo Tosatti 已提交
267
	}
E
Eddie Dong 已提交
268 269
}

M
Michael S. Tsirkin 已提交
270 271 272 273 274 275 276
/*
 * Report whether @vector is set in the IOAPIC's handled_vectors bitmap.
 * No lock is taken here; the read is preceded by a read barrier.
 */
bool kvm_ioapic_handles_vector(struct kvm *kvm, int vector)
{
	struct kvm_ioapic *ioapic = kvm->arch.vioapic;
	/* NOTE(review): presumably pairs with the smp_wmb() in update_handled_vectors() - confirm. */
	smp_rmb();
	return test_bit(vector, ioapic->handled_vectors);
}

M
Marcelo Tosatti 已提交
277
void kvm_ioapic_update_eoi(struct kvm *kvm, int vector, int trigger_mode)
278 279 280
{
	struct kvm_ioapic *ioapic = kvm->arch.vioapic;

281
	spin_lock(&ioapic->lock);
G
Gleb Natapov 已提交
282
	__kvm_ioapic_update_eoi(ioapic, vector, trigger_mode);
283
	spin_unlock(&ioapic->lock);
284 285
}

G
Gregory Haskins 已提交
286 287 288 289 290
/* Map an embedded kvm_io_device back to the kvm_ioapic that contains it. */
static inline struct kvm_ioapic *to_ioapic(struct kvm_io_device *dev)
{
	struct kvm_ioapic *owner = container_of(dev, struct kvm_ioapic, dev);

	return owner;
}

291
/*
 * Return non-zero when @addr lies inside the IOAPIC MMIO window
 * [base_address, base_address + IOAPIC_MEM_LENGTH), zero otherwise.
 */
static inline int ioapic_in_range(struct kvm_ioapic *ioapic, gpa_t addr)
{
	if (addr < ioapic->base_address)
		return 0;

	return addr < ioapic->base_address + IOAPIC_MEM_LENGTH;
}

297 298
/*
 * MMIO read callback for the IOAPIC window.
 *
 * Returns -EOPNOTSUPP when @addr is outside the window, 0 otherwise.  The
 * SELECT register yields ioregsel, the WINDOW register yields the
 * indirectly selected register, and any other offset reads as 0.  The
 * value is stored to @val for lengths 1, 2, 4 and 8; other lengths only
 * log a warning and leave @val untouched.
 */
static int ioapic_mmio_read(struct kvm_io_device *this, gpa_t addr, int len,
			    void *val)
{
	struct kvm_ioapic *ioapic = to_ioapic(this);
	u32 result = 0;

	if (!ioapic_in_range(ioapic, addr))
		return -EOPNOTSUPP;

	ioapic_debug("addr %lx\n", (unsigned long)addr);
	ASSERT(!(addr & 0xf));	/* check alignment */

	/* Only the offset within the window selects the register. */
	addr &= 0xff;

	spin_lock(&ioapic->lock);
	if (addr == IOAPIC_REG_SELECT)
		result = ioapic->ioregsel;
	else if (addr == IOAPIC_REG_WINDOW)
		result = ioapic_read_indirect(ioapic, addr, len);
	spin_unlock(&ioapic->lock);

	if (len == 8)
		*(u64 *) val = result;
	else if (len == 1 || len == 2 || len == 4)
		memcpy(val, (char *)&result, len);
	else
		printk(KERN_WARNING "ioapic: wrong length %d\n", len);

	return 0;
}

340 341
/*
 * MMIO write callback for the IOAPIC window.
 *
 * Returns -EOPNOTSUPP when @addr is outside the window, 0 otherwise.  At
 * most 32 bits of @val are consumed (an 8-byte write uses its first four
 * bytes); unsupported lengths are logged and dropped.  A SELECT write
 * stores the low 8 bits in ioregsel, a WINDOW write goes to the indirectly
 * selected register, and other offsets are ignored (apart from the EOI
 * register on IA64 builds).
 */
static int ioapic_mmio_write(struct kvm_io_device *this, gpa_t addr, int len,
			     const void *val)
{
	struct kvm_ioapic *ioapic = to_ioapic(this);
	u32 data;

	if (!ioapic_in_range(ioapic, addr))
		return -EOPNOTSUPP;

	ioapic_debug("ioapic_mmio_write addr=%p len=%d val=%p\n",
		     (void*)addr, len, val);
	ASSERT(!(addr & 0xf));	/* check alignment */

	if (len == 8 || len == 4) {
		data = *(const u32 *) val;
	} else if (len == 2) {
		data = *(const u16 *) val;
	} else if (len == 1) {
		data = *(const u8 *) val;
	} else {
		printk(KERN_WARNING "ioapic: Unsupported size %d\n", len);
		return 0;
	}

	/* Only the offset within the window selects the register. */
	addr &= 0xff;

	spin_lock(&ioapic->lock);
	switch (addr) {
	case IOAPIC_REG_SELECT:
		ioapic->ioregsel = data & 0xFF; /* 8-bit register */
		break;

	case IOAPIC_REG_WINDOW:
		ioapic_write_indirect(ioapic, data);
		break;
#ifdef	CONFIG_IA64
	case IOAPIC_REG_EOI:
		__kvm_ioapic_update_eoi(ioapic, data, IOAPIC_LEVEL_TRIG);
		break;
#endif

	default:
		break;
	}
	spin_unlock(&ioapic->lock);

	return 0;
}

391 392 393 394 395 396 397 398 399 400
/*
 * Put the IOAPIC into its reset state: id, irr and ioregsel zeroed, the
 * default MMIO base address restored, every redirection entry masked, and
 * the handled-vector bitmap rebuilt.  No lock is taken here.
 */
void kvm_ioapic_reset(struct kvm_ioapic *ioapic)
{
	int pin;

	ioapic->id = 0;
	ioapic->irr = 0;
	ioapic->ioregsel = 0;
	ioapic->base_address = IOAPIC_DEFAULT_BASE_ADDRESS;

	for (pin = 0; pin < IOAPIC_NUM_PINS; pin++)
		ioapic->redirtbl[pin].fields.mask = 1;

	update_handled_vectors(ioapic);
}

G
Gregory Haskins 已提交
404 405 406 407 408
/* MMIO callbacks for the IOAPIC device; handed to kvm_iodevice_init() in kvm_ioapic_init(). */
static const struct kvm_io_device_ops ioapic_mmio_ops = {
	.read     = ioapic_mmio_read,
	.write    = ioapic_mmio_write,
};

E
Eddie Dong 已提交
409 410 411
int kvm_ioapic_init(struct kvm *kvm)
{
	struct kvm_ioapic *ioapic;
412
	int ret;
E
Eddie Dong 已提交
413 414 415 416

	ioapic = kzalloc(sizeof(struct kvm_ioapic), GFP_KERNEL);
	if (!ioapic)
		return -ENOMEM;
417
	spin_lock_init(&ioapic->lock);
418
	kvm->arch.vioapic = ioapic;
419
	kvm_ioapic_reset(ioapic);
G
Gregory Haskins 已提交
420
	kvm_iodevice_init(&ioapic->dev, &ioapic_mmio_ops);
E
Eddie Dong 已提交
421
	ioapic->kvm = kvm;
422
	mutex_lock(&kvm->slots_lock);
423 424
	ret = kvm_io_bus_register_dev(kvm, KVM_MMIO_BUS, ioapic->base_address,
				      IOAPIC_MEM_LENGTH, &ioapic->dev);
425
	mutex_unlock(&kvm->slots_lock);
426 427
	if (ret < 0) {
		kvm->arch.vioapic = NULL;
428
		kfree(ioapic);
429
	}
430 431

	return ret;
E
Eddie Dong 已提交
432
}
433

434 435 436 437 438 439 440 441 442 443 444
/*
 * Tear down the VM's IOAPIC, if there is one: unregister it from the MMIO
 * bus, clear kvm->arch.vioapic and free the structure.
 */
void kvm_ioapic_destroy(struct kvm *kvm)
{
	struct kvm_ioapic *ioapic = kvm->arch.vioapic;

	if (!ioapic)
		return;

	kvm_io_bus_unregister_dev(kvm, KVM_MMIO_BUS, &ioapic->dev);
	kvm->arch.vioapic = NULL;
	kfree(ioapic);
}

G
Gleb Natapov 已提交
445 446 447 448 449 450
int kvm_get_ioapic(struct kvm *kvm, struct kvm_ioapic_state *state)
{
	struct kvm_ioapic *ioapic = ioapic_irqchip(kvm);
	if (!ioapic)
		return -EINVAL;

451
	spin_lock(&ioapic->lock);
G
Gleb Natapov 已提交
452
	memcpy(state, ioapic, sizeof(struct kvm_ioapic_state));
453
	spin_unlock(&ioapic->lock);
G
Gleb Natapov 已提交
454 455 456 457 458 459 460 461 462
	return 0;
}

int kvm_set_ioapic(struct kvm *kvm, struct kvm_ioapic_state *state)
{
	struct kvm_ioapic *ioapic = ioapic_irqchip(kvm);
	if (!ioapic)
		return -EINVAL;

463
	spin_lock(&ioapic->lock);
G
Gleb Natapov 已提交
464
	memcpy(ioapic, state, sizeof(struct kvm_ioapic_state));
465
	update_handled_vectors(ioapic);
466
	spin_unlock(&ioapic->lock);
G
Gleb Natapov 已提交
467 468
	return 0;
}