irq_comm.c 10.9 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19
/*
 * irq_comm.c: Common API for in kernel interrupt controller
 * Copyright (c) 2007, Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc., 59 Temple
 * Place - Suite 330, Boston, MA 02111-1307 USA.
 * Authors:
 *   Yaozu (Eddie) Dong <Eddie.dong@intel.com>
 *
 * Copyright 2010 Red Hat, Inc. and/or its affiliates.
 */

#include <linux/kvm_host.h>
24
#include <linux/slab.h>
25
#include <linux/export.h>
26
#include <trace/events/kvm.h>
S
Sheng Yang 已提交
27 28 29

#include <asm/msidef.h>

30 31 32 33
#include "irq.h"

#include "ioapic.h"

34 35
#include "lapic.h"

36
/*
 * Routing-entry ->set handler for interrupts routed to the PIC.
 *
 * Forwards @level for the pin recorded in @e to the PIC of @kvm on behalf
 * of @irq_source_id.  @line_status is part of the common handler signature
 * and is not used here.
 *
 * Returns the value of kvm_pic_set_irq().
 */
static int kvm_set_pic_irq(struct kvm_kernel_irq_routing_entry *e,
			   struct kvm *kvm, int irq_source_id, int level,
			   bool line_status)
{
	return kvm_pic_set_irq(pic_irqchip(kvm), e->irqchip.pin,
			       irq_source_id, level);
}

44
/*
 * Routing-entry ->set handler for interrupts routed to the IOAPIC.
 *
 * Forwards @level and @line_status for the pin recorded in @e to the
 * IOAPIC of @kvm on behalf of @irq_source_id.
 *
 * Returns the value of kvm_ioapic_set_irq().
 */
static int kvm_set_ioapic_irq(struct kvm_kernel_irq_routing_entry *e,
			      struct kvm *kvm, int irq_source_id, int level,
			      bool line_status)
{
	return kvm_ioapic_set_irq(kvm->arch.vioapic, e->irqchip.pin,
				  irq_source_id, level, line_status);
}

53
int kvm_irq_delivery_to_apic(struct kvm *kvm, struct kvm_lapic *src,
54
		struct kvm_lapic_irq *irq, unsigned long *dest_map)
55 56 57 58 59
{
	int i, r = -1;
	struct kvm_vcpu *vcpu, *lowest = NULL;

	if (irq->dest_mode == 0 && irq->dest_id == 0xff &&
60
			kvm_lowest_prio_delivery(irq)) {
61
		printk(KERN_INFO "kvm: apic: phys broadcast and lowest prio\n");
62 63 64
		irq->delivery_mode = APIC_DM_FIXED;
	}

65
	if (kvm_irq_delivery_to_apic_fast(kvm, src, irq, &r, dest_map))
66
		return r;
67

68 69
	kvm_for_each_vcpu(i, vcpu, kvm) {
		if (!kvm_apic_present(vcpu))
70 71
			continue;

72 73
		if (!kvm_apic_match_dest(vcpu, src, irq->shorthand,
					irq->dest_id, irq->dest_mode))
74 75
			continue;

76
		if (!kvm_lowest_prio_delivery(irq)) {
77 78
			if (r < 0)
				r = 0;
79
			r += kvm_apic_set_irq(vcpu, irq, dest_map);
80
		} else if (kvm_lapic_enabled(vcpu)) {
81 82 83 84
			if (!lowest)
				lowest = vcpu;
			else if (kvm_apic_compare_prio(vcpu, lowest) < 0)
				lowest = vcpu;
85
		}
86 87
	}

88
	if (lowest)
89
		r = kvm_apic_set_irq(lowest, irq, dest_map);
90 91

	return r;
92 93
}

F
Feng Wu 已提交
94 95
void kvm_set_msi_irq(struct kvm_kernel_irq_routing_entry *e,
		     struct kvm_lapic_irq *irq)
M
Michael S. Tsirkin 已提交
96 97 98 99 100 101 102 103 104 105
{
	trace_kvm_msi_set_irq(e->msi.address_lo, e->msi.data);

	irq->dest_id = (e->msi.address_lo &
			MSI_ADDR_DEST_ID_MASK) >> MSI_ADDR_DEST_ID_SHIFT;
	irq->vector = (e->msi.data &
			MSI_DATA_VECTOR_MASK) >> MSI_DATA_VECTOR_SHIFT;
	irq->dest_mode = (1 << MSI_ADDR_DEST_MODE_SHIFT) & e->msi.address_lo;
	irq->trig_mode = (1 << MSI_DATA_TRIGGER_SHIFT) & e->msi.data;
	irq->delivery_mode = e->msi.data & 0x700;
106 107
	irq->msi_redir_hint = ((e->msi.address_lo
		& MSI_ADDR_REDIRECTION_LOWPRI) > 0);
M
Michael S. Tsirkin 已提交
108 109 110
	irq->level = 1;
	irq->shorthand = 0;
}
F
Feng Wu 已提交
111
EXPORT_SYMBOL_GPL(kvm_set_msi_irq);
M
Michael S. Tsirkin 已提交
112

113
/*
 * Routing-entry ->set handler for MSI routes.
 *
 * A zero @level is rejected with -1.  Otherwise the MSI message in @e is
 * decoded and handed to kvm_irq_delivery_to_apic(), whose result is
 * returned.  @irq_source_id and @line_status are not used here.
 */
int kvm_set_msi(struct kvm_kernel_irq_routing_entry *e,
		struct kvm *kvm, int irq_source_id, int level, bool line_status)
{
	struct kvm_lapic_irq irq;

	if (level) {
		kvm_set_msi_irq(e, &irq);
		return kvm_irq_delivery_to_apic(kvm, NULL, &irq, NULL);
	}

	return -1;
}

M
Michael S. Tsirkin 已提交
126 127 128 129 130 131 132 133 134

static int kvm_set_msi_inatomic(struct kvm_kernel_irq_routing_entry *e,
			 struct kvm *kvm)
{
	struct kvm_lapic_irq irq;
	int r;

	kvm_set_msi_irq(e, &irq);

135
	if (kvm_irq_delivery_to_apic_fast(kvm, NULL, &irq, &r, NULL))
M
Michael S. Tsirkin 已提交
136 137 138 139 140 141 142 143 144 145 146 147 148 149
		return r;
	else
		return -EWOULDBLOCK;
}

/*
 * Deliver an IRQ from atomic context when that is possible; otherwise fail
 * so that the caller can retry from process context.
 *
 * Return value:
 *  -EWOULDBLOCK - cannot deliver in atomic context: retry in process context.
 *  -EINVAL      - no routing entry is mapped to the GSI @irq.
 *  Other values - no need to retry.
 */
int kvm_set_irq_inatomic(struct kvm *kvm, int irq_source_id, u32 irq, int level)
{
	struct kvm_kernel_irq_routing_entry entries[KVM_NR_IRQCHIPS];
	int srcu_idx;
	int ret = -EINVAL;

	trace_kvm_set_irq(irq, level, irq_source_id);

	/*
	 * Injection into either PIC or IOAPIC might need to scan all CPUs,
	 * which would need to be retried from thread context; when the same
	 * GSI is connected to both PIC and IOAPIC, we'd have to report a
	 * partial failure here.
	 * Since there's no easy way to do this, we only support injecting MSI,
	 * which is limited to 1:1 GSI mapping.
	 */
	srcu_idx = srcu_read_lock(&kvm->irq_srcu);
	if (kvm_irq_map_gsi(kvm, entries, irq) > 0) {
		/* Only the first mapped entry is considered. */
		if (likely(entries[0].type == KVM_IRQ_ROUTING_MSI))
			ret = kvm_set_msi_inatomic(&entries[0], kvm);
		else
			ret = -EWOULDBLOCK;
	}
	srcu_read_unlock(&kvm->irq_srcu, srcu_idx);

	return ret;
}

177 178 179
int kvm_request_irq_source_id(struct kvm *kvm)
{
	unsigned long *bitmap = &kvm->arch.irq_sources_bitmap;
180 181 182
	int irq_source_id;

	mutex_lock(&kvm->irq_lock);
183
	irq_source_id = find_first_zero_bit(bitmap, BITS_PER_LONG);
184

185
	if (irq_source_id >= BITS_PER_LONG) {
186
		printk(KERN_WARNING "kvm: exhaust allocatable IRQ sources!\n");
187 188
		irq_source_id = -EFAULT;
		goto unlock;
189 190 191
	}

	ASSERT(irq_source_id != KVM_USERSPACE_IRQ_SOURCE_ID);
192
	ASSERT(irq_source_id != KVM_IRQFD_RESAMPLE_IRQ_SOURCE_ID);
193
	set_bit(irq_source_id, bitmap);
194
unlock:
195
	mutex_unlock(&kvm->irq_lock);
196

197 198 199 200 201
	return irq_source_id;
}

void kvm_free_irq_source_id(struct kvm *kvm, int irq_source_id)
{
202
	ASSERT(irq_source_id != KVM_USERSPACE_IRQ_SOURCE_ID);
203
	ASSERT(irq_source_id != KVM_IRQFD_RESAMPLE_IRQ_SOURCE_ID);
204

205
	mutex_lock(&kvm->irq_lock);
206
	if (irq_source_id < 0 ||
207
	    irq_source_id >= BITS_PER_LONG) {
208
		printk(KERN_ERR "kvm: IRQ source ID out of range!\n");
209
		goto unlock;
210
	}
211
	clear_bit(irq_source_id, &kvm->arch.irq_sources_bitmap);
212
	if (!ioapic_in_kernel(kvm))
213 214
		goto unlock;

215 216
	kvm_ioapic_clear_all(kvm->arch.vioapic, irq_source_id);
	kvm_pic_clear_all(pic_irqchip(kvm), irq_source_id);
217
unlock:
218
	mutex_unlock(&kvm->irq_lock);
219
}
220 221 222 223

void kvm_register_irq_mask_notifier(struct kvm *kvm, int irq,
				    struct kvm_irq_mask_notifier *kimn)
{
224
	mutex_lock(&kvm->irq_lock);
225
	kimn->irq = irq;
226
	hlist_add_head_rcu(&kimn->link, &kvm->arch.mask_notifier_list);
227
	mutex_unlock(&kvm->irq_lock);
228 229 230 231 232
}

void kvm_unregister_irq_mask_notifier(struct kvm *kvm, int irq,
				      struct kvm_irq_mask_notifier *kimn)
{
233
	mutex_lock(&kvm->irq_lock);
234
	hlist_del_rcu(&kimn->link);
235
	mutex_unlock(&kvm->irq_lock);
236
	synchronize_srcu(&kvm->irq_srcu);
237 238
}

239 240
/*
 * Invoke the mask notifiers registered for the GSI behind (@irqchip, @pin).
 *
 * The chip/pin pair is translated with kvm_irq_map_chip_pin(); when that
 * yields -1 nothing is called.  Otherwise every notifier on
 * kvm->arch.mask_notifier_list whose irq equals the GSI gets its ->func
 * called with @mask.  The whole operation runs inside an SRCU read-side
 * section on kvm->irq_srcu.
 */
void kvm_fire_mask_notifiers(struct kvm *kvm, unsigned irqchip, unsigned pin,
			     bool mask)
{
	struct kvm_irq_mask_notifier *kimn;
	int srcu_idx, gsi;

	srcu_idx = srcu_read_lock(&kvm->irq_srcu);

	gsi = kvm_irq_map_chip_pin(kvm, irqchip, pin);
	if (gsi == -1)
		goto out;

	hlist_for_each_entry_rcu(kimn, &kvm->arch.mask_notifier_list, link) {
		if (kimn->irq != gsi)
			continue;
		kimn->func(kimn, mask);
	}

out:
	srcu_read_unlock(&kvm->irq_srcu, srcu_idx);
}

254
int kvm_set_routing_entry(struct kvm_kernel_irq_routing_entry *e,
255
			  const struct kvm_irq_routing_entry *ue)
256 257 258
{
	int r = -EINVAL;
	int delta;
259
	unsigned max_pin;
260

261 262 263 264 265 266
	switch (ue->type) {
	case KVM_IRQ_ROUTING_IRQCHIP:
		delta = 0;
		switch (ue->u.irqchip.irqchip) {
		case KVM_IRQCHIP_PIC_MASTER:
			e->set = kvm_set_pic_irq;
267
			max_pin = PIC_NUM_PINS;
268 269
			break;
		case KVM_IRQCHIP_PIC_SLAVE:
270
			e->set = kvm_set_pic_irq;
271
			max_pin = PIC_NUM_PINS;
272 273 274
			delta = 8;
			break;
		case KVM_IRQCHIP_IOAPIC:
275
			max_pin = KVM_IOAPIC_NUM_PINS;
276
			e->set = kvm_set_ioapic_irq;
277 278 279 280 281 282
			break;
		default:
			goto out;
		}
		e->irqchip.irqchip = ue->u.irqchip.irqchip;
		e->irqchip.pin = ue->u.irqchip.pin + delta;
283
		if (e->irqchip.pin >= max_pin)
284
			goto out;
285
		break;
S
Sheng Yang 已提交
286 287 288 289 290 291
	case KVM_IRQ_ROUTING_MSI:
		e->set = kvm_set_msi;
		e->msi.address_lo = ue->u.msi.address_lo;
		e->msi.address_hi = ue->u.msi.address_hi;
		e->msi.data = ue->u.msi.data;
		break;
292 293 294
	default:
		goto out;
	}
295

296 297 298 299 300
	r = 0;
out:
	return r;
}

301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327
/*
 * Check whether @irq addresses exactly one vCPU of @kvm.
 *
 * The fast helper is consulted first.  On the slow path all vCPUs with a
 * present APIC are matched against the destination; *@dest_vcpu is set to
 * the first match and the search stops with false as soon as a second
 * match is seen.
 *
 * Returns true when exactly one vCPU matches, false otherwise.
 */
bool kvm_intr_is_single_vcpu(struct kvm *kvm, struct kvm_lapic_irq *irq,
			     struct kvm_vcpu **dest_vcpu)
{
	struct kvm_vcpu *vcpu;
	int matches = 0;
	int idx;

	if (kvm_intr_is_single_vcpu_fast(kvm, irq, dest_vcpu))
		return true;

	kvm_for_each_vcpu(idx, vcpu, kvm) {
		if (!kvm_apic_present(vcpu) ||
		    !kvm_apic_match_dest(vcpu, NULL, irq->shorthand,
					 irq->dest_id, irq->dest_mode))
			continue;

		/* A previous match exists: more than one destination. */
		if (matches++)
			return false;

		*dest_vcpu = vcpu;
	}

	return matches == 1;
}
EXPORT_SYMBOL_GPL(kvm_intr_is_single_vcpu);

328 329
#define IOAPIC_ROUTING_ENTRY(irq) \
	{ .gsi = irq, .type = KVM_IRQ_ROUTING_IRQCHIP,	\
330
	  .u.irqchip = { .irqchip = KVM_IRQCHIP_IOAPIC, .pin = (irq) } }
331 332
#define ROUTING_ENTRY1(irq) IOAPIC_ROUTING_ENTRY(irq)

333
#define PIC_ROUTING_ENTRY(irq) \
334
	{ .gsi = irq, .type = KVM_IRQ_ROUTING_IRQCHIP,	\
335
	  .u.irqchip = { .irqchip = SELECT_PIC(irq), .pin = (irq) % 8 } }
336
#define ROUTING_ENTRY2(irq) \
337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358
	IOAPIC_ROUTING_ENTRY(irq), PIC_ROUTING_ENTRY(irq)

static const struct kvm_irq_routing_entry default_routing[] = {
	ROUTING_ENTRY2(0), ROUTING_ENTRY2(1),
	ROUTING_ENTRY2(2), ROUTING_ENTRY2(3),
	ROUTING_ENTRY2(4), ROUTING_ENTRY2(5),
	ROUTING_ENTRY2(6), ROUTING_ENTRY2(7),
	ROUTING_ENTRY2(8), ROUTING_ENTRY2(9),
	ROUTING_ENTRY2(10), ROUTING_ENTRY2(11),
	ROUTING_ENTRY2(12), ROUTING_ENTRY2(13),
	ROUTING_ENTRY2(14), ROUTING_ENTRY2(15),
	ROUTING_ENTRY1(16), ROUTING_ENTRY1(17),
	ROUTING_ENTRY1(18), ROUTING_ENTRY1(19),
	ROUTING_ENTRY1(20), ROUTING_ENTRY1(21),
	ROUTING_ENTRY1(22), ROUTING_ENTRY1(23),
};

/*
 * Install the default_routing table as the IRQ routing of @kvm.
 * Returns the value of kvm_set_irq_routing().
 */
int kvm_setup_default_irq_routing(struct kvm *kvm)
{
	int ret;

	ret = kvm_set_irq_routing(kvm, default_routing,
				  ARRAY_SIZE(default_routing), 0);
	return ret;
}
359 360 361 362 363 364 365

/* Routing table without any entries. */
static const struct kvm_irq_routing_entry empty_routing[] = {};

/*
 * Install an empty IRQ routing table (zero entries) for @kvm.
 * Returns the value of kvm_set_irq_routing().
 */
int kvm_setup_empty_irq_routing(struct kvm *kvm)
{
	int ret;

	ret = kvm_set_irq_routing(kvm, empty_routing, 0, 0);
	return ret;
}
366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391

/*
 * Arch hook run on IRQ routing updates.
 *
 * Requests an IOAPIC scan only when the irqchip is in the kernel but the
 * IOAPIC itself is not; in every other configuration nothing is done.
 */
void kvm_arch_irq_routing_update(struct kvm *kvm)
{
	if (!ioapic_in_kernel(kvm) && irqchip_in_kernel(kvm))
		kvm_make_scan_ioapic_request(kvm);
}

/*
 * Mark in @eoi_exit_bitmap the vectors of level-triggered MSI routes that
 * target @vcpu.
 *
 * Only the first min(table->nr_rt_entries, nr_reserved_ioapic_pins) GSIs
 * of the current routing table are examined.  For each MSI entry whose
 * data word has MSI_DATA_TRIGGER_LEVEL set and whose destination matches
 * @vcpu, the bit for the entry's vector (low 8 bits of the data word) is
 * set.  The table is accessed inside an SRCU read-side section on
 * kvm->irq_srcu.
 */
void kvm_scan_ioapic_routes(struct kvm_vcpu *vcpu, u64 *eoi_exit_bitmap)
{
	struct kvm *kvm = vcpu->kvm;
	struct kvm_irq_routing_table *table;
	struct kvm_kernel_irq_routing_entry *entry;
	u32 gsi, nr_ioapic_pins;
	int srcu_idx;

	/* kvm->irq_routing must be read after clearing
	 * KVM_SCAN_IOAPIC. */
	smp_mb();

	srcu_idx = srcu_read_lock(&kvm->irq_srcu);
	table = srcu_dereference(kvm->irq_routing, &kvm->irq_srcu);
	nr_ioapic_pins = min_t(u32, table->nr_rt_entries,
			       kvm->arch.nr_reserved_ioapic_pins);

	for (gsi = 0; gsi < nr_ioapic_pins; ++gsi) {
		hlist_for_each_entry(entry, &table->map[gsi], link) {
			u32 dest_id, dest_mode, vector;

			if (entry->type != KVM_IRQ_ROUTING_MSI)
				continue;

			/* Edge-triggered routes do not need an EOI exit. */
			if (!(entry->msi.data & MSI_DATA_TRIGGER_LEVEL))
				continue;

			dest_id = (entry->msi.address_lo >> 12) & 0xff;
			dest_mode = (entry->msi.address_lo >> 2) & 0x1;
			if (!kvm_apic_match_dest(vcpu, NULL, 0,
						 dest_id, dest_mode))
				continue;

			vector = entry->msi.data & 0xff;
			__set_bit(vector, (unsigned long *) eoi_exit_bitmap);
		}
	}

	srcu_read_unlock(&kvm->irq_srcu, srcu_idx);
}