irq_remapping.c 8.6 KB
Newer Older
1
#include <linux/seq_file.h>
2
#include <linux/cpumask.h>
3 4 5
#include <linux/kernel.h>
#include <linux/string.h>
#include <linux/errno.h>
J
Joerg Roedel 已提交
6
#include <linux/msi.h>
7 8
#include <linux/irq.h>
#include <linux/pci.h>
J
Joerg Roedel 已提交
9 10 11

#include <asm/hw_irq.h>
#include <asm/irq_remapping.h>
12 13 14
#include <asm/processor.h>
#include <asm/x86_init.h>
#include <asm/apic.h>
15

16
#include "irq_remapping.h"
17

18
/* Tested by the entry points in this file before remapping-only paths run. */
int irq_remapping_enabled;

/* Set by "nointremap" and "intremap=off"; cleared by "intremap=on". */
int disable_irq_remap;
/* Set to 1 by set_irq_remapping_broken(). */
int irq_remap_broken;
/* Set by "intremap=nosid". */
int disable_sourceid_checking;
/* Set by "intremap=no_x2apic_optout". */
int no_x2apic_optout;

/* Backend callbacks chosen by setup_irq_remapping_ops(); NULL before that. */
static struct irq_remap_ops *remap_ops;

27 28 29
/*
 * Forward declarations: the MSI setup paths below call these wrappers
 * before their definitions appear further down in this file.
 */
static int msi_alloc_remapped_irq(struct pci_dev *pdev, int irq, int nvec);
static int msi_setup_remapped_irq(struct pci_dev *pdev, unsigned int irq,
				  int index, int sub_handle);
30 31 32
/*
 * Forward declaration: irq_remapping_modify_x86_ops() installs this
 * function into x86_io_apic_ops before its definition further down.
 */
static int set_remapped_irq_affinity(struct irq_data *data,
				     const struct cpumask *mask,
				     bool force);
33

34 35 36 37 38
/* True when @cfg has its remapped field set to exactly 1. */
static bool irq_remapped(struct irq_cfg *cfg)
{
	bool is_remapped = cfg->remapped == 1;

	return is_remapped;
}

39 40 41 42 43 44 45 46 47 48 49 50 51
/*
 * IO-APIC disable hook used while interrupt remapping is active.
 *
 * Only virtual wire mode A is used here.  Mode B would also require
 * programming both the IOAPIC RTE and the interrupt-remapping table
 * entry, and since this path runs during crash dump it is kept simple.
 */
static void irq_remapping_disable_io_apic(void)
{
	/* Nothing to disconnect when no APIC is present or configured. */
	if (!cpu_has_apic && !apic_from_smp_config())
		return;

	disconnect_bsp_APIC(0);
}

52 53
/*
 * Set up @nvec remapped IRQs for the single MSI descriptor of @dev.
 *
 * The WARN_ONs flag a device whose msi_list is not a single entry or whose
 * descriptor already has irq, msi_attrib.multiple or nvec_used set.
 * msi_alloc_remapped_irq() is called once, for the first IRQ, with the
 * vector count rounded up to a power of two.  Every further IRQ goes
 * through msi_setup_remapped_irq() with the returned index and its
 * sub-handle.
 *
 * Returns 0 on success, -ENOSPC when __create_irqs() yields no IRQ, or the
 * negative value of whichever helper failed.
 */
static int do_setup_msi_irqs(struct pci_dev *dev, int nvec)
{
	struct msi_desc *msidesc;
	unsigned int irq;
	int node, ret, sub_handle, nvec_pow2, index = 0;

	WARN_ON(!list_is_singular(&dev->msi_list));
	msidesc = list_entry(dev->msi_list.next, struct msi_desc, list);
	WARN_ON(msidesc->irq);
	WARN_ON(msidesc->msi_attrib.multiple);
	WARN_ON(msidesc->nvec_used);

	node = dev_to_node(&dev->dev);
	irq = __create_irqs(get_nr_irqs_gsi(), nvec, node);
	if (!irq)
		return -ENOSPC;

	nvec_pow2 = __roundup_pow_of_two(nvec);
	msidesc->nvec_used = nvec;
	msidesc->msi_attrib.multiple = ilog2(nvec_pow2);

	for (sub_handle = 0; sub_handle < nvec; sub_handle++) {
		if (sub_handle == 0) {
			/* First vector: obtain the index shared by the rest. */
			index = msi_alloc_remapped_irq(dev, irq, nvec_pow2);
			ret = index;
		} else {
			ret = msi_setup_remapped_irq(dev, irq + sub_handle,
						     index, sub_handle);
		}
		if (ret < 0)
			goto undo;

		ret = setup_msi_irq(dev, msidesc, irq, sub_handle);
		if (ret < 0)
			goto undo;
	}
	return 0;

undo:
	destroy_irqs(irq, nvec);

	/*
	 * Put the descriptor fields touched above back to zero so that
	 * default_teardown_msi_irqs() does not tear down the IRQs that
	 * were just destroyed a second time.
	 */
	msidesc->irq = 0;
	msidesc->nvec_used = 0;
	msidesc->msi_attrib.multiple = 0;

	return ret;
}

/*
 * Set up one remapped IRQ for every MSI-X descriptor on @dev's msi_list.
 *
 * IRQ numbers are requested starting at get_nr_irqs_gsi().  The first
 * descriptor goes through msi_alloc_remapped_irq() with @nvec; each later
 * one goes through msi_setup_remapped_irq() with the index returned by
 * that first call and an increasing sub-handle.
 *
 * Returns 0 on success, -ENOSPC when create_irq_nr() yields no IRQ (the
 * same code do_setup_msi_irqs() uses for that condition), or the negative
 * value of whichever helper failed.  On a helper failure only the IRQ
 * created in the current iteration is destroyed here.
 */
static int do_setup_msix_irqs(struct pci_dev *dev, int nvec)
{
	int node, ret, sub_handle, index = 0;
	struct msi_desc *msidesc;
	unsigned int irq;

	node		= dev_to_node(&dev->dev);
	irq		= get_nr_irqs_gsi();
	sub_handle	= 0;

	list_for_each_entry(msidesc, &dev->msi_list, list) {

		irq = create_irq_nr(irq, node);
		if (irq == 0)
			return -ENOSPC;

		if (sub_handle == 0)
			ret = index = msi_alloc_remapped_irq(dev, irq, nvec);
		else
			ret = msi_setup_remapped_irq(dev, irq, index, sub_handle);

		if (ret < 0)
			goto error;

		ret = setup_msi_irq(dev, msidesc, irq, 0);
		if (ret < 0)
			goto error;

		sub_handle += 1;
		/* Ask for the next IRQ number on the following iteration. */
		irq        += 1;
	}

	return 0;

error:
	destroy_irq(irq);
	return ret;
}

/*
 * Dispatch on the capability @type: PCI_CAP_ID_MSI goes to
 * do_setup_msi_irqs(), every other value to do_setup_msix_irqs().
 * Returns whatever the selected helper returns.
 */
static int irq_remapping_setup_msi_irqs(struct pci_dev *dev,
					int nvec, int type)
{
	return (type == PCI_CAP_ID_MSI) ? do_setup_msi_irqs(dev, nvec)
					: do_setup_msix_irqs(dev, nvec);
}

153 154 155 156 157 158 159 160 161 162 163
/*
 * Issue the IO-APIC EOI for @pin on @apic.
 *
 * Under interrupt remapping the RTE carries the pin number as a virtual
 * vector, while the real vector is programmed in the remapping table
 * entry.  The EOI is therefore sent with @pin; @vector is not used.
 */
void eoi_ioapic_pin_remapped(int apic, int pin, int vector)
{
	io_apic_eoi(apic, pin);
}

164 165
/*
 * Point the x86 IO-APIC and MSI callback tables at the remapping-aware
 * functions defined in this file.
 */
static void __init irq_remapping_modify_x86_ops(void)
{
	/* IO-APIC callbacks */
	x86_io_apic_ops.disable = irq_remapping_disable_io_apic;
	x86_io_apic_ops.set_affinity = set_remapped_irq_affinity;
	x86_io_apic_ops.setup_entry = setup_ioapic_remapped_entry;
	x86_io_apic_ops.eoi_ioapic_pin = eoi_ioapic_pin_remapped;

	/* MSI and HPET-MSI callbacks */
	x86_msi.setup_msi_irqs = irq_remapping_setup_msi_irqs;
	x86_msi.setup_hpet_msi = setup_hpet_msi_remapped;
	x86_msi.compose_msi_msg = compose_remapped_msi_msg;
}

175 176
static __init int setup_nointremap(char *str)
{
177
	disable_irq_remap = 1;
178 179 180 181
	return 0;
}
early_param("nointremap", setup_nointremap);

182
static __init int setup_irqremap(char *str)
183 184 185 186 187 188
{
	if (!str)
		return -EINVAL;

	while (*str) {
		if (!strncmp(str, "on", 2))
189
			disable_irq_remap = 0;
190
		else if (!strncmp(str, "off", 3))
191
			disable_irq_remap = 1;
192 193 194 195 196 197 198 199 200 201 202 203
		else if (!strncmp(str, "nosid", 5))
			disable_sourceid_checking = 1;
		else if (!strncmp(str, "no_x2apic_optout", 16))
			no_x2apic_optout = 1;

		str += strcspn(str, ",");
		while (*str == ',')
			str++;
	}

	return 0;
}
204
early_param("intremap", setup_irqremap);
205

206
/*
 * Select the remapping backend stored in remap_ops: the Intel ops by
 * default, replaced by the AMD IOMMU ops when CONFIG_AMD_IOMMU is defined
 * and amd_iommu_irq_ops.prepare() returns 0.
 */
void __init setup_irq_remapping_ops(void)
{
	remap_ops = &intel_irq_remap_ops;

#ifdef CONFIG_AMD_IOMMU
	if (!amd_iommu_irq_ops.prepare())
		remap_ops = &amd_iommu_irq_ops;
#endif
}

216 217 218 219 220
/* Record that interrupt remapping is broken by setting irq_remap_broken. */
void set_irq_remapping_broken(void)
{
	irq_remap_broken = 1;
}

221
int irq_remapping_supported(void)
222
{
223
	if (disable_irq_remap)
224 225 226 227 228 229 230 231
		return 0;

	if (!remap_ops || !remap_ops->supported)
		return 0;

	return remap_ops->supported();
}

232
/*
 * Run the backend's prepare() hook and return its result, or -ENODEV
 * when there is no backend or it has no such hook.
 */
int __init irq_remapping_prepare(void)
{
	if (remap_ops && remap_ops->prepare)
		return remap_ops->prepare();

	return -ENODEV;
}

240
/*
 * Run the backend's enable() hook.  If irq_remapping_enabled is set once
 * the hook has returned, install the remapping-aware x86 callbacks.
 *
 * Returns -ENODEV when there is no backend or no enable() hook, otherwise
 * the hook's return value.
 */
int __init irq_remapping_enable(void)
{
	int rc;

	if (!(remap_ops && remap_ops->enable))
		return -ENODEV;

	rc = remap_ops->enable();
	if (irq_remapping_enabled)
		irq_remapping_modify_x86_ops();

	return rc;
}
254

255
void irq_remapping_disable(void)
256
{
257 258 259
	if (!irq_remapping_enabled ||
	    !remap_ops ||
	    !remap_ops->disable)
260 261
		return;

262
	remap_ops->disable();
263 264
}

265
int irq_remapping_reenable(int mode)
266
{
267 268 269
	if (!irq_remapping_enabled ||
	    !remap_ops ||
	    !remap_ops->reenable)
270 271
		return 0;

272
	return remap_ops->reenable(mode);
273 274
}

275
/*
 * Run the backend's enable_faulting() hook.
 *
 * Returns 0 when remapping is not enabled, -ENODEV when there is no
 * backend or no enable_faulting() hook, otherwise the hook's result.
 */
int __init irq_remap_enable_fault_handling(void)
{
	if (!irq_remapping_enabled)
		return 0;

	if (remap_ops && remap_ops->enable_faulting)
		return remap_ops->enable_faulting();

	return -ENODEV;
}
285

286 287 288 289
int setup_ioapic_remapped_entry(int irq,
				struct IO_APIC_route_entry *entry,
				unsigned int destination, int vector,
				struct io_apic_irq_attr *attr)
290 291 292 293 294 295 296
{
	if (!remap_ops || !remap_ops->setup_ioapic_entry)
		return -ENODEV;

	return remap_ops->setup_ioapic_entry(irq, entry, destination,
					     vector, attr);
}
297

298 299
/*
 * Forward an affinity change to the backend's set_affinity() hook and
 * return its result.  Returns 0 without calling anything when CONFIG_SMP
 * is not enabled or the backend has no such hook.
 */
int set_remapped_irq_affinity(struct irq_data *data, const struct cpumask *mask,
			      bool force)
{
	if (config_enabled(CONFIG_SMP) && remap_ops && remap_ops->set_affinity)
		return remap_ops->set_affinity(data, mask, force);

	return 0;
}
307

308
void free_remapped_irq(int irq)
309
{
310 311
	struct irq_cfg *cfg = irq_get_chip_data(irq);

312 313 314
	if (!remap_ops || !remap_ops->free_irq)
		return;

315 316
	if (irq_remapped(cfg))
		remap_ops->free_irq(irq);
317
}
318

319 320 321
/*
 * Compose the MSI message for @irq.
 *
 * An IRQ whose chip data is not marked as remapped is handed to
 * native_compose_msi_msg().  A remapped IRQ is handed to the backend's
 * compose_msi_msg() hook; when that hook is absent nothing is called and
 * @msg is not written here.
 */
void compose_remapped_msi_msg(struct pci_dev *pdev,
			      unsigned int irq, unsigned int dest,
			      struct msi_msg *msg, u8 hpet_id)
{
	struct irq_cfg *cfg = irq_get_chip_data(irq);

	if (!irq_remapped(cfg)) {
		native_compose_msi_msg(pdev, irq, dest, msg, hpet_id);
		return;
	}

	if (remap_ops && remap_ops->compose_msi_msg)
		remap_ops->compose_msi_msg(pdev, irq, dest, msg, hpet_id);
}

331
static int msi_alloc_remapped_irq(struct pci_dev *pdev, int irq, int nvec)
332 333 334 335 336 337 338
{
	if (!remap_ops || !remap_ops->msi_alloc_irq)
		return -ENODEV;

	return remap_ops->msi_alloc_irq(pdev, irq, nvec);
}

339 340
static int msi_setup_remapped_irq(struct pci_dev *pdev, unsigned int irq,
				  int index, int sub_handle)
341 342 343 344 345 346 347
{
	if (!remap_ops || !remap_ops->msi_setup_irq)
		return -ENODEV;

	return remap_ops->msi_setup_irq(pdev, irq, index, sub_handle);
}

348
int setup_hpet_msi_remapped(unsigned int irq, unsigned int id)
349 350 351 352 353 354
{
	if (!remap_ops || !remap_ops->setup_hpet_msi)
		return -ENODEV;

	return remap_ops->setup_hpet_msi(irq, id);
}
355 356 357 358 359 360

/*
 * Panic with @msg when interrupt remapping is enabled; otherwise do
 * nothing.
 *
 * @msg is printed through a fixed "%s" format so that any '%' characters
 * it contains are emitted literally instead of being parsed as conversion
 * specifiers.
 */
void panic_if_irq_remap(const char *msg)
{
	if (irq_remapping_enabled)
		panic("%s", msg);
}
361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384

/*
 * irq_ack callback installed by irq_remap_modify_chip_defaults(): it only
 * acknowledges the local APIC.  @data is unused.
 */
static void ir_ack_apic_edge(struct irq_data *data)
{
	ack_APIC_irq();
}

/*
 * irq_eoi callback installed by irq_remap_modify_chip_defaults(): it
 * acknowledges the local APIC, then issues the IO-APIC EOI for the IRQ
 * using the chip data attached to @data.
 */
static void ir_ack_apic_level(struct irq_data *data)
{
	ack_APIC_irq();
	eoi_ioapic_irq(data->irq, data->chip_data);
}

/* Print the chip name of @data to @p, prefixed with " IR-". */
static void ir_print_prefix(struct irq_data *data, struct seq_file *p)
{
	const char *chip_name = data->chip->name;

	seq_printf(p, " IR-%s", chip_name);
}

/*
 * Replace four callbacks of @chip with the remapping variants: the "IR-"
 * name printer, the edge ack, the level EOI, and whatever set_affinity
 * handler x86_io_apic_ops holds at the time of the call.
 */
void irq_remap_modify_chip_defaults(struct irq_chip *chip)
{
	chip->irq_print_chip = ir_print_prefix;

	chip->irq_ack = ir_ack_apic_edge;
	chip->irq_eoi = ir_ack_apic_level;

	chip->irq_set_affinity = x86_io_apic_ops.set_affinity;
}
385 386 387 388 389 390 391 392 393

/*
 * When @cfg is marked as remapped, set IRQ_MOVE_PCNTXT on @irq, switch
 * @chip to the remapping callbacks and return true.  Otherwise return
 * false and leave @irq and @chip untouched.
 */
bool setup_remapped_irq(int irq, struct irq_cfg *cfg, struct irq_chip *chip)
{
	if (irq_remapped(cfg)) {
		irq_set_status_flags(irq, IRQ_MOVE_PCNTXT);
		irq_remap_modify_chip_defaults(chip);
		return true;
	}

	return false;
}