msi.c 17.9 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8
/*
 * File:	msi.c
 * Purpose:	PCI Message Signaled Interrupt (MSI)
 *
 * Copyright (C) 2003-2004 Intel
 * Copyright (C) Tom Long Nguyen (tom.l.nguyen@intel.com)
 */

9
#include <linux/err.h>
L
Linus Torvalds 已提交
10 11 12 13 14 15 16
#include <linux/mm.h>
#include <linux/irq.h>
#include <linux/interrupt.h>
#include <linux/init.h>
#include <linux/ioport.h>
#include <linux/pci.h>
#include <linux/proc_fs.h>
17
#include <linux/msi.h>
D
Dan Williams 已提交
18
#include <linux/smp.h>
L
Linus Torvalds 已提交
19 20 21 22 23 24 25 26 27

#include <asm/errno.h>
#include <asm/io.h>

#include "pci.h"
#include "msi.h"

static int pci_msi_enable = 1;

28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57
/*
 * Set (@enable != 0) or clear (@enable == 0) the MSI enable bit in the
 * flags word of @dev's MSI capability.  Does nothing when the device
 * has no MSI capability.
 */
static void msi_set_enable(struct pci_dev *dev, int enable)
{
	u16 flags;
	int cap = pci_find_capability(dev, PCI_CAP_ID_MSI);

	if (!cap)
		return;

	pci_read_config_word(dev, cap + PCI_MSI_FLAGS, &flags);
	if (enable)
		flags |= PCI_MSI_FLAGS_ENABLE;
	else
		flags &= ~PCI_MSI_FLAGS_ENABLE;
	pci_write_config_word(dev, cap + PCI_MSI_FLAGS, flags);
}

/*
 * Set (@enable != 0) or clear (@enable == 0) the MSI-X enable bit in the
 * flags word of @dev's MSI-X capability.  Does nothing when the device
 * has no MSI-X capability.
 */
static void msix_set_enable(struct pci_dev *dev, int enable)
{
	u16 flags;
	int cap = pci_find_capability(dev, PCI_CAP_ID_MSIX);

	if (!cap)
		return;

	pci_read_config_word(dev, cap + PCI_MSIX_FLAGS, &flags);
	if (enable)
		flags |= PCI_MSIX_FLAGS_ENABLE;
	else
		flags &= ~PCI_MSIX_FLAGS_ENABLE;
	pci_write_config_word(dev, cap + PCI_MSIX_FLAGS, flags);
}

M
Mitch Williams 已提交
58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80
/*
 * For an MSI-X irq, read back the vector control word of its table entry
 * (presumably to flush an earlier posted write to that entry).  For a
 * plain MSI irq there is nothing to do.  Any other descriptor type, or a
 * missing descriptor/device, is a BUG.
 */
static void msix_flush_writes(unsigned int irq)
{
	struct msi_desc *desc = get_irq_msi(irq);
	int offset;

	BUG_ON(!desc || !desc->dev);

	if (desc->msi_attrib.type == PCI_CAP_ID_MSI)
		return;		/* nothing to do */

	if (desc->msi_attrib.type != PCI_CAP_ID_MSIX) {
		BUG();
		return;
	}

	offset = desc->msi_attrib.entry_nr * PCI_MSIX_ENTRY_SIZE +
		PCI_MSIX_ENTRY_VECTOR_CTRL_OFFSET;
	readl(desc->mask_base + offset);
}

81
static void msi_set_mask_bit(unsigned int irq, int flag)
L
Linus Torvalds 已提交
82 83 84
{
	struct msi_desc *entry;

85
	entry = get_irq_msi(irq);
86
	BUG_ON(!entry || !entry->dev);
L
Linus Torvalds 已提交
87 88
	switch (entry->msi_attrib.type) {
	case PCI_CAP_ID_MSI:
89
		if (entry->msi_attrib.maskbit) {
S
Satoru Takeuchi 已提交
90 91
			int pos;
			u32 mask_bits;
92 93 94 95 96 97

			pos = (long)entry->mask_base;
			pci_read_config_dword(entry->dev, pos, &mask_bits);
			mask_bits &= ~(1);
			mask_bits |= flag;
			pci_write_config_dword(entry->dev, pos, mask_bits);
98 99
		} else {
			msi_set_enable(entry->dev, !flag);
100
		}
L
Linus Torvalds 已提交
101 102 103 104 105 106
		break;
	case PCI_CAP_ID_MSIX:
	{
		int offset = entry->msi_attrib.entry_nr * PCI_MSIX_ENTRY_SIZE +
			PCI_MSIX_ENTRY_VECTOR_CTRL_OFFSET;
		writel(flag, entry->mask_base + offset);
107
		readl(entry->mask_base + offset);
L
Linus Torvalds 已提交
108 109 110
		break;
	}
	default:
111
		BUG();
L
Linus Torvalds 已提交
112 113
		break;
	}
114
	entry->msi_attrib.masked = !!flag;
L
Linus Torvalds 已提交
115 116
}

117
void read_msi_msg(unsigned int irq, struct msi_msg *msg)
L
Linus Torvalds 已提交
118
{
119
	struct msi_desc *entry = get_irq_msi(irq);
120 121 122 123 124 125 126 127 128 129 130 131 132 133 134
	switch(entry->msi_attrib.type) {
	case PCI_CAP_ID_MSI:
	{
		struct pci_dev *dev = entry->dev;
		int pos = entry->msi_attrib.pos;
		u16 data;

		pci_read_config_dword(dev, msi_lower_address_reg(pos),
					&msg->address_lo);
		if (entry->msi_attrib.is_64) {
			pci_read_config_dword(dev, msi_upper_address_reg(pos),
						&msg->address_hi);
			pci_read_config_word(dev, msi_data_reg(pos, 1), &data);
		} else {
			msg->address_hi = 0;
135
			pci_read_config_word(dev, msi_data_reg(pos, 0), &data);
136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154
		}
		msg->data = data;
		break;
	}
	case PCI_CAP_ID_MSIX:
	{
		void __iomem *base;
		base = entry->mask_base +
			entry->msi_attrib.entry_nr * PCI_MSIX_ENTRY_SIZE;

		msg->address_lo = readl(base + PCI_MSIX_ENTRY_LOWER_ADDR_OFFSET);
		msg->address_hi = readl(base + PCI_MSIX_ENTRY_UPPER_ADDR_OFFSET);
		msg->data = readl(base + PCI_MSIX_ENTRY_DATA_OFFSET);
 		break;
 	}
 	default:
		BUG();
	}
}
L
Linus Torvalds 已提交
155

156
void write_msi_msg(unsigned int irq, struct msi_msg *msg)
157
{
158
	struct msi_desc *entry = get_irq_msi(irq);
L
Linus Torvalds 已提交
159 160 161
	switch (entry->msi_attrib.type) {
	case PCI_CAP_ID_MSI:
	{
162 163 164 165 166 167 168 169 170 171 172 173 174 175
		struct pci_dev *dev = entry->dev;
		int pos = entry->msi_attrib.pos;

		pci_write_config_dword(dev, msi_lower_address_reg(pos),
					msg->address_lo);
		if (entry->msi_attrib.is_64) {
			pci_write_config_dword(dev, msi_upper_address_reg(pos),
						msg->address_hi);
			pci_write_config_word(dev, msi_data_reg(pos, 1),
						msg->data);
		} else {
			pci_write_config_word(dev, msi_data_reg(pos, 0),
						msg->data);
		}
L
Linus Torvalds 已提交
176 177 178 179
		break;
	}
	case PCI_CAP_ID_MSIX:
	{
180 181 182 183 184 185 186 187 188
		void __iomem *base;
		base = entry->mask_base +
			entry->msi_attrib.entry_nr * PCI_MSIX_ENTRY_SIZE;

		writel(msg->address_lo,
			base + PCI_MSIX_ENTRY_LOWER_ADDR_OFFSET);
		writel(msg->address_hi,
			base + PCI_MSIX_ENTRY_UPPER_ADDR_OFFSET);
		writel(msg->data, base + PCI_MSIX_ENTRY_DATA_OFFSET);
L
Linus Torvalds 已提交
189 190 191
		break;
	}
	default:
192
		BUG();
L
Linus Torvalds 已提交
193
	}
194
	entry->msg = *msg;
L
Linus Torvalds 已提交
195
}
196

197
/*
 * Mask the MSI/MSI-X vector behind @irq, then call msix_flush_writes()
 * for the same irq.
 */
void mask_msi_irq(unsigned int irq)
{
	msi_set_mask_bit(irq, 1);
	msix_flush_writes(irq);
}

203
/*
 * Unmask the MSI/MSI-X vector behind @irq, then call msix_flush_writes()
 * for the same irq.
 */
void unmask_msi_irq(unsigned int irq)
{
	msi_set_mask_bit(irq, 0);
	msix_flush_writes(irq);
}

209
static int msi_free_irqs(struct pci_dev* dev);
S
Satoru Takeuchi 已提交
210

L
Linus Torvalds 已提交
211 212 213 214 215

static struct msi_desc* alloc_msi_entry(void)
{
	struct msi_desc *entry;

M
Michael Ellerman 已提交
216
	entry = kzalloc(sizeof(struct msi_desc), GFP_KERNEL);
L
Linus Torvalds 已提交
217 218 219
	if (!entry)
		return NULL;

220 221
	INIT_LIST_HEAD(&entry->list);
	entry->irq = 0;
L
Linus Torvalds 已提交
222 223 224 225 226
	entry->dev = NULL;

	return entry;
}

227 228 229 230 231 232
/*
 * Forward to pci_intx(@dev, @enable) unless the device carries the
 * PCI_DEV_FLAGS_MSI_INTX_DISABLE_BUG flag, in which case INTx is left
 * untouched.
 */
static void pci_intx_for_msi(struct pci_dev *dev, int enable)
{
	if (dev->dev_flags & PCI_DEV_FLAGS_MSI_INTX_DISABLE_BUG)
		return;

	pci_intx(dev, enable);
}

233
static void __pci_restore_msi_state(struct pci_dev *dev)
234
{
235
	int pos;
236
	u16 control;
237
	struct msi_desc *entry;
238

239 240 241
	if (!dev->msi_enabled)
		return;

242 243
	entry = get_irq_msi(dev->irq);
	pos = entry->msi_attrib.pos;
244

245
	pci_intx_for_msi(dev, 0);
246
	msi_set_enable(dev, 0);
247 248 249 250 251 252 253 254
	write_msi_msg(dev->irq, &entry->msg);
	if (entry->msi_attrib.maskbit)
		msi_set_mask_bit(dev->irq, entry->msi_attrib.masked);

	pci_read_config_word(dev, pos + PCI_MSI_FLAGS, &control);
	control &= ~(PCI_MSI_FLAGS_QSIZE | PCI_MSI_FLAGS_ENABLE);
	if (entry->msi_attrib.maskbit || !entry->msi_attrib.masked)
		control |= PCI_MSI_FLAGS_ENABLE;
255
	pci_write_config_word(dev, pos + PCI_MSI_FLAGS, control);
256 257 258
}

static void __pci_restore_msix_state(struct pci_dev *dev)
259 260 261
{
	int pos;
	struct msi_desc *entry;
262
	u16 control;
263

E
Eric W. Biederman 已提交
264 265 266
	if (!dev->msix_enabled)
		return;

267
	/* route the table */
268
	pci_intx_for_msi(dev, 0);
269
	msix_set_enable(dev, 0);
270

271 272 273
	list_for_each_entry(entry, &dev->msi_list, list) {
		write_msi_msg(entry->irq, &entry->msg);
		msi_set_mask_bit(entry->irq, entry->msi_attrib.masked);
274 275
	}

276 277
	BUG_ON(list_empty(&dev->msi_list));
	entry = list_entry(dev->msi_list.next, struct msi_desc, list);
278
	pos = entry->msi_attrib.pos;
279 280 281 282
	pci_read_config_word(dev, pos + PCI_MSIX_FLAGS, &control);
	control &= ~PCI_MSIX_FLAGS_MASKALL;
	control |= PCI_MSIX_FLAGS_ENABLE;
	pci_write_config_word(dev, pos + PCI_MSIX_FLAGS, control);
283
}
284 285 286 287 288 289

/*
 * Restore both the MSI and the MSI-X state of @dev.  Each helper returns
 * early when its interrupt mode is not enabled on the device.
 */
void pci_restore_msi_state(struct pci_dev *dev)
{
	__pci_restore_msi_state(dev);
	__pci_restore_msix_state(dev);
}
EXPORT_SYMBOL_GPL(pci_restore_msi_state);
291

L
Linus Torvalds 已提交
292 293 294 295
/**
 * msi_capability_init - configure device's MSI capability structure
 * @dev: pointer to the pci_dev data structure of MSI device function
 *
296
 * Setup the MSI capability structure of device function with a single
297
 * MSI irq, regardless of device function is capable of handling
L
Linus Torvalds 已提交
298
 * multiple messages. A return of zero indicates the successful setup
299
 * of an entry zero with the new MSI irq or non-zero for otherwise.
L
Linus Torvalds 已提交
300 301 302 303
 **/
static int msi_capability_init(struct pci_dev *dev)
{
	struct msi_desc *entry;
304
	int pos, ret;
L
Linus Torvalds 已提交
305 306
	u16 control;

307 308
	msi_set_enable(dev, 0);	/* Ensure msi is disabled as I set it up */

L
Linus Torvalds 已提交
309 310 311
   	pos = pci_find_capability(dev, PCI_CAP_ID_MSI);
	pci_read_config_word(dev, msi_control_reg(pos), &control);
	/* MSI Entry Initialization */
312 313 314
	entry = alloc_msi_entry();
	if (!entry)
		return -ENOMEM;
315

L
Linus Torvalds 已提交
316
	entry->msi_attrib.type = PCI_CAP_ID_MSI;
317
	entry->msi_attrib.is_64 = is_64bit_address(control);
L
Linus Torvalds 已提交
318 319
	entry->msi_attrib.entry_nr = 0;
	entry->msi_attrib.maskbit = is_mask_bit_support(control);
320
	entry->msi_attrib.masked = 1;
321
	entry->msi_attrib.default_irq = dev->irq;	/* Save IOAPIC IRQ */
322
	entry->msi_attrib.pos = pos;
L
Linus Torvalds 已提交
323 324 325 326
	if (is_mask_bit_support(control)) {
		entry->mask_base = (void __iomem *)(long)msi_mask_bits_reg(pos,
				is_64bit_address(control));
	}
327 328 329 330 331 332 333 334 335 336 337 338 339 340
	entry->dev = dev;
	if (entry->msi_attrib.maskbit) {
		unsigned int maskbits, temp;
		/* All MSIs are unmasked by default, Mask them all */
		pci_read_config_dword(dev,
			msi_mask_bits_reg(pos, is_64bit_address(control)),
			&maskbits);
		temp = (1 << multi_msi_capable(control));
		temp = ((temp - 1) & ~temp);
		maskbits |= temp;
		pci_write_config_dword(dev,
			msi_mask_bits_reg(pos, is_64bit_address(control)),
			maskbits);
	}
341
	list_add_tail(&entry->list, &dev->msi_list);
342

L
Linus Torvalds 已提交
343
	/* Configure MSI capability structure */
344
	ret = arch_setup_msi_irqs(dev, 1, PCI_CAP_ID_MSI);
345
	if (ret) {
346
		msi_free_irqs(dev);
347
		return ret;
348
	}
349

L
Linus Torvalds 已提交
350
	/* Set MSI enabled bits	 */
351
	pci_intx_for_msi(dev, 0);
352 353
	msi_set_enable(dev, 1);
	dev->msi_enabled = 1;
L
Linus Torvalds 已提交
354

355
	dev->irq = entry->irq;
L
Linus Torvalds 已提交
356 357 358 359 360 361
	return 0;
}

/**
 * msix_capability_init - configure device's MSI-X capability
 * @dev: pointer to the pci_dev data structure of MSI-X device function
R
Randy Dunlap 已提交
362 363
 * @entries: pointer to an array of struct msix_entry entries
 * @nvec: number of @entries
L
Linus Torvalds 已提交
364
 *
365
 * Setup the MSI-X capability structure of device function with a
366 367
 * single MSI-X irq. A return of zero indicates the successful setup of
 * requested MSI-X entries with allocated irqs or non-zero for otherwise.
L
Linus Torvalds 已提交
368 369 370 371
 **/
static int msix_capability_init(struct pci_dev *dev,
				struct msix_entry *entries, int nvec)
{
372
	struct msi_desc *entry;
373
	int pos, i, j, nr_entries, ret;
374 375
	unsigned long phys_addr;
	u32 table_offset;
L
Linus Torvalds 已提交
376 377 378 379
 	u16 control;
	u8 bir;
	void __iomem *base;

380 381
	msix_set_enable(dev, 0);/* Ensure msix is disabled as I set it up */

L
Linus Torvalds 已提交
382 383 384 385
   	pos = pci_find_capability(dev, PCI_CAP_ID_MSIX);
	/* Request & Map MSI-X table region */
 	pci_read_config_word(dev, msi_control_reg(pos), &control);
	nr_entries = multi_msix_capable(control);
386 387

 	pci_read_config_dword(dev, msix_table_offset_reg(pos), &table_offset);
L
Linus Torvalds 已提交
388
	bir = (u8)(table_offset & PCI_MSIX_FLAGS_BIRMASK);
389 390
	table_offset &= ~PCI_MSIX_FLAGS_BIRMASK;
	phys_addr = pci_resource_start (dev, bir) + table_offset;
L
Linus Torvalds 已提交
391 392 393 394 395 396
	base = ioremap_nocache(phys_addr, nr_entries * PCI_MSIX_ENTRY_SIZE);
	if (base == NULL)
		return -ENOMEM;

	/* MSI-X Table Initialization */
	for (i = 0; i < nvec; i++) {
397 398
		entry = alloc_msi_entry();
		if (!entry)
L
Linus Torvalds 已提交
399 400 401 402
			break;

 		j = entries[i].entry;
		entry->msi_attrib.type = PCI_CAP_ID_MSIX;
403
		entry->msi_attrib.is_64 = 1;
L
Linus Torvalds 已提交
404 405
		entry->msi_attrib.entry_nr = j;
		entry->msi_attrib.maskbit = 1;
406
		entry->msi_attrib.masked = 1;
407
		entry->msi_attrib.default_irq = dev->irq;
408
		entry->msi_attrib.pos = pos;
L
Linus Torvalds 已提交
409 410
		entry->dev = dev;
		entry->mask_base = base;
411

412
		list_add_tail(&entry->list, &dev->msi_list);
L
Linus Torvalds 已提交
413
	}
414 415 416 417 418 419 420 421

	ret = arch_setup_msi_irqs(dev, nvec, PCI_CAP_ID_MSIX);
	if (ret) {
		int avail = 0;
		list_for_each_entry(entry, &dev->msi_list, list) {
			if (entry->irq != 0) {
				avail++;
			}
L
Linus Torvalds 已提交
422
		}
423

424 425
		msi_free_irqs(dev);

426 427 428
		/* If we had some success report the number of irqs
		 * we succeeded in setting up.
		 */
429 430
		if (avail == 0)
			avail = ret;
431
		return avail;
L
Linus Torvalds 已提交
432
	}
433 434 435 436 437 438 439

	i = 0;
	list_for_each_entry(entry, &dev->msi_list, list) {
		entries[i].vector = entry->irq;
		set_irq_msi(entry->irq, entry);
		i++;
	}
L
Linus Torvalds 已提交
440
	/* Set MSI-X enabled bits */
441
	pci_intx_for_msi(dev, 0);
442 443
	msix_set_enable(dev, 1);
	dev->msix_enabled = 1;
L
Linus Torvalds 已提交
444 445 446 447

	return 0;
}

448
/**
449
 * pci_msi_check_device - check whether MSI may be enabled on a device
450
 * @dev: pointer to the pci_dev data structure of MSI device function
451
 * @nvec: how many MSIs have been requested ?
452
 * @type: are we checking for MSI or MSI-X ?
453
 *
454
 * Look at global flags, the device itself, and its parent busses
455 456
 * to determine if MSI/-X are supported for the device. If MSI/-X is
 * supported return 0, else return an error code.
457
 **/
458
static int pci_msi_check_device(struct pci_dev* dev, int nvec, int type)
459 460
{
	struct pci_bus *bus;
461
	int ret;
462

463
	/* MSI must be globally enabled and supported by the device */
464 465 466
	if (!pci_msi_enable || !dev || dev->no_msi)
		return -EINVAL;

467 468 469 470 471 472 473 474
	/*
	 * You can't ask to have 0 or less MSIs configured.
	 *  a) it's stupid ..
	 *  b) the list manipulation code assumes nvec >= 1.
	 */
	if (nvec < 1)
		return -ERANGE;

475 476 477 478 479 480
	/* Any bridge which does NOT route MSI transactions from it's
	 * secondary bus to it's primary bus must set NO_MSI flag on
	 * the secondary pci_bus.
	 * We expect only arch-specific PCI host bus controller driver
	 * or quirks for specific PCI bridges to be setting NO_MSI.
	 */
481 482 483 484
	for (bus = dev->bus; bus; bus = bus->parent)
		if (bus->bus_flags & PCI_BUS_FLAGS_NO_MSI)
			return -EINVAL;

485 486 487 488
	ret = arch_msi_check_device(dev, nvec, type);
	if (ret)
		return ret;

489 490 491
	if (!pci_find_capability(dev, type))
		return -EINVAL;

492 493 494
	return 0;
}

L
Linus Torvalds 已提交
495 496 497 498 499
/**
 * pci_enable_msi - configure device's MSI capability structure
 * @dev: pointer to the pci_dev data structure of MSI device function
 *
 * Setup the MSI capability structure of device function with
500
 * a single MSI irq upon its software driver call to request for
L
Linus Torvalds 已提交
501 502
 * MSI mode enabled on its hardware device function. A return of zero
 * indicates the successful setup of an entry zero with the new MSI
503
 * irq or non-zero for otherwise.
L
Linus Torvalds 已提交
504 505 506
 **/
int pci_enable_msi(struct pci_dev* dev)
{
507
	int status;
L
Linus Torvalds 已提交
508

509 510 511
	status = pci_msi_check_device(dev, 1, PCI_CAP_ID_MSI);
	if (status)
		return status;
L
Linus Torvalds 已提交
512

E
Eric W. Biederman 已提交
513
	WARN_ON(!!dev->msi_enabled);
L
Linus Torvalds 已提交
514

515
	/* Check whether driver already requested for MSI-X irqs */
516 517 518 519 520
	if (dev->msix_enabled) {
		printk(KERN_INFO "PCI: %s: Can't enable MSI.  "
			"Device already has MSI-X enabled\n",
			pci_name(dev));
		return -EINVAL;
L
Linus Torvalds 已提交
521 522 523 524
	}
	status = msi_capability_init(dev);
	return status;
}
525
EXPORT_SYMBOL(pci_enable_msi);
L
Linus Torvalds 已提交
526 527 528 529

void pci_disable_msi(struct pci_dev* dev)
{
	struct msi_desc *entry;
530
	int default_irq;
L
Linus Torvalds 已提交
531

532
	if (!pci_msi_enable || !dev || !dev->msi_enabled)
E
Eric W. Biederman 已提交
533 534
		return;

535
	msi_set_enable(dev, 0);
536
	pci_intx_for_msi(dev, 1);
537
	dev->msi_enabled = 0;
538

539 540 541
	BUG_ON(list_empty(&dev->msi_list));
	entry = list_entry(dev->msi_list.next, struct msi_desc, list);
	if (!entry->dev || entry->msi_attrib.type != PCI_CAP_ID_MSI) {
L
Linus Torvalds 已提交
542 543
		return;
	}
544 545

	default_irq = entry->msi_attrib.default_irq;
546
	msi_free_irqs(dev);
547 548 549

	/* Restore dev->irq to its default pin-assertion irq */
	dev->irq = default_irq;
L
Linus Torvalds 已提交
550
}
551
EXPORT_SYMBOL(pci_disable_msi);
L
Linus Torvalds 已提交
552

553
static int msi_free_irqs(struct pci_dev* dev)
L
Linus Torvalds 已提交
554
{
555
	struct msi_desc *entry, *tmp;
M
Michael Ellerman 已提交
556

557 558 559 560
	list_for_each_entry(entry, &dev->msi_list, list) {
		if (entry->irq)
			BUG_ON(irq_has_action(entry->irq));
	}
L
Linus Torvalds 已提交
561

562
	arch_teardown_msi_irqs(dev);
L
Linus Torvalds 已提交
563

564 565 566 567 568
	list_for_each_entry_safe(entry, tmp, &dev->msi_list, list) {
		if (entry->msi_attrib.type == PCI_CAP_ID_MSIX) {
			writel(1, entry->mask_base + entry->msi_attrib.entry_nr
				  * PCI_MSIX_ENTRY_SIZE
				  + PCI_MSIX_ENTRY_VECTOR_CTRL_OFFSET);
569 570 571

			if (list_is_last(&entry->list, &dev->msi_list))
				iounmap(entry->mask_base);
572 573 574
		}
		list_del(&entry->list);
		kfree(entry);
L
Linus Torvalds 已提交
575 576 577 578 579 580 581 582
	}

	return 0;
}

/**
 * pci_enable_msix - configure device's MSI-X capability structure
 * @dev: pointer to the pci_dev data structure of MSI-X device function
583
 * @entries: pointer to an array of MSI-X entries
584
 * @nvec: number of MSI-X irqs requested for allocation by device driver
L
Linus Torvalds 已提交
585 586
 *
 * Setup the MSI-X capability structure of device function with the number
587
 * of requested irqs upon its software driver call to request for
L
Linus Torvalds 已提交
588 589
 * MSI-X mode enabled on its hardware device function. A return of zero
 * indicates the successful configuration of MSI-X capability structure
590
 * with new allocated MSI-X irqs. A return of < 0 indicates a failure.
L
Linus Torvalds 已提交
591
 * Or a return of > 0 indicates that driver request is exceeding the number
592
 * of irqs available. Driver should use the returned value to re-send
L
Linus Torvalds 已提交
593 594 595 596
 * its request.
 **/
int pci_enable_msix(struct pci_dev* dev, struct msix_entry *entries, int nvec)
{
597
	int status, pos, nr_entries;
E
Eric W. Biederman 已提交
598
	int i, j;
L
Linus Torvalds 已提交
599 600
	u16 control;

601
	if (!entries)
L
Linus Torvalds 已提交
602 603
 		return -EINVAL;

604 605 606 607
	status = pci_msi_check_device(dev, nvec, PCI_CAP_ID_MSIX);
	if (status)
		return status;

608
	pos = pci_find_capability(dev, PCI_CAP_ID_MSIX);
L
Linus Torvalds 已提交
609 610 611 612 613 614 615 616 617 618 619 620 621 622
	pci_read_config_word(dev, msi_control_reg(pos), &control);
	nr_entries = multi_msix_capable(control);
	if (nvec > nr_entries)
		return -EINVAL;

	/* Check for any invalid entries */
	for (i = 0; i < nvec; i++) {
		if (entries[i].entry >= nr_entries)
			return -EINVAL;		/* invalid entry */
		for (j = i + 1; j < nvec; j++) {
			if (entries[i].entry == entries[j].entry)
				return -EINVAL;	/* duplicate entry */
		}
	}
E
Eric W. Biederman 已提交
623
	WARN_ON(!!dev->msix_enabled);
624

625
	/* Check whether driver already requested for MSI irq */
626
   	if (dev->msi_enabled) {
L
Linus Torvalds 已提交
627
		printk(KERN_INFO "PCI: %s: Can't enable MSI-X.  "
628
		       "Device already has an MSI irq assigned\n",
L
Linus Torvalds 已提交
629 630 631 632 633 634
		       pci_name(dev));
		return -EINVAL;
	}
	status = msix_capability_init(dev, entries, nvec);
	return status;
}
635
EXPORT_SYMBOL(pci_enable_msix);
L
Linus Torvalds 已提交
636

637
/*
 * Release every MSI-X descriptor of @dev.  Thin wrapper around
 * msi_free_irqs() that discards its return value.
 */
static void msix_free_all_irqs(struct pci_dev *dev)
{
	msi_free_irqs(dev);
}

void pci_disable_msix(struct pci_dev* dev)
{
644
	if (!pci_msi_enable || !dev || !dev->msix_enabled)
E
Eric W. Biederman 已提交
645 646
		return;

647
	msix_set_enable(dev, 0);
648
	pci_intx_for_msi(dev, 1);
649
	dev->msix_enabled = 0;
650

651
	msix_free_all_irqs(dev);
L
Linus Torvalds 已提交
652
}
653
EXPORT_SYMBOL(pci_disable_msix);
L
Linus Torvalds 已提交
654 655

/**
656
 * msi_remove_pci_irq_vectors - reclaim MSI(X) irqs to unused state
L
Linus Torvalds 已提交
657 658
 * @dev: pointer to the pci_dev data structure of MSI(X) device function
 *
659
 * Being called during hotplug remove, from which the device function
660
 * is hot-removed. All previous assigned MSI/MSI-X irqs, if
L
Linus Torvalds 已提交
661 662 663 664 665 666 667 668
 * allocated for this device function, are reclaimed to unused state,
 * which may be used later on.
 **/
void msi_remove_pci_irq_vectors(struct pci_dev* dev)
{
	if (!pci_msi_enable || !dev)
 		return;

669 670
	if (dev->msi_enabled)
		msi_free_irqs(dev);
L
Linus Torvalds 已提交
671

672 673
	if (dev->msix_enabled)
		msix_free_all_irqs(dev);
L
Linus Torvalds 已提交
674 675
}

676 677 678 679
/*
 * Clear the file-scope pci_msi_enable flag.  Afterwards
 * pci_msi_check_device() rejects every request with -EINVAL and the
 * disable/remove entry points return without doing anything.
 */
void pci_no_msi(void)
{
	pci_msi_enable = 0;
}
680

681 682 683 684 685
/* Initialise @dev's msi_list as an empty list of MSI descriptors. */
void pci_msi_init_pci_dev(struct pci_dev *dev)
{
	INIT_LIST_HEAD(&dev->msi_list);
}

686 687 688 689 690 691 692 693 694

/* Arch hooks */

/*
 * Weak default: accept every device, vector count and type by returning
 * 0.  Being weak, it is replaced by any non-weak definition of the same
 * symbol at link time.
 */
int __attribute__ ((weak))
arch_msi_check_device(struct pci_dev* dev, int nvec, int type)
{
	return 0;
}

695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714
/*
 * Weak default for setting up one descriptor: does nothing and reports
 * success (0).  NOTE(review): architectures with real MSI support are
 * presumably expected to override this - confirm against arch code.
 */
int __attribute__ ((weak))
arch_setup_msi_irq(struct pci_dev *dev, struct msi_desc *entry)
{
	return 0;
}

/*
 * Weak default: call arch_setup_msi_irq() for each descriptor on @dev's
 * msi_list, stopping at the first failure.  Returns 0 when every call
 * succeeded, otherwise the first non-zero return value.  @nvec and @type
 * are not used by this default implementation.
 */
int __attribute__ ((weak))
arch_setup_msi_irqs(struct pci_dev *dev, int nvec, int type)
{
	struct msi_desc *desc;
	int rc = 0;

	list_for_each_entry(desc, &dev->msi_list, list) {
		rc = arch_setup_msi_irq(dev, desc);
		if (rc)
			break;
	}

	return rc;
}
715 716 717 718 719 720 721 722 723 724 725 726 727 728 729 730

/* Weak default for tearing down one irq: intentionally does nothing. */
void __attribute__ ((weak)) arch_teardown_msi_irq(unsigned int irq)
{
}

/*
 * Weak default: call arch_teardown_msi_irq() for every descriptor on
 * @dev's msi_list that has a non-zero irq.
 */
void __attribute__ ((weak))
arch_teardown_msi_irqs(struct pci_dev *dev)
{
	struct msi_desc *desc;

	list_for_each_entry(desc, &dev->msi_list, list) {
		if (desc->irq == 0)
			continue;
		arch_teardown_msi_irq(desc->irq);
	}
}