portdrv_core.c 15.0 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 * File:	portdrv_core.c
 * Purpose:	PCI Express Port Bus Driver's Core Functions
 *
 * Copyright (C) 2004 Intel
 * Copyright (C) Tom Long Nguyen (tom.l.nguyen@intel.com)
 */

#include <linux/module.h>
#include <linux/pci.h>
#include <linux/kernel.h>
#include <linux/errno.h>
#include <linux/pm.h>
14
#include <linux/pm_runtime.h>
T
Tim Schmielau 已提交
15 16
#include <linux/string.h>
#include <linux/slab.h>
L
Linus Torvalds 已提交
17
#include <linux/pcieport_if.h>
18
#include <linux/aer.h>
L
Linus Torvalds 已提交
19

20
#include "../pci.h"
L
Linus Torvalds 已提交
21 22
#include "portdrv.h"

23 24 25 26 27 28 29 30 31 32 33
bool pciehp_msi_disabled;

/*
 * Handler for the "pcie_hp=" kernel command-line option.  A value that
 * begins with "nomsi" sets pciehp_msi_disabled; any other value is
 * ignored.  Always returns 1.
 */
static int __init pciehp_setup(char *str)
{
	if (strncmp(str, "nomsi", 5) == 0)
		pciehp_msi_disabled = true;

	return 1;
}
__setup("pcie_hp=", pciehp_setup);

34 35 36 37 38 39
/**
 * release_pcie_device - free PCI Express port service device structure
 * @dev: Port service device to release
 *
 * Installed as the ->release() callback of every port service device, so
 * it runs in response to device_unregister(dev).  Frees the pcie_device
 * that embeds @dev.
 */
static void release_pcie_device(struct device *dev)
{
	struct pcie_device *pcie = to_pcie_device(dev);

	kfree(pcie);
}

46
/**
47 48
 * pcie_port_enable_irq_vec - try to set up MSI-X or MSI as interrupt mode
 * for given port
49
 * @dev: PCI Express port to handle
50
 * @irqs: Array of interrupt vectors to populate
51 52 53 54
 * @mask: Bitmask of port capabilities returned by get_port_device_capability()
 *
 * Return value: 0 on success, error code on failure
 */
55
static int pcie_port_enable_irq_vec(struct pci_dev *dev, int *irqs, int mask)
56
{
57
	int nr_entries, entry, nvec = 0;
58 59 60 61 62 63 64

	/*
	 * Allocate as many entries as the port wants, so that we can check
	 * which of them will be useful.  Moreover, if nr_entries is correctly
	 * equal to the number of entries this port actually uses, we'll happily
	 * go through without any tricks.
	 */
65 66
	nr_entries = pci_alloc_irq_vectors(dev, 1, PCIE_PORT_MAX_MSI_ENTRIES,
			PCI_IRQ_MSIX | PCI_IRQ_MSI);
67 68
	if (nr_entries < 0)
		return nr_entries;
69 70

	if (mask & (PCIE_PORT_SERVICE_PME | PCIE_PORT_SERVICE_HP)) {
71
		u16 reg16;
72 73

		/*
74 75 76 77 78 79 80 81 82 83 84 85 86
		 * Per PCIe r3.1, sec 6.1.6, "PME and Hot-Plug Event
		 * interrupts (when both are implemented) always share the
		 * same MSI or MSI-X vector, as indicated by the Interrupt
		 * Message Number field in the PCI Express Capabilities
		 * register".
		 *
		 * Per sec 7.8.2, "For MSI, the [Interrupt Message Number]
		 * indicates the offset between the base Message Data and
		 * the interrupt message that is generated."
		 *
		 * "For MSI-X, the [Interrupt Message Number] indicates
		 * which MSI-X Table entry is used to generate the
		 * interrupt message."
87
		 */
88
		pcie_capability_read_word(dev, PCI_EXP_FLAGS, &reg16);
89
		entry = (reg16 & PCI_EXP_FLAGS_IRQ) >> 9;
90
		if (entry >= nr_entries)
91
			goto out_free_irqs;
92

93 94
		irqs[PCIE_PORT_SERVICE_PME_SHIFT] = pci_irq_vector(dev, entry);
		irqs[PCIE_PORT_SERVICE_HP_SHIFT] = pci_irq_vector(dev, entry);
95

96
		nvec = max(nvec, entry + 1);
97 98 99
	}

	if (mask & PCIE_PORT_SERVICE_AER) {
100
		u32 reg32, pos;
101 102

		/*
103 104 105 106 107 108 109 110 111 112 113
		 * Per PCIe r3.1, sec 7.10.10, the Advanced Error Interrupt
		 * Message Number in the Root Error Status register
		 * indicates which MSI/MSI-X vector is used for AER.
		 *
		 * "For MSI, the [Advanced Error Interrupt Message Number]
		 * indicates the offset between the base Message Data and
		 * the interrupt message that is generated."
		 *
		 * "For MSI-X, the [Advanced Error Interrupt Message
		 * Number] indicates which MSI-X Table entry is used to
		 * generate the interrupt message."
114 115 116 117 118
		 */
		pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_ERR);
		pci_read_config_dword(dev, pos + PCI_ERR_ROOT_STATUS, &reg32);
		entry = reg32 >> 27;
		if (entry >= nr_entries)
119
			goto out_free_irqs;
120

121
		irqs[PCIE_PORT_SERVICE_AER_SHIFT] = pci_irq_vector(dev, entry);
122

123
		nvec = max(nvec, entry + 1);
124 125
	}

126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152
	if (mask & PCIE_PORT_SERVICE_DPC) {
		u16 reg16, pos;

		/*
		 * Per PCIe r4.0 (v0.9), sec 7.9.15.2, the DPC Interrupt
		 * Message Number in the DPC Capability register indicates
		 * which MSI/MSI-X vector is used for DPC.
		 *
		 * "For MSI, the [DPC Interrupt Message Number] indicates
		 * the offset between the base Message Data and the
		 * interrupt message that is generated."
		 *
		 * "For MSI-X, the [DPC Interrupt Message Number] indicates
		 * which MSI-X Table entry is used to generate the
		 * interrupt message."
		 */
		pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_DPC);
		pci_read_config_word(dev, pos + PCI_EXP_DPC_CAP, &reg16);
		entry = reg16 & 0x1f;
		if (entry >= nr_entries)
			goto out_free_irqs;

		irqs[PCIE_PORT_SERVICE_DPC_SHIFT] = pci_irq_vector(dev, entry);

		nvec = max(nvec, entry + 1);
	}

153 154 155 156 157
	/*
	 * If nvec is equal to the allocated number of entries, we can just use
	 * what we have.  Otherwise, the port has some extra entries not for the
	 * services we know and we need to work around that.
	 */
158
	if (nvec != nr_entries) {
159
		/* Drop the temporary MSI-X setup */
160
		pci_free_irq_vectors(dev);
161 162

		/* Now allocate the MSI-X vectors for real */
163
		nr_entries = pci_alloc_irq_vectors(dev, nvec, nvec,
164
				PCI_IRQ_MSIX | PCI_IRQ_MSI);
165 166
		if (nr_entries < 0)
			return nr_entries;
167 168
	}

169
	return 0;
170

171 172 173
out_free_irqs:
	pci_free_irq_vectors(dev);
	return -EIO;
174 175
}

176
/**
177
 * pcie_init_service_irqs - initialize irqs for PCI Express port services
178
 * @dev: PCI Express port to handle
179
 * @irqs: Array of irqs to populate
180 181 182 183
 * @mask: Bitmask of port capabilities returned by get_port_device_capability()
 *
 * Return value: Interrupt mode associated with the port
 */
184
static int pcie_init_service_irqs(struct pci_dev *dev, int *irqs, int mask)
L
Linus Torvalds 已提交
185
{
186 187 188 189
	int ret, i;

	for (i = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++)
		irqs[i] = -1;
190

191
	/*
192 193 194
	 * If we support PME or hotplug, but we can't use MSI/MSI-X for
	 * them, we have to fall back to INTx or other interrupts, e.g., a
	 * system shared interrupt.
195
	 */
196 197 198 199 200 201 202 203 204
	if ((mask & PCIE_PORT_SERVICE_PME) && pcie_pme_no_msi())
		goto legacy_irq;

	if ((mask & PCIE_PORT_SERVICE_HP) && pciehp_no_msi())
		goto legacy_irq;

	/* Try to use MSI-X or MSI if supported */
	if (pcie_port_enable_irq_vec(dev, irqs, mask) == 0)
		return 0;
205

206 207 208
legacy_irq:
	/* fall back to legacy IRQ */
	ret = pci_alloc_irq_vectors(dev, 1, 1, PCI_IRQ_LEGACY);
209 210
	if (ret < 0)
		return -ENODEV;
211

212 213 214 215
	for (i = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++) {
		if (i != PCIE_PORT_SERVICE_VC_SHIFT)
			irqs[i] = pci_irq_vector(dev, 0);
	}
L
Linus Torvalds 已提交
216

217
	return 0;
L
Linus Torvalds 已提交
218 219
}

220 221 222 223 224 225 226 227 228 229
/**
 * get_port_device_capability - discover capabilities of a PCI Express port
 * @dev: PCI Express port to examine
 *
 * The capabilities are read from the port's PCI Express configuration registers
 * as described in PCI Express Base Specification 1.0a sections 7.8.2, 7.8.9 and
 * 7.9 - 7.11.
 *
 * Return value: Bitmask of discovered port capabilities
 */
L
Linus Torvalds 已提交
230 231
static int get_port_device_capability(struct pci_dev *dev)
{
232
	int services = 0;
233
	int cap_mask = 0;
234

235 236 237
	if (pcie_ports_disabled)
		return 0;

238
	cap_mask = PCIE_PORT_SERVICE_PME | PCIE_PORT_SERVICE_HP
239
			| PCIE_PORT_SERVICE_VC | PCIE_PORT_SERVICE_DPC;
240 241 242
	if (pci_aer_available())
		cap_mask |= PCIE_PORT_SERVICE_AER;

243 244
	if (pcie_ports_auto)
		pcie_port_platform_notify(dev, &cap_mask);
L
Linus Torvalds 已提交
245 246

	/* Hot-Plug Capable */
247 248 249 250 251 252 253 254
	if ((cap_mask & PCIE_PORT_SERVICE_HP) && dev->is_hotplug_bridge) {
		services |= PCIE_PORT_SERVICE_HP;
		/*
		 * Disable hot-plug interrupts in case they have been enabled
		 * by the BIOS and the hot-plug service driver is not loaded.
		 */
		pcie_capability_clear_word(dev, PCI_EXP_SLTCTL,
			  PCI_EXP_SLTCTL_CCIE | PCI_EXP_SLTCTL_HPIE);
255 256
	}
	/* AER capable */
257
	if ((cap_mask & PCIE_PORT_SERVICE_AER)
258
	    && pci_find_ext_capability(dev, PCI_EXT_CAP_ID_ERR)) {
259
		services |= PCIE_PORT_SERVICE_AER;
260 261 262 263 264 265
		/*
		 * Disable AER on this port in case it's been enabled by the
		 * BIOS (the AER service driver will enable it when necessary).
		 */
		pci_disable_pcie_error_reporting(dev);
	}
266
	/* VC support */
267 268
	if (pci_find_ext_capability(dev, PCI_EXT_CAP_ID_VC))
		services |= PCIE_PORT_SERVICE_VC;
269
	/* Root ports are capable of generating PME too */
270
	if ((cap_mask & PCIE_PORT_SERVICE_PME)
271
	    && pci_pcie_type(dev) == PCI_EXP_TYPE_ROOT_PORT) {
272
		services |= PCIE_PORT_SERVICE_PME;
273 274 275 276 277 278 279
		/*
		 * Disable PME interrupt on this port in case it's been enabled
		 * by the BIOS (the PME service driver will enable it when
		 * necessary).
		 */
		pcie_pme_interrupt_enable(dev, false);
	}
280 281
	if (pci_find_ext_capability(dev, PCI_EXT_CAP_ID_DPC))
		services |= PCIE_PORT_SERVICE_DPC;
L
Linus Torvalds 已提交
282 283 284 285

	return services;
}

286
/**
287 288 289
 * pcie_device_init - allocate and initialize PCI Express port service device
 * @pdev: PCI Express port to associate the service device with
 * @service: Type of service to associate with the service device
290 291
 * @irq: Interrupt vector to associate with the service device
 */
292
static int pcie_device_init(struct pci_dev *pdev, int service, int irq)
L
Linus Torvalds 已提交
293
{
294 295
	int retval;
	struct pcie_device *pcie;
L
Linus Torvalds 已提交
296 297
	struct device *device;

298 299 300 301 302 303
	pcie = kzalloc(sizeof(*pcie), GFP_KERNEL);
	if (!pcie)
		return -ENOMEM;
	pcie->port = pdev;
	pcie->irq = irq;
	pcie->service = service;
L
Linus Torvalds 已提交
304 305

	/* Initialize generic device interface */
306
	device = &pcie->device;
L
Linus Torvalds 已提交
307 308
	device->bus = &pcie_port_bus_type;
	device->release = release_pcie_device;	/* callback to free pcie dev */
309
	dev_set_name(device, "%s:pcie%03x",
310
		     pci_name(pdev),
311
		     get_descriptor_id(pci_pcie_type(pdev), service));
312
	device->parent = &pdev->dev;
313
	device_enable_async_suspend(device);
314 315

	retval = device_register(device);
B
Bjorn Helgaas 已提交
316
	if (retval) {
317
		put_device(device);
B
Bjorn Helgaas 已提交
318 319 320
		return retval;
	}

321 322
	pm_runtime_no_callbacks(device);

B
Bjorn Helgaas 已提交
323
	return 0;
L
Linus Torvalds 已提交
324 325
}

326 327 328 329 330 331 332
/**
 * pcie_port_device_register - register PCI Express port
 * @dev: PCI Express port to register
 *
 * Allocate the port extension structure and register services associated with
 * the port.
 */
L
Linus Torvalds 已提交
333 334
int pcie_port_device_register(struct pci_dev *dev)
{
335
	int status, capabilities, i, nr_service;
336
	int irqs[PCIE_PORT_DEVICE_MAXSERVICES];
L
Linus Torvalds 已提交
337

338 339 340
	/* Enable PCI Express port device */
	status = pci_enable_device(dev);
	if (status)
341
		return status;
342 343 344

	/* Get and check PCI Express port services */
	capabilities = get_port_device_capability(dev);
345
	if (!capabilities)
346 347
		return 0;

348
	pci_set_master(dev);
349 350 351
	/*
	 * Initialize service irqs. Don't use service devices that
	 * require interrupts if there is no way to generate them.
352 353 354
	 * However, some drivers may have a polling mode (e.g. pciehp_poll_mode)
	 * that can be used in the absence of irqs.  Allow them to determine
	 * if that is to be used.
355
	 */
356
	status = pcie_init_service_irqs(dev, irqs, capabilities);
357
	if (status) {
358
		capabilities &= PCIE_PORT_SERVICE_VC | PCIE_PORT_SERVICE_HP;
359
		if (!capabilities)
360
			goto error_disable;
361
	}
L
Linus Torvalds 已提交
362 363

	/* Allocate child services if any */
364 365 366
	status = -ENODEV;
	nr_service = 0;
	for (i = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++) {
367 368 369
		int service = 1 << i;
		if (!(capabilities & service))
			continue;
370 371
		if (!pcie_device_init(dev, service, irqs[i]))
			nr_service++;
372
	}
373
	if (!nr_service)
374
		goto error_cleanup_irqs;
375

L
Linus Torvalds 已提交
376
	return 0;
377

378
error_cleanup_irqs:
379
	pci_free_irq_vectors(dev);
380 381
error_disable:
	pci_disable_device(dev);
382
	return status;
L
Linus Torvalds 已提交
383 384 385
}

#ifdef CONFIG_PM
386
static int suspend_iter(struct device *dev, void *data)
L
Linus Torvalds 已提交
387 388
{
	struct pcie_port_service_driver *service_driver;
389

390 391 392 393 394
	if ((dev->bus == &pcie_port_bus_type) && dev->driver) {
		service_driver = to_service_driver(dev->driver);
		if (service_driver->suspend)
			service_driver->suspend(to_pcie_device(dev));
	}
395 396
	return 0;
}
L
Linus Torvalds 已提交
397

398 399 400 401
/**
 * pcie_port_device_suspend - suspend port services associated with a PCIe port
 * @dev: PCI Express port to handle
 */
402
int pcie_port_device_suspend(struct device *dev)
403
{
404
	return device_for_each_child(dev, NULL, suspend_iter);
L
Linus Torvalds 已提交
405 406
}

407 408
static int resume_iter(struct device *dev, void *data)
{
L
Linus Torvalds 已提交
409 410
	struct pcie_port_service_driver *service_driver;

411 412 413 414 415
	if ((dev->bus == &pcie_port_bus_type) &&
	    (dev->driver)) {
		service_driver = to_service_driver(dev->driver);
		if (service_driver->resume)
			service_driver->resume(to_pcie_device(dev));
L
Linus Torvalds 已提交
416
	}
417 418
	return 0;
}
L
Linus Torvalds 已提交
419

420
/**
421
 * pcie_port_device_resume - resume port services associated with a PCIe port
422 423
 * @dev: PCI Express port to handle
 */
424
int pcie_port_device_resume(struct device *dev)
425
{
426
	return device_for_each_child(dev, NULL, resume_iter);
L
Linus Torvalds 已提交
427
}
428
#endif /* PM */
L
Linus Torvalds 已提交
429

430
static int remove_iter(struct device *dev, void *data)
L
Linus Torvalds 已提交
431
{
432
	if (dev->bus == &pcie_port_bus_type)
433
		device_unregister(dev);
434 435 436
	return 0;
}

437 438 439 440 441 442 443
/**
 * pcie_port_device_remove - unregister PCI Express port service devices
 * @dev: PCI Express port the service devices to unregister are associated with
 *
 * Remove PCI Express port service devices associated with given port and
 * disable MSI-X or MSI for the port.
 */
444 445
void pcie_port_device_remove(struct pci_dev *dev)
{
446
	device_for_each_child(&dev->dev, NULL, remove_iter);
447
	pci_free_irq_vectors(dev);
448
	pci_disable_device(dev);
L
Linus Torvalds 已提交
449 450
}

451 452 453 454 455 456 457 458
/**
 * pcie_port_probe_service - probe driver for given PCI Express port service
 * @dev: PCI Express port service device to probe against
 *
 * If PCI Express port service driver is registered with
 * pcie_port_service_register(), this function will be called by the driver core
 * whenever match is found between the driver and a port service device.
 */
459
static int pcie_port_probe_service(struct device *dev)
L
Linus Torvalds 已提交
460
{
461 462 463 464 465 466 467 468 469 470 471 472
	struct pcie_device *pciedev;
	struct pcie_port_service_driver *driver;
	int status;

	if (!dev || !dev->driver)
		return -ENODEV;

	driver = to_service_driver(dev->driver);
	if (!driver || !driver->probe)
		return -ENODEV;

	pciedev = to_pcie_device(dev);
473
	status = driver->probe(pciedev);
B
Bjorn Helgaas 已提交
474 475 476 477 478
	if (status)
		return status;

	get_device(dev);
	return 0;
L
Linus Torvalds 已提交
479 480
}

481 482 483 484 485 486 487 488 489
/**
 * pcie_port_remove_service - detach driver from given PCI Express port service
 * @dev: PCI Express port service device to handle
 *
 * If PCI Express port service driver is registered with
 * pcie_port_service_register(), this function will be called by the driver core
 * when device_unregister() is called for the port service device associated
 * with the driver.
 */
490
static int pcie_port_remove_service(struct device *dev)
L
Linus Torvalds 已提交
491
{
492 493 494 495 496 497 498 499 500 501 502 503 504
	struct pcie_device *pciedev;
	struct pcie_port_service_driver *driver;

	if (!dev || !dev->driver)
		return 0;

	pciedev = to_pcie_device(dev);
	driver = to_service_driver(dev->driver);
	if (driver && driver->remove) {
		driver->remove(pciedev);
		put_device(dev);
	}
	return 0;
L
Linus Torvalds 已提交
505 506
}

507 508 509 510 511 512 513 514 515
/**
 * pcie_port_shutdown_service - shut down given PCI Express port service
 * @dev: PCI Express port service device to handle
 *
 * If PCI Express port service driver is registered with
 * pcie_port_service_register(), this function will be called by the driver core
 * when device_shutdown() is called for the port service device associated
 * with the driver.
 *
 * Intentionally does nothing.
 */
static void pcie_port_shutdown_service(struct device *dev)
{
}

518 519 520 521
/**
 * pcie_port_service_register - register PCI Express port service driver
 * @new: PCI Express port service driver to register
 */
L
Linus Torvalds 已提交
522 523
int pcie_port_service_register(struct pcie_port_service_driver *new)
{
524 525 526
	if (pcie_ports_disabled)
		return -ENODEV;

527
	new->driver.name = new->name;
L
Linus Torvalds 已提交
528 529 530 531 532 533
	new->driver.bus = &pcie_port_bus_type;
	new->driver.probe = pcie_port_probe_service;
	new->driver.remove = pcie_port_remove_service;
	new->driver.shutdown = pcie_port_shutdown_service;

	return driver_register(&new->driver);
534
}
535
EXPORT_SYMBOL(pcie_port_service_register);
L
Linus Torvalds 已提交
536

537 538 539 540
/**
 * pcie_port_service_unregister - unregister PCI Express port service driver
 * @drv: PCI Express port service driver to unregister
 */
541
void pcie_port_service_unregister(struct pcie_port_service_driver *drv)
L
Linus Torvalds 已提交
542
{
543
	driver_unregister(&drv->driver);
L
Linus Torvalds 已提交
544 545
}
EXPORT_SYMBOL(pcie_port_service_unregister);