// SPDX-License-Identifier: GPL-2.0
/*
 * File:	portdrv_core.c
 * Purpose:	PCI Express Port Bus Driver's Core Functions
 *
 * Copyright (C) 2004 Intel
 * Copyright (C) Tom Long Nguyen (tom.l.nguyen@intel.com)
 */

#include <linux/module.h>
#include <linux/pci.h>
#include <linux/kernel.h>
#include <linux/errno.h>
#include <linux/pm.h>
15
#include <linux/pm_runtime.h>
T
Tim Schmielau 已提交
16 17
#include <linux/string.h>
#include <linux/slab.h>
18
#include <linux/aer.h>
L
Linus Torvalds 已提交
19

20
#include "../pci.h"
L
Linus Torvalds 已提交
21 22
#include "portdrv.h"

23 24 25 26 27 28
/**
 * release_pcie_device - release callback for a PCI Express port service device
 * @dev: Generic device embedded in the port service device being released
 *
 * Installed as the ->release hook of every port service device by
 * pcie_device_init().  Frees the enclosing port service device structure
 * looked up through to_pcie_device().
 */
static void release_pcie_device(struct device *dev)
{
	struct pcie_device *pcie = to_pcie_device(dev);

	kfree(pcie);
}

35 36 37 38
/*
 * Fill in *pme, *aer, *dpc with the relevant Interrupt Message Numbers if
 * services are enabled in "mask".  Return the number of MSI/MSI-X vectors
 * required to accommodate the largest Message Number.
39
 */
40 41
static int pcie_message_numbers(struct pci_dev *dev, int mask,
				u32 *pme, u32 *aer, u32 *dpc)
42
{
43
	u32 nvec = 0, pos;
44
	u16 reg16;
45 46

	/*
47 48 49 50
	 * The Interrupt Message Number indicates which vector is used, i.e.,
	 * the MSI-X table entry or the MSI offset between the base Message
	 * Data and the generated interrupt message.  See PCIe r3.1, sec
	 * 7.8.2, 7.10.10, 7.31.2.
51 52 53
	 */

	if (mask & (PCIE_PORT_SERVICE_PME | PCIE_PORT_SERVICE_HP)) {
54
		pcie_capability_read_word(dev, PCI_EXP_FLAGS, &reg16);
55 56
		*pme = (reg16 & PCI_EXP_FLAGS_IRQ) >> 9;
		nvec = *pme + 1;
57 58
	}

59
#ifdef CONFIG_PCIEAER
60
	if (mask & PCIE_PORT_SERVICE_AER) {
61 62 63
		u32 reg32;

		pos = dev->aer_cap;
64 65 66 67 68 69
		if (pos) {
			pci_read_config_dword(dev, pos + PCI_ERR_ROOT_STATUS,
					      &reg32);
			*aer = (reg32 & PCI_ERR_ROOT_AER_IRQ) >> 27;
			nvec = max(nvec, *aer + 1);
		}
70
	}
71
#endif
72

73 74
	if (mask & PCIE_PORT_SERVICE_DPC) {
		pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_DPC);
75 76 77 78 79 80 81 82 83 84 85
		if (pos) {
			pci_read_config_word(dev, pos + PCI_EXP_DPC_CAP,
					     &reg16);
			*dpc = reg16 & PCI_EXP_DPC_IRQ;
			nvec = max(nvec, *dpc + 1);
		}
	}

	return nvec;
}

86
/**
87 88
 * pcie_port_enable_irq_vec - try to set up MSI-X or MSI as interrupt mode
 * for given port
89
 * @dev: PCI Express port to handle
90
 * @irqs: Array of interrupt vectors to populate
91 92 93 94
 * @mask: Bitmask of port capabilities returned by get_port_device_capability()
 *
 * Return value: 0 on success, error code on failure
 */
95
static int pcie_port_enable_irq_vec(struct pci_dev *dev, int *irqs, int mask)
96
{
97 98
	int nr_entries, nvec;
	u32 pme = 0, aer = 0, dpc = 0;
99

B
Bjorn Helgaas 已提交
100
	/* Allocate the maximum possible number of MSI/MSI-X vectors */
101 102
	nr_entries = pci_alloc_irq_vectors(dev, 1, PCIE_PORT_MAX_MSI_ENTRIES,
			PCI_IRQ_MSIX | PCI_IRQ_MSI);
103 104
	if (nr_entries < 0)
		return nr_entries;
105

106 107 108 109 110
	/* See how many and which Interrupt Message Numbers we actually use */
	nvec = pcie_message_numbers(dev, mask, &pme, &aer, &dpc);
	if (nvec > nr_entries) {
		pci_free_irq_vectors(dev);
		return -EIO;
111 112
	}

113
	/*
114 115 116 117 118 119 120 121 122
	 * If we allocated more than we need, free them and reallocate fewer.
	 *
	 * Reallocating may change the specific vectors we get, so
	 * pci_irq_vector() must be done *after* the reallocation.
	 *
	 * If we're using MSI, hardware is *allowed* to change the Interrupt
	 * Message Numbers when we free and reallocate the vectors, but we
	 * assume it won't because we allocate enough vectors for the
	 * biggest Message Number we found.
123
	 */
124 125
	if (nvec != nr_entries) {
		pci_free_irq_vectors(dev);
126

127
		nr_entries = pci_alloc_irq_vectors(dev, nvec, nvec,
128
				PCI_IRQ_MSIX | PCI_IRQ_MSI);
129 130
		if (nr_entries < 0)
			return nr_entries;
131 132
	}

133 134 135 136
	/* PME and hotplug share an MSI/MSI-X vector */
	if (mask & (PCIE_PORT_SERVICE_PME | PCIE_PORT_SERVICE_HP)) {
		irqs[PCIE_PORT_SERVICE_PME_SHIFT] = pci_irq_vector(dev, pme);
		irqs[PCIE_PORT_SERVICE_HP_SHIFT] = pci_irq_vector(dev, pme);
137 138
	}

139 140
	if (mask & PCIE_PORT_SERVICE_AER)
		irqs[PCIE_PORT_SERVICE_AER_SHIFT] = pci_irq_vector(dev, aer);
141

142 143
	if (mask & PCIE_PORT_SERVICE_DPC)
		irqs[PCIE_PORT_SERVICE_DPC_SHIFT] = pci_irq_vector(dev, dpc);
144

145
	return 0;
146 147
}

148
/**
149
 * pcie_init_service_irqs - initialize irqs for PCI Express port services
150
 * @dev: PCI Express port to handle
151
 * @irqs: Array of irqs to populate
152 153 154 155
 * @mask: Bitmask of port capabilities returned by get_port_device_capability()
 *
 * Return value: Interrupt mode associated with the port
 */
156
static int pcie_init_service_irqs(struct pci_dev *dev, int *irqs, int mask)
L
Linus Torvalds 已提交
157
{
158 159 160 161
	int ret, i;

	for (i = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++)
		irqs[i] = -1;
162

163
	/*
164 165 166
	 * If we support PME but can't use MSI/MSI-X for it, we have to
	 * fall back to INTx or other interrupts, e.g., a system shared
	 * interrupt.
167
	 */
168 169 170 171 172 173
	if ((mask & PCIE_PORT_SERVICE_PME) && pcie_pme_no_msi())
		goto legacy_irq;

	/* Try to use MSI-X or MSI if supported */
	if (pcie_port_enable_irq_vec(dev, irqs, mask) == 0)
		return 0;
174

175 176 177
legacy_irq:
	/* fall back to legacy IRQ */
	ret = pci_alloc_irq_vectors(dev, 1, 1, PCI_IRQ_LEGACY);
178 179
	if (ret < 0)
		return -ENODEV;
180

181 182
	for (i = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++)
		irqs[i] = pci_irq_vector(dev, 0);
L
Linus Torvalds 已提交
183

184
	return 0;
L
Linus Torvalds 已提交
185 186
}

187 188 189 190 191 192 193 194 195 196
/**
 * get_port_device_capability - discover capabilities of a PCI Express port
 * @dev: PCI Express port to examine
 *
 * The capabilities are read from the port's PCI Express configuration registers
 * as described in PCI Express Base Specification 1.0a sections 7.8.2, 7.8.9 and
 * 7.9 - 7.11.
 *
 * Return value: Bitmask of discovered port capabilities
 */
L
Linus Torvalds 已提交
197 198
static int get_port_device_capability(struct pci_dev *dev)
{
199
	struct pci_host_bridge *host = pci_find_host_bridge(dev->bus);
200
	int services = 0;
201

202 203
	if (dev->is_hotplug_bridge &&
	    (pcie_ports_native || host->native_hotplug)) {
204
		services |= PCIE_PORT_SERVICE_HP;
205

206 207 208 209 210 211
		/*
		 * Disable hot-plug interrupts in case they have been enabled
		 * by the BIOS and the hot-plug service driver is not loaded.
		 */
		pcie_capability_clear_word(dev, PCI_EXP_SLTCTL,
			  PCI_EXP_SLTCTL_CCIE | PCI_EXP_SLTCTL_HPIE);
212
	}
213

214 215 216
#ifdef CONFIG_PCIEAER
	if (dev->aer_cap && pci_aer_available() &&
	    (pcie_ports_native || host->native_aer)) {
217
		services |= PCIE_PORT_SERVICE_AER;
218

219 220 221 222 223 224
		/*
		 * Disable AER on this port in case it's been enabled by the
		 * BIOS (the AER service driver will enable it when necessary).
		 */
		pci_disable_pcie_error_reporting(dev);
	}
225
#endif
226 227 228 229 230 231 232

	/*
	 * Root ports are capable of generating PME too.  Root Complex
	 * Event Collectors can also generate PMEs, but we don't handle
	 * those yet.
	 */
	if (pci_pcie_type(dev) == PCI_EXP_TYPE_ROOT_PORT &&
233
	    (pcie_ports_native || host->native_pme)) {
234
		services |= PCIE_PORT_SERVICE_PME;
235

236 237 238 239 240 241 242
		/*
		 * Disable PME interrupt on this port in case it's been enabled
		 * by the BIOS (the PME service driver will enable it when
		 * necessary).
		 */
		pcie_pme_interrupt_enable(dev, false);
	}
243 244

	if (pci_find_ext_capability(dev, PCI_EXT_CAP_ID_DPC) &&
245
	    pci_aer_available() && services & PCIE_PORT_SERVICE_AER)
246
		services |= PCIE_PORT_SERVICE_DPC;
L
Linus Torvalds 已提交
247 248 249 250

	return services;
}

251
/**
252 253 254
 * pcie_device_init - allocate and initialize PCI Express port service device
 * @pdev: PCI Express port to associate the service device with
 * @service: Type of service to associate with the service device
255 256
 * @irq: Interrupt vector to associate with the service device
 */
257
static int pcie_device_init(struct pci_dev *pdev, int service, int irq)
L
Linus Torvalds 已提交
258
{
259 260
	int retval;
	struct pcie_device *pcie;
L
Linus Torvalds 已提交
261 262
	struct device *device;

263 264 265 266 267 268
	pcie = kzalloc(sizeof(*pcie), GFP_KERNEL);
	if (!pcie)
		return -ENOMEM;
	pcie->port = pdev;
	pcie->irq = irq;
	pcie->service = service;
L
Linus Torvalds 已提交
269 270

	/* Initialize generic device interface */
271
	device = &pcie->device;
L
Linus Torvalds 已提交
272 273
	device->bus = &pcie_port_bus_type;
	device->release = release_pcie_device;	/* callback to free pcie dev */
274
	dev_set_name(device, "%s:pcie%03x",
275
		     pci_name(pdev),
276
		     get_descriptor_id(pci_pcie_type(pdev), service));
277
	device->parent = &pdev->dev;
278
	device_enable_async_suspend(device);
279 280

	retval = device_register(device);
B
Bjorn Helgaas 已提交
281
	if (retval) {
282
		put_device(device);
B
Bjorn Helgaas 已提交
283 284 285
		return retval;
	}

286 287
	pm_runtime_no_callbacks(device);

B
Bjorn Helgaas 已提交
288
	return 0;
L
Linus Torvalds 已提交
289 290
}

291 292 293 294 295 296 297
/**
 * pcie_port_device_register - register PCI Express port
 * @dev: PCI Express port to register
 *
 * Allocate the port extension structure and register services associated with
 * the port.
 */
L
Linus Torvalds 已提交
298 299
int pcie_port_device_register(struct pci_dev *dev)
{
300
	int status, capabilities, i, nr_service;
301
	int irqs[PCIE_PORT_DEVICE_MAXSERVICES];
L
Linus Torvalds 已提交
302

303 304 305
	/* Enable PCI Express port device */
	status = pci_enable_device(dev);
	if (status)
306
		return status;
307 308 309

	/* Get and check PCI Express port services */
	capabilities = get_port_device_capability(dev);
310
	if (!capabilities)
311 312
		return 0;

313
	pci_set_master(dev);
314 315 316
	/*
	 * Initialize service irqs. Don't use service devices that
	 * require interrupts if there is no way to generate them.
317 318 319
	 * However, some drivers may have a polling mode (e.g. pciehp_poll_mode)
	 * that can be used in the absence of irqs.  Allow them to determine
	 * if that is to be used.
320
	 */
321
	status = pcie_init_service_irqs(dev, irqs, capabilities);
322
	if (status) {
323
		capabilities &= PCIE_PORT_SERVICE_HP;
324
		if (!capabilities)
325
			goto error_disable;
326
	}
L
Linus Torvalds 已提交
327 328

	/* Allocate child services if any */
329 330 331
	status = -ENODEV;
	nr_service = 0;
	for (i = 0; i < PCIE_PORT_DEVICE_MAXSERVICES; i++) {
332 333 334
		int service = 1 << i;
		if (!(capabilities & service))
			continue;
335 336
		if (!pcie_device_init(dev, service, irqs[i]))
			nr_service++;
337
	}
338
	if (!nr_service)
339
		goto error_cleanup_irqs;
340

L
Linus Torvalds 已提交
341
	return 0;
342

343
error_cleanup_irqs:
344
	pci_free_irq_vectors(dev);
345 346
error_disable:
	pci_disable_device(dev);
347
	return status;
L
Linus Torvalds 已提交
348 349 350
}

#ifdef CONFIG_PM
351
static int suspend_iter(struct device *dev, void *data)
L
Linus Torvalds 已提交
352 353
{
	struct pcie_port_service_driver *service_driver;
354

355 356 357 358 359
	if ((dev->bus == &pcie_port_bus_type) && dev->driver) {
		service_driver = to_service_driver(dev->driver);
		if (service_driver->suspend)
			service_driver->suspend(to_pcie_device(dev));
	}
360 361
	return 0;
}
L
Linus Torvalds 已提交
362

363 364 365 366
/**
 * pcie_port_device_suspend - suspend port services associated with a PCIe port
 * @dev: PCI Express port to handle
 */
367
int pcie_port_device_suspend(struct device *dev)
368
{
369
	return device_for_each_child(dev, NULL, suspend_iter);
L
Linus Torvalds 已提交
370 371
}

372 373
static int resume_iter(struct device *dev, void *data)
{
L
Linus Torvalds 已提交
374 375
	struct pcie_port_service_driver *service_driver;

376 377 378 379 380
	if ((dev->bus == &pcie_port_bus_type) &&
	    (dev->driver)) {
		service_driver = to_service_driver(dev->driver);
		if (service_driver->resume)
			service_driver->resume(to_pcie_device(dev));
L
Linus Torvalds 已提交
381
	}
382 383
	return 0;
}
L
Linus Torvalds 已提交
384

385
/**
386
 * pcie_port_device_resume - resume port services associated with a PCIe port
387 388
 * @dev: PCI Express port to handle
 */
389
int pcie_port_device_resume(struct device *dev)
390
{
391
	return device_for_each_child(dev, NULL, resume_iter);
L
Linus Torvalds 已提交
392
}
393
#endif /* PM */
L
Linus Torvalds 已提交
394

395
static int remove_iter(struct device *dev, void *data)
L
Linus Torvalds 已提交
396
{
397
	if (dev->bus == &pcie_port_bus_type)
398
		device_unregister(dev);
399 400 401
	return 0;
}

402 403 404 405 406 407 408
/**
 * pcie_port_device_remove - unregister PCI Express port service devices
 * @dev: PCI Express port the service devices to unregister are associated with
 *
 * Remove PCI Express port service devices associated with given port and
 * disable MSI-X or MSI for the port.
 */
409 410
void pcie_port_device_remove(struct pci_dev *dev)
{
411
	device_for_each_child(&dev->dev, NULL, remove_iter);
412
	pci_free_irq_vectors(dev);
413
	pci_disable_device(dev);
L
Linus Torvalds 已提交
414 415
}

416 417 418 419 420 421 422 423
/**
 * pcie_port_probe_service - probe driver for given PCI Express port service
 * @dev: PCI Express port service device to probe against
 *
 * If PCI Express port service driver is registered with
 * pcie_port_service_register(), this function will be called by the driver core
 * whenever match is found between the driver and a port service device.
 */
424
static int pcie_port_probe_service(struct device *dev)
L
Linus Torvalds 已提交
425
{
426 427 428 429 430 431 432 433 434 435 436 437
	struct pcie_device *pciedev;
	struct pcie_port_service_driver *driver;
	int status;

	if (!dev || !dev->driver)
		return -ENODEV;

	driver = to_service_driver(dev->driver);
	if (!driver || !driver->probe)
		return -ENODEV;

	pciedev = to_pcie_device(dev);
438
	status = driver->probe(pciedev);
B
Bjorn Helgaas 已提交
439 440 441 442 443
	if (status)
		return status;

	get_device(dev);
	return 0;
L
Linus Torvalds 已提交
444 445
}

446 447 448 449 450 451 452 453 454
/**
 * pcie_port_remove_service - detach driver from given PCI Express port service
 * @dev: PCI Express port service device to handle
 *
 * If PCI Express port service driver is registered with
 * pcie_port_service_register(), this function will be called by the driver core
 * when device_unregister() is called for the port service device associated
 * with the driver.
 */
455
static int pcie_port_remove_service(struct device *dev)
L
Linus Torvalds 已提交
456
{
457 458 459 460 461 462 463 464 465 466 467 468 469
	struct pcie_device *pciedev;
	struct pcie_port_service_driver *driver;

	if (!dev || !dev->driver)
		return 0;

	pciedev = to_pcie_device(dev);
	driver = to_service_driver(dev->driver);
	if (driver && driver->remove) {
		driver->remove(pciedev);
		put_device(dev);
	}
	return 0;
L
Linus Torvalds 已提交
470 471
}

472 473 474 475 476 477 478 479 480
/**
 * pcie_port_shutdown_service - shut down given PCI Express port service
 * @dev: PCI Express port service device to handle
 *
 * If PCI Express port service driver is registered with
 * pcie_port_service_register(), this function will be called by the driver core
 * when device_shutdown() is called for the port service device associated
 * with the driver.
 *
 * Intentionally a no-op.
 */
static void pcie_port_shutdown_service(struct device *dev)
{
}

483 484 485 486
/**
 * pcie_port_service_register - register PCI Express port service driver
 * @new: PCI Express port service driver to register
 */
L
Linus Torvalds 已提交
487 488
int pcie_port_service_register(struct pcie_port_service_driver *new)
{
489 490 491
	if (pcie_ports_disabled)
		return -ENODEV;

492
	new->driver.name = new->name;
L
Linus Torvalds 已提交
493 494 495 496 497 498
	new->driver.bus = &pcie_port_bus_type;
	new->driver.probe = pcie_port_probe_service;
	new->driver.remove = pcie_port_remove_service;
	new->driver.shutdown = pcie_port_shutdown_service;

	return driver_register(&new->driver);
499
}
500
EXPORT_SYMBOL(pcie_port_service_register);
L
Linus Torvalds 已提交
501

502 503 504 505
/**
 * pcie_port_service_unregister - unregister PCI Express port service driver
 * @drv: PCI Express port service driver to unregister
 */
506
void pcie_port_service_unregister(struct pcie_port_service_driver *drv)
L
Linus Torvalds 已提交
507
{
508
	driver_unregister(&drv->driver);
L
Linus Torvalds 已提交
509 510
}
EXPORT_SYMBOL(pcie_port_service_unregister);