probe.c 33.3 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11
/*
 * probe.c - PCI detection and setup code
 */

#include <linux/kernel.h>
#include <linux/delay.h>
#include <linux/init.h>
#include <linux/pci.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <linux/cpumask.h>
S
Shaohua Li 已提交
12
#include <linux/pci-aspm.h>
13
#include <linux/iommu.h>
14
#include <acpi/acpi_hest.h>
15
#include <xen/xen.h>
16
#include "pci.h"
L
Linus Torvalds 已提交
17 18 19 20 21 22 23 24

#define CARDBUS_LATENCY_TIMER	176	/* secondary latency timer */
#define CARDBUS_RESERVE_BUSNR	3

/* Ugh.  Need to stop exporting this to modules. */
LIST_HEAD(pci_root_buses);
EXPORT_SYMBOL(pci_root_buses);

25 26 27 28 29

static int find_anything(struct device *dev, void *data)
{
	return 1;
}
L
Linus Torvalds 已提交
30

Z
Zhang, Yanmin 已提交
31 32 33
/*
 * Some device drivers need know if pci is initiated.
 * Basically, we think pci is not initiated when there
34
 * is no device to be found on the pci_bus_type.
Z
Zhang, Yanmin 已提交
35 36 37
 */
int no_pci_devices(void)
{
38 39
	struct device *dev;
	int no_devices;
Z
Zhang, Yanmin 已提交
40

41 42 43 44 45
	dev = bus_find_device(&pci_bus_type, NULL, NULL, find_anything);
	no_devices = (dev == NULL);
	put_device(dev);
	return no_devices;
}
Z
Zhang, Yanmin 已提交
46 47
EXPORT_SYMBOL(no_pci_devices);

L
Linus Torvalds 已提交
48 49 50
/*
 * PCI Bus Class Devices
 */
51
static ssize_t pci_bus_show_cpuaffinity(struct device *dev,
52
					int type,
53
					struct device_attribute *attr,
54
					char *buf)
L
Linus Torvalds 已提交
55 56
{
	int ret;
57
	const struct cpumask *cpumask;
L
Linus Torvalds 已提交
58

59
	cpumask = cpumask_of_pcibus(to_pci_bus(dev));
60
	ret = type?
61 62
		cpulist_scnprintf(buf, PAGE_SIZE-2, cpumask) :
		cpumask_scnprintf(buf, PAGE_SIZE-2, cpumask);
63 64
	buf[ret++] = '\n';
	buf[ret] = '\0';
L
Linus Torvalds 已提交
65 66
	return ret;
}
67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83

static ssize_t inline pci_bus_show_cpumaskaffinity(struct device *dev,
					struct device_attribute *attr,
					char *buf)
{
	return pci_bus_show_cpuaffinity(dev, 0, attr, buf);
}

static ssize_t inline pci_bus_show_cpulistaffinity(struct device *dev,
					struct device_attribute *attr,
					char *buf)
{
	return pci_bus_show_cpuaffinity(dev, 1, attr, buf);
}

DEVICE_ATTR(cpuaffinity,     S_IRUGO, pci_bus_show_cpumaskaffinity, NULL);
DEVICE_ATTR(cpulistaffinity, S_IRUGO, pci_bus_show_cpulistaffinity, NULL);
L
Linus Torvalds 已提交
84 85 86 87

/*
 * PCI Bus Class
 */
88
static void release_pcibus_dev(struct device *dev)
L
Linus Torvalds 已提交
89
{
90
	struct pci_bus *pci_bus = to_pci_bus(dev);
L
Linus Torvalds 已提交
91 92 93 94 95 96 97 98

	if (pci_bus->bridge)
		put_device(pci_bus->bridge);
	kfree(pci_bus);
}

static struct class pcibus_class = {
	.name		= "pci_bus",
99
	.dev_release	= &release_pcibus_dev,
L
Linus Torvalds 已提交
100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122
};

static int __init pcibus_class_init(void)
{
	return class_register(&pcibus_class);
}
postcore_initcall(pcibus_class_init);

/*
 * Translate the low bits of the PCI base
 * to the resource type
 */
static inline unsigned int pci_calc_resource_flags(unsigned int flags)
{
	if (flags & PCI_BASE_ADDRESS_SPACE_IO)
		return IORESOURCE_IO;

	if (flags & PCI_BASE_ADDRESS_MEM_PREFETCH)
		return IORESOURCE_MEM | IORESOURCE_PREFETCH;

	return IORESOURCE_MEM;
}

123
static u64 pci_size(u64 base, u64 maxbase, u64 mask)
L
Linus Torvalds 已提交
124
{
125
	u64 size = mask & maxbase;	/* Find the significant bits */
L
Linus Torvalds 已提交
126 127 128 129 130 131 132 133 134 135 136 137 138 139 140
	if (!size)
		return 0;

	/* Get the lowest of them to find the decode size, and
	   from that the extent.  */
	size = (size & ~(size-1)) - 1;

	/* base == maxbase can be valid only if the BAR has
	   already been programmed with all 1s.  */
	if (base == maxbase && ((base | size) & mask) != mask)
		return 0;

	return size;
}

141 142 143 144 145 146
static inline enum pci_bar_type decode_bar(struct resource *res, u32 bar)
{
	if ((bar & PCI_BASE_ADDRESS_SPACE) == PCI_BASE_ADDRESS_SPACE_IO) {
		res->flags = bar & ~PCI_BASE_ADDRESS_IO_MASK;
		return pci_bar_io;
	}
147

148
	res->flags = bar & ~PCI_BASE_ADDRESS_MEM_MASK;
149

150
	if (res->flags & PCI_BASE_ADDRESS_MEM_TYPE_64)
151 152
		return pci_bar_mem64;
	return pci_bar_mem32;
153 154
}

Y
Yu Zhao 已提交
155 156 157 158 159 160 161 162
/**
 * pci_read_base - read a PCI BAR
 * @dev: the PCI device
 * @type: type of the BAR
 * @res: resource buffer to be filled in
 * @pos: BAR position in the config space
 *
 * Returns 1 if the BAR is 64-bit, or 0 if 32-bit.
163
 */
Y
Yu Zhao 已提交
164
int __pci_read_base(struct pci_dev *dev, enum pci_bar_type type,
165
			struct resource *res, unsigned int pos)
166
{
167 168
	u32 l, sz, mask;

169
	mask = type ? PCI_ROM_ADDRESS_MASK : ~0;
170 171 172 173

	res->name = pci_name(dev);

	pci_read_config_dword(dev, pos, &l);
174
	pci_write_config_dword(dev, pos, l | mask);
175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198
	pci_read_config_dword(dev, pos, &sz);
	pci_write_config_dword(dev, pos, l);

	/*
	 * All bits set in sz means the device isn't working properly.
	 * If the BAR isn't implemented, all bits must be 0.  If it's a
	 * memory BAR or a ROM, bit 0 must be clear; if it's an io BAR, bit
	 * 1 must be clear.
	 */
	if (!sz || sz == 0xffffffff)
		goto fail;

	/*
	 * I don't know how l can have all bits set.  Copied from old code.
	 * Maybe it fixes a bug on some ancient platform.
	 */
	if (l == 0xffffffff)
		l = 0;

	if (type == pci_bar_unknown) {
		type = decode_bar(res, l);
		res->flags |= pci_calc_resource_flags(l) | IORESOURCE_SIZEALIGN;
		if (type == pci_bar_io) {
			l &= PCI_BASE_ADDRESS_IO_MASK;
199
			mask = PCI_BASE_ADDRESS_IO_MASK & IO_SPACE_LIMIT;
200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227
		} else {
			l &= PCI_BASE_ADDRESS_MEM_MASK;
			mask = (u32)PCI_BASE_ADDRESS_MEM_MASK;
		}
	} else {
		res->flags |= (l & IORESOURCE_ROM_ENABLE);
		l &= PCI_ROM_ADDRESS_MASK;
		mask = (u32)PCI_ROM_ADDRESS_MASK;
	}

	if (type == pci_bar_mem64) {
		u64 l64 = l;
		u64 sz64 = sz;
		u64 mask64 = mask | (u64)~0 << 32;

		pci_read_config_dword(dev, pos + 4, &l);
		pci_write_config_dword(dev, pos + 4, ~0);
		pci_read_config_dword(dev, pos + 4, &sz);
		pci_write_config_dword(dev, pos + 4, l);

		l64 |= ((u64)l << 32);
		sz64 |= ((u64)sz << 32);

		sz64 = pci_size(l64, sz64, mask64);

		if (!sz64)
			goto fail;

228
		if ((sizeof(resource_size_t) < 8) && (sz64 > 0x100000000ULL)) {
229 230
			dev_err(&dev->dev, "can't handle 64-bit BAR\n");
			goto fail;
231 232 233 234
		}

		res->flags |= IORESOURCE_MEM_64;
		if ((sizeof(resource_size_t) < 8) && l) {
235 236 237 238 239 240 241 242
			/* Address above 32-bit boundary; disable the BAR */
			pci_write_config_dword(dev, pos, 0);
			pci_write_config_dword(dev, pos + 4, 0);
			res->start = 0;
			res->end = sz64;
		} else {
			res->start = l64;
			res->end = l64 + sz64;
243
			dev_printk(KERN_DEBUG, &dev->dev, "reg %x: %pR\n",
244
				   pos, res);
245 246 247 248 249 250 251 252 253
		}
	} else {
		sz = pci_size(l, sz, mask);

		if (!sz)
			goto fail;

		res->start = l;
		res->end = l + sz;
254

255
		dev_printk(KERN_DEBUG, &dev->dev, "reg %x: %pR\n", pos, res);
256 257 258 259 260 261 262
	}

 out:
	return (type == pci_bar_mem64) ? 1 : 0;
 fail:
	res->flags = 0;
	goto out;
263 264
}

L
Linus Torvalds 已提交
265 266
static void pci_read_bases(struct pci_dev *dev, unsigned int howmany, int rom)
{
267
	unsigned int pos, reg;
268

269 270
	for (pos = 0; pos < howmany; pos++) {
		struct resource *res = &dev->resource[pos];
L
Linus Torvalds 已提交
271
		reg = PCI_BASE_ADDRESS_0 + (pos << 2);
272
		pos += __pci_read_base(dev, pci_bar_unknown, res, reg);
L
Linus Torvalds 已提交
273
	}
274

L
Linus Torvalds 已提交
275
	if (rom) {
276
		struct resource *res = &dev->resource[PCI_ROM_RESOURCE];
L
Linus Torvalds 已提交
277
		dev->rom_base_reg = rom;
278 279 280 281
		res->flags = IORESOURCE_MEM | IORESOURCE_PREFETCH |
				IORESOURCE_READONLY | IORESOURCE_CACHEABLE |
				IORESOURCE_SIZEALIGN;
		__pci_read_base(dev, pci_bar_mem32, res, rom);
L
Linus Torvalds 已提交
282 283 284
	}
}

285
void __devinit pci_read_bridge_bases(struct pci_bus *child)
L
Linus Torvalds 已提交
286 287 288 289 290 291 292 293
{
	struct pci_dev *dev = child->self;
	u8 io_base_lo, io_limit_lo;
	u16 mem_base_lo, mem_limit_lo;
	unsigned long base, limit;
	struct resource *res;
	int i;

294
	if (pci_is_root_bus(child))	/* It's a host bus, nothing to read */
L
Linus Torvalds 已提交
295 296 297
		return;

	if (dev->transparent) {
298
		dev_info(&dev->dev, "transparent bridge\n");
299 300
		for(i = 3; i < PCI_BUS_NUM_RESOURCES; i++)
			child->resource[i] = child->parent->resource[i - 3];
L
Linus Torvalds 已提交
301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318
	}

	res = child->resource[0];
	pci_read_config_byte(dev, PCI_IO_BASE, &io_base_lo);
	pci_read_config_byte(dev, PCI_IO_LIMIT, &io_limit_lo);
	base = (io_base_lo & PCI_IO_RANGE_MASK) << 8;
	limit = (io_limit_lo & PCI_IO_RANGE_MASK) << 8;

	if ((io_base_lo & PCI_IO_RANGE_TYPE_MASK) == PCI_IO_RANGE_TYPE_32) {
		u16 io_base_hi, io_limit_hi;
		pci_read_config_word(dev, PCI_IO_BASE_UPPER16, &io_base_hi);
		pci_read_config_word(dev, PCI_IO_LIMIT_UPPER16, &io_limit_hi);
		base |= (io_base_hi << 16);
		limit |= (io_limit_hi << 16);
	}

	if (base <= limit) {
		res->flags = (io_base_lo & PCI_IO_RANGE_TYPE_MASK) | IORESOURCE_IO;
319 320 321 322
		if (!res->start)
			res->start = base;
		if (!res->end)
			res->end = limit + 0xfff;
323
		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
L
Linus Torvalds 已提交
324 325 326 327 328 329 330 331 332 333 334
	}

	res = child->resource[1];
	pci_read_config_word(dev, PCI_MEMORY_BASE, &mem_base_lo);
	pci_read_config_word(dev, PCI_MEMORY_LIMIT, &mem_limit_lo);
	base = (mem_base_lo & PCI_MEMORY_RANGE_MASK) << 16;
	limit = (mem_limit_lo & PCI_MEMORY_RANGE_MASK) << 16;
	if (base <= limit) {
		res->flags = (mem_base_lo & PCI_MEMORY_RANGE_TYPE_MASK) | IORESOURCE_MEM;
		res->start = base;
		res->end = limit + 0xfffff;
335
		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
L
Linus Torvalds 已提交
336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359
	}

	res = child->resource[2];
	pci_read_config_word(dev, PCI_PREF_MEMORY_BASE, &mem_base_lo);
	pci_read_config_word(dev, PCI_PREF_MEMORY_LIMIT, &mem_limit_lo);
	base = (mem_base_lo & PCI_PREF_RANGE_MASK) << 16;
	limit = (mem_limit_lo & PCI_PREF_RANGE_MASK) << 16;

	if ((mem_base_lo & PCI_PREF_RANGE_TYPE_MASK) == PCI_PREF_RANGE_TYPE_64) {
		u32 mem_base_hi, mem_limit_hi;
		pci_read_config_dword(dev, PCI_PREF_BASE_UPPER32, &mem_base_hi);
		pci_read_config_dword(dev, PCI_PREF_LIMIT_UPPER32, &mem_limit_hi);

		/*
		 * Some bridges set the base > limit by default, and some
		 * (broken) BIOSes do not initialize them.  If we find
		 * this, just assume they are not being used.
		 */
		if (mem_base_hi <= mem_limit_hi) {
#if BITS_PER_LONG == 64
			base |= ((long) mem_base_hi) << 32;
			limit |= ((long) mem_limit_hi) << 32;
#else
			if (mem_base_hi || mem_limit_hi) {
360 361
				dev_err(&dev->dev, "can't handle 64-bit "
					"address space for bridge\n");
L
Linus Torvalds 已提交
362 363 364 365 366 367
				return;
			}
#endif
		}
	}
	if (base <= limit) {
368 369 370 371
		res->flags = (mem_base_lo & PCI_PREF_RANGE_TYPE_MASK) |
					 IORESOURCE_MEM | IORESOURCE_PREFETCH;
		if (res->flags & PCI_PREF_RANGE_TYPE_64)
			res->flags |= IORESOURCE_MEM_64;
L
Linus Torvalds 已提交
372 373
		res->start = base;
		res->end = limit + 0xfffff;
374
		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
L
Linus Torvalds 已提交
375 376 377
	}
}

378
static struct pci_bus * pci_alloc_bus(void)
L
Linus Torvalds 已提交
379 380 381
{
	struct pci_bus *b;

382
	b = kzalloc(sizeof(*b), GFP_KERNEL);
L
Linus Torvalds 已提交
383 384 385 386
	if (b) {
		INIT_LIST_HEAD(&b->node);
		INIT_LIST_HEAD(&b->children);
		INIT_LIST_HEAD(&b->devices);
A
Alex Chiang 已提交
387
		INIT_LIST_HEAD(&b->slots);
L
Linus Torvalds 已提交
388 389 390 391
	}
	return b;
}

392 393
static struct pci_bus *pci_alloc_child_bus(struct pci_bus *parent,
					   struct pci_dev *bridge, int busnr)
L
Linus Torvalds 已提交
394 395 396 397 398 399 400 401 402 403 404 405 406 407
{
	struct pci_bus *child;
	int i;

	/*
	 * Allocate a new bus, and inherit stuff from the parent..
	 */
	child = pci_alloc_bus();
	if (!child)
		return NULL;

	child->parent = parent;
	child->ops = parent->ops;
	child->sysdata = parent->sysdata;
408
	child->bus_flags = parent->bus_flags;
L
Linus Torvalds 已提交
409

410 411 412 413 414
	/* initialize some portions of the bus device, but don't register it
	 * now as the parent is not properly set up yet.  This device will get
	 * registered later in pci_bus_add_devices()
	 */
	child->dev.class = &pcibus_class;
415
	dev_set_name(&child->dev, "%04x:%02x", pci_domain_nr(child), busnr);
L
Linus Torvalds 已提交
416 417 418 419 420 421 422 423 424

	/*
	 * Set up the primary, secondary and subordinate
	 * bus numbers.
	 */
	child->number = child->secondary = busnr;
	child->primary = parent->secondary;
	child->subordinate = 0xff;

425 426 427 428 429 430
	if (!bridge)
		return child;

	child->self = bridge;
	child->bridge = get_device(&bridge->dev);

L
Linus Torvalds 已提交
431
	/* Set up default resource pointers and names.. */
432
	for (i = 0; i < PCI_BRIDGE_RESOURCE_NUM; i++) {
L
Linus Torvalds 已提交
433 434 435 436 437 438 439 440
		child->resource[i] = &bridge->resource[PCI_BRIDGE_RESOURCES+i];
		child->resource[i]->name = child->name;
	}
	bridge->subordinate = child;

	return child;
}

441
struct pci_bus *__ref pci_add_new_bus(struct pci_bus *parent, struct pci_dev *dev, int busnr)
L
Linus Torvalds 已提交
442 443 444 445
{
	struct pci_bus *child;

	child = pci_alloc_child_bus(parent, dev, busnr);
446
	if (child) {
447
		down_write(&pci_bus_sem);
L
Linus Torvalds 已提交
448
		list_add_tail(&child->node, &parent->children);
449
		up_write(&pci_bus_sem);
450
	}
L
Linus Torvalds 已提交
451 452 453
	return child;
}

454
static void pci_fixup_parent_subordinate_busnr(struct pci_bus *child, int max)
455 456
{
	struct pci_bus *parent = child->parent;
457 458 459 460 461 462

	/* Attempts to fix that up are really dangerous unless
	   we're going to re-assign all bus numbers. */
	if (!pcibios_assign_all_busses())
		return;

463 464 465 466 467 468 469
	while (parent->parent && parent->subordinate < max) {
		parent->subordinate = max;
		pci_write_config_byte(parent->self, PCI_SUBORDINATE_BUS, max);
		parent = parent->parent;
	}
}

L
Linus Torvalds 已提交
470 471 472 473 474 475 476 477 478 479
/*
 * If it's a bridge, configure it and scan the bus behind it.
 * For CardBus bridges, we don't scan behind as the devices will
 * be handled by the bridge driver itself.
 *
 * We need to process bridges in two passes -- first we scan those
 * already configured by the BIOS and after we are done with all of
 * them, we proceed to assigning numbers to the remaining buses in
 * order to avoid overlaps between old and new bus numbers.
 */
480
int __devinit pci_scan_bridge(struct pci_bus *bus, struct pci_dev *dev, int max, int pass)
L
Linus Torvalds 已提交
481 482 483
{
	struct pci_bus *child;
	int is_cardbus = (dev->hdr_type == PCI_HEADER_TYPE_CARDBUS);
484
	u32 buses, i, j = 0;
L
Linus Torvalds 已提交
485
	u16 bctl;
486
	int broken = 0;
L
Linus Torvalds 已提交
487 488 489

	pci_read_config_dword(dev, PCI_PRIMARY_BUS, &buses);

490 491
	dev_dbg(&dev->dev, "scanning behind bridge, config %06x, pass %d\n",
		buses & 0xffffff, pass);
L
Linus Torvalds 已提交
492

493 494 495 496 497 498 499
	/* Check if setup is sensible at all */
	if (!pass &&
	    ((buses & 0xff) != bus->number || ((buses >> 8) & 0xff) <= bus->number)) {
		dev_dbg(&dev->dev, "bus configuration invalid, reconfiguring\n");
		broken = 1;
	}

L
Linus Torvalds 已提交
500 501 502 503 504 505
	/* Disable MasterAbortMode during probing to avoid reporting
	   of bus errors (in some architectures) */ 
	pci_read_config_word(dev, PCI_BRIDGE_CONTROL, &bctl);
	pci_write_config_word(dev, PCI_BRIDGE_CONTROL,
			      bctl & ~PCI_BRIDGE_CTL_MASTER_ABORT);

506
	if ((buses & 0xffff00) && !pcibios_assign_all_busses() && !is_cardbus && !broken) {
L
Linus Torvalds 已提交
507 508 509 510 511 512
		unsigned int cmax, busnr;
		/*
		 * Bus already configured by firmware, process it in the first
		 * pass and just note the configuration.
		 */
		if (pass)
513
			goto out;
L
Linus Torvalds 已提交
514 515 516 517
		busnr = (buses >> 8) & 0xFF;

		/*
		 * If we already got to this bus through a different bridge,
A
Alex Chiang 已提交
518 519 520 521
		 * don't re-add it. This can happen with the i450NX chipset.
		 *
		 * However, we continue to descend down the hierarchy and
		 * scan remaining child buses.
L
Linus Torvalds 已提交
522
		 */
A
Alex Chiang 已提交
523 524 525 526 527 528 529 530
		child = pci_find_bus(pci_domain_nr(bus), busnr);
		if (!child) {
			child = pci_add_new_bus(bus, dev, busnr);
			if (!child)
				goto out;
			child->primary = buses & 0xFF;
			child->subordinate = (buses >> 16) & 0xFF;
			child->bridge_ctl = bctl;
L
Linus Torvalds 已提交
531 532 533 534 535 536 537 538 539 540 541 542
		}

		cmax = pci_scan_child_bus(child);
		if (cmax > max)
			max = cmax;
		if (child->subordinate > max)
			max = child->subordinate;
	} else {
		/*
		 * We need to assign a number to this bus which we always
		 * do in the second pass.
		 */
543
		if (!pass) {
544
			if (pcibios_assign_all_busses() || broken)
545 546 547 548 549 550 551 552
				/* Temporarily disable forwarding of the
				   configuration cycles on all bridges in
				   this bus segment to avoid possible
				   conflicts in the second pass between two
				   bridges programmed with overlapping
				   bus ranges. */
				pci_write_config_dword(dev, PCI_PRIMARY_BUS,
						       buses & ~0xffffff);
553
			goto out;
554
		}
L
Linus Torvalds 已提交
555 556 557 558

		/* Clear errors */
		pci_write_config_word(dev, PCI_STATUS, 0xffff);

559 560 561
		/* Prevent assigning a bus number that already exists.
		 * This can happen when a bridge is hot-plugged */
		if (pci_find_bus(pci_domain_nr(bus), max+1))
562
			goto out;
563
		child = pci_add_new_bus(bus, dev, ++max);
L
Linus Torvalds 已提交
564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583
		buses = (buses & 0xff000000)
		      | ((unsigned int)(child->primary)     <<  0)
		      | ((unsigned int)(child->secondary)   <<  8)
		      | ((unsigned int)(child->subordinate) << 16);

		/*
		 * yenta.c forces a secondary latency timer of 176.
		 * Copy that behaviour here.
		 */
		if (is_cardbus) {
			buses &= ~0xff000000;
			buses |= CARDBUS_LATENCY_TIMER << 24;
		}
			
		/*
		 * We need to blast all three values with a single write.
		 */
		pci_write_config_dword(dev, PCI_PRIMARY_BUS, buses);

		if (!is_cardbus) {
584
			child->bridge_ctl = bctl;
585 586 587 588 589 590 591
			/*
			 * Adjust subordinate busnr in parent buses.
			 * We do this before scanning for children because
			 * some devices may not be detected if the bios
			 * was lazy.
			 */
			pci_fixup_parent_subordinate_busnr(child, max);
L
Linus Torvalds 已提交
592 593
			/* Now we can scan all subordinate buses... */
			max = pci_scan_child_bus(child);
594 595 596 597 598
			/*
			 * now fix it up again since we have found
			 * the real value of max.
			 */
			pci_fixup_parent_subordinate_busnr(child, max);
L
Linus Torvalds 已提交
599 600 601 602 603 604
		} else {
			/*
			 * For CardBus bridges, we leave 4 bus numbers
			 * as cards with a PCI-to-PCI bridge can be
			 * inserted later.
			 */
605 606
			for (i=0; i<CARDBUS_RESERVE_BUSNR; i++) {
				struct pci_bus *parent = bus;
607 608 609
				if (pci_find_bus(pci_domain_nr(bus),
							max+i+1))
					break;
610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627
				while (parent->parent) {
					if ((!pcibios_assign_all_busses()) &&
					    (parent->subordinate > max) &&
					    (parent->subordinate <= max+i)) {
						j = 1;
					}
					parent = parent->parent;
				}
				if (j) {
					/*
					 * Often, there are two cardbus bridges
					 * -- try to leave one valid bus number
					 * for each one.
					 */
					i /= 2;
					break;
				}
			}
628
			max += i;
629
			pci_fixup_parent_subordinate_busnr(child, max);
L
Linus Torvalds 已提交
630 631 632 633 634 635 636 637
		}
		/*
		 * Set the subordinate bus number to its real value.
		 */
		child->subordinate = max;
		pci_write_config_byte(dev, PCI_SUBORDINATE_BUS, max);
	}

638 639 640
	sprintf(child->name,
		(is_cardbus ? "PCI CardBus %04x:%02x" : "PCI Bus %04x:%02x"),
		pci_domain_nr(bus), child->number);
L
Linus Torvalds 已提交
641

642
	/* Has only triggered on CardBus, fixup is in yenta_socket */
643 644 645 646 647
	while (bus->parent) {
		if ((child->subordinate > bus->subordinate) ||
		    (child->number > bus->subordinate) ||
		    (child->number < bus->number) ||
		    (child->subordinate < bus->number)) {
648
			pr_debug("PCI: Bus #%02x (-#%02x) is %s "
649 650 651 652
				"hidden behind%s bridge #%02x (-#%02x)\n",
				child->number, child->subordinate,
				(bus->number > child->subordinate &&
				 bus->subordinate < child->number) ?
653 654
					"wholly" : "partially",
				bus->self->transparent ? " transparent" : "",
655
				bus->number, bus->subordinate);
656 657 658 659
		}
		bus = bus->parent;
	}

660 661 662
out:
	pci_write_config_word(dev, PCI_BRIDGE_CONTROL, bctl);

L
Linus Torvalds 已提交
663 664 665 666 667 668 669 670 671 672 673 674
	return max;
}

/*
 * Read interrupt line and base address registers.
 * The architecture-dependent code can tweak these, of course.
 */
static void pci_read_irq(struct pci_dev *dev)
{
	unsigned char irq;

	pci_read_config_byte(dev, PCI_INTERRUPT_PIN, &irq);
675
	dev->pin = irq;
L
Linus Torvalds 已提交
676 677 678 679 680
	if (irq)
		pci_read_config_byte(dev, PCI_INTERRUPT_LINE, &irq);
	dev->irq = irq;
}

Y
Yu Zhao 已提交
681 682 683 684 685 686 687 688 689 690 691 692 693
static void set_pcie_port_type(struct pci_dev *pdev)
{
	int pos;
	u16 reg16;

	pos = pci_find_capability(pdev, PCI_CAP_ID_EXP);
	if (!pos)
		return;
	pdev->is_pcie = 1;
	pci_read_config_word(pdev, pos + PCI_EXP_FLAGS, &reg16);
	pdev->pcie_type = (reg16 & PCI_EXP_FLAGS_TYPE) >> 4;
}

694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710
static void set_pcie_hotplug_bridge(struct pci_dev *pdev)
{
	int pos;
	u16 reg16;
	u32 reg32;

	pos = pci_find_capability(pdev, PCI_CAP_ID_EXP);
	if (!pos)
		return;
	pci_read_config_word(pdev, pos + PCI_EXP_FLAGS, &reg16);
	if (!(reg16 & PCI_EXP_FLAGS_SLOT))
		return;
	pci_read_config_dword(pdev, pos + PCI_EXP_SLTCAP, &reg32);
	if (reg32 & PCI_EXP_SLTCAP_HPC)
		pdev->is_hotplug_bridge = 1;
}

711 712 713 714 715 716
static void set_pci_aer_firmware_first(struct pci_dev *pdev)
{
	if (acpi_hest_firmware_first_pci(pdev))
		pdev->aer_firmware_first = 1;
}

717
#define LEGACY_IO_RESOURCE	(IORESOURCE_IO | IORESOURCE_PCI_FIXED)
718

L
Linus Torvalds 已提交
719 720 721 722 723 724 725
/**
 * pci_setup_device - fill in class and map information of a device
 * @dev: the device structure to fill
 *
 * Initialize the device structure with information about the device's 
 * vendor,class,memory and IO-space addresses,IRQ lines etc.
 * Called at initialisation of the PCI subsystem and by CardBus services.
Y
Yu Zhao 已提交
726 727
 * Returns 0 on success and negative if unknown type of device (not normal,
 * bridge or CardBus).
L
Linus Torvalds 已提交
728
 */
Y
Yu Zhao 已提交
729
int pci_setup_device(struct pci_dev *dev)
L
Linus Torvalds 已提交
730 731
{
	u32 class;
Y
Yu Zhao 已提交
732 733
	u8 hdr_type;
	struct pci_slot *slot;
734
	int pos = 0;
Y
Yu Zhao 已提交
735 736 737 738 739 740 741 742 743 744 745

	if (pci_read_config_byte(dev, PCI_HEADER_TYPE, &hdr_type))
		return -EIO;

	dev->sysdata = dev->bus->sysdata;
	dev->dev.parent = dev->bus->bridge;
	dev->dev.bus = &pci_bus_type;
	dev->hdr_type = hdr_type & 0x7f;
	dev->multifunction = !!(hdr_type & 0x80);
	dev->error_state = pci_channel_io_normal;
	set_pcie_port_type(dev);
746
	set_pci_aer_firmware_first(dev);
Y
Yu Zhao 已提交
747 748 749 750 751 752 753 754

	list_for_each_entry(slot, &dev->bus->slots, list)
		if (PCI_SLOT(dev->devfn) == slot->number)
			dev->slot = slot;

	/* Assume 32-bit PCI; let 64-bit PCI cards (which are far rarer)
	   set this higher, assuming the system even supports it.  */
	dev->dma_mask = 0xffffffff;
L
Linus Torvalds 已提交
755

756 757 758
	dev_set_name(&dev->dev, "%04x:%02x:%02x.%d", pci_domain_nr(dev->bus),
		     dev->bus->number, PCI_SLOT(dev->devfn),
		     PCI_FUNC(dev->devfn));
L
Linus Torvalds 已提交
759 760

	pci_read_config_dword(dev, PCI_CLASS_REVISION, &class);
A
Auke Kok 已提交
761
	dev->revision = class & 0xff;
L
Linus Torvalds 已提交
762 763 764 765
	class >>= 8;				    /* upper 3 bytes */
	dev->class = class;
	class >>= 8;

766
	dev_dbg(&dev->dev, "found [%04x:%04x] class %06x header type %02x\n",
L
Linus Torvalds 已提交
767 768
		 dev->vendor, dev->device, class, dev->hdr_type);

769 770 771
	/* need to have dev->class ready */
	dev->cfg_size = pci_cfg_space_size(dev);

L
Linus Torvalds 已提交
772
	/* "Unknown power state" */
773
	dev->current_state = PCI_UNKNOWN;
L
Linus Torvalds 已提交
774 775 776

	/* Early fixups, before probing the BARs */
	pci_fixup_device(pci_fixup_early, dev);
777 778
	/* device class may be changed after fixup */
	class = dev->class >> 8;
L
Linus Torvalds 已提交
779 780 781 782 783 784 785 786 787

	switch (dev->hdr_type) {		    /* header type */
	case PCI_HEADER_TYPE_NORMAL:		    /* standard header */
		if (class == PCI_CLASS_BRIDGE_PCI)
			goto bad;
		pci_read_irq(dev);
		pci_read_bases(dev, 6, PCI_ROM_ADDRESS);
		pci_read_config_word(dev, PCI_SUBSYSTEM_VENDOR_ID, &dev->subsystem_vendor);
		pci_read_config_word(dev, PCI_SUBSYSTEM_ID, &dev->subsystem_device);
788 789 790 791 792 793 794 795 796 797 798

		/*
		 *	Do the ugly legacy mode stuff here rather than broken chip
		 *	quirk code. Legacy mode ATA controllers have fixed
		 *	addresses. These are not always echoed in BAR0-3, and
		 *	BAR0-3 in a few cases contain junk!
		 */
		if (class == PCI_CLASS_STORAGE_IDE) {
			u8 progif;
			pci_read_config_byte(dev, PCI_CLASS_PROG, &progif);
			if ((progif & 1) == 0) {
799 800 801 802 803 804
				dev->resource[0].start = 0x1F0;
				dev->resource[0].end = 0x1F7;
				dev->resource[0].flags = LEGACY_IO_RESOURCE;
				dev->resource[1].start = 0x3F6;
				dev->resource[1].end = 0x3F6;
				dev->resource[1].flags = LEGACY_IO_RESOURCE;
805 806
			}
			if ((progif & 4) == 0) {
807 808 809 810 811 812
				dev->resource[2].start = 0x170;
				dev->resource[2].end = 0x177;
				dev->resource[2].flags = LEGACY_IO_RESOURCE;
				dev->resource[3].start = 0x376;
				dev->resource[3].end = 0x376;
				dev->resource[3].flags = LEGACY_IO_RESOURCE;
813 814
			}
		}
L
Linus Torvalds 已提交
815 816 817 818 819 820 821 822
		break;

	case PCI_HEADER_TYPE_BRIDGE:		    /* bridge header */
		if (class != PCI_CLASS_BRIDGE_PCI)
			goto bad;
		/* The PCI-to-PCI bridge spec requires that subtractive
		   decoding (i.e. transparent) bridge must have programming
		   interface code of 0x01. */ 
823
		pci_read_irq(dev);
L
Linus Torvalds 已提交
824 825
		dev->transparent = ((dev->class & 0xff) == 1);
		pci_read_bases(dev, 2, PCI_ROM_ADDRESS1);
826
		set_pcie_hotplug_bridge(dev);
827 828 829 830 831
		pos = pci_find_capability(dev, PCI_CAP_ID_SSVID);
		if (pos) {
			pci_read_config_word(dev, pos + PCI_SSVID_VENDOR_ID, &dev->subsystem_vendor);
			pci_read_config_word(dev, pos + PCI_SSVID_DEVICE_ID, &dev->subsystem_device);
		}
L
Linus Torvalds 已提交
832 833 834 835 836 837 838 839 840 841 842 843
		break;

	case PCI_HEADER_TYPE_CARDBUS:		    /* CardBus bridge header */
		if (class != PCI_CLASS_BRIDGE_CARDBUS)
			goto bad;
		pci_read_irq(dev);
		pci_read_bases(dev, 1, 0);
		pci_read_config_word(dev, PCI_CB_SUBSYSTEM_VENDOR_ID, &dev->subsystem_vendor);
		pci_read_config_word(dev, PCI_CB_SUBSYSTEM_ID, &dev->subsystem_device);
		break;

	default:				    /* unknown header */
844 845
		dev_err(&dev->dev, "unknown header type %02x, "
			"ignoring device\n", dev->hdr_type);
Y
Yu Zhao 已提交
846
		return -EIO;
L
Linus Torvalds 已提交
847 848

	bad:
849 850
		dev_err(&dev->dev, "ignoring class %02x (doesn't match header "
			"type %02x)\n", class, dev->hdr_type);
L
Linus Torvalds 已提交
851 852 853 854 855 856 857
		dev->class = PCI_CLASS_NOT_DEFINED;
	}

	/* We found a fine healthy device, go go go... */
	return 0;
}

858 859 860
static void pci_release_capabilities(struct pci_dev *dev)
{
	pci_vpd_release(dev);
861
	pci_iov_release(dev);
862 863
}

L
Linus Torvalds 已提交
864 865 866 867 868 869 870 871 872 873 874 875
/**
 * pci_release_dev - free a pci device structure when all users of it are finished.
 * @dev: device that's been disconnected
 *
 * Will be called only by the device core when all users of this pci device are
 * done.
 */
static void pci_release_dev(struct device *dev)
{
	struct pci_dev *pci_dev;

	pci_dev = to_pci_dev(dev);
876
	pci_release_capabilities(pci_dev);
L
Linus Torvalds 已提交
877 878 879 880 881
	kfree(pci_dev);
}

/**
 * pci_cfg_space_size - get the configuration space size of the PCI device.
R
Randy Dunlap 已提交
882
 * @dev: PCI device
L
Linus Torvalds 已提交
883 884 885 886 887 888 889 890
 *
 * Regular PCI devices have 256 bytes, but PCI-X 2 and PCI Express devices
 * have 4096 bytes.  Even if the device is capable, that doesn't mean we can
 * access it.  Maybe we don't have a way to generate extended config space
 * accesses, or the device is behind a reverse Express bridge.  So we try
 * reading the dword at 0x100 which must either be 0 or a valid extended
 * capability header.
 */
891
int pci_cfg_space_size_ext(struct pci_dev *dev)
L
Linus Torvalds 已提交
892 893
{
	u32 status;
894
	int pos = PCI_CFG_SPACE_SIZE;
L
Linus Torvalds 已提交
895

896
	if (pci_read_config_dword(dev, pos, &status) != PCIBIOS_SUCCESSFUL)
897 898 899 900 901 902 903 904 905 906 907 908 909 910
		goto fail;
	if (status == 0xffffffff)
		goto fail;

	return PCI_CFG_SPACE_EXP_SIZE;

 fail:
	return PCI_CFG_SPACE_SIZE;
}

int pci_cfg_space_size(struct pci_dev *dev)
{
	int pos;
	u32 status;
911 912 913 914 915
	u16 class;

	class = dev->class >> 8;
	if (class == PCI_CLASS_BRIDGE_HOST)
		return pci_cfg_space_size_ext(dev);
916

L
Linus Torvalds 已提交
917 918 919 920 921 922 923 924 925 926 927
	pos = pci_find_capability(dev, PCI_CAP_ID_EXP);
	if (!pos) {
		pos = pci_find_capability(dev, PCI_CAP_ID_PCIX);
		if (!pos)
			goto fail;

		pci_read_config_dword(dev, pos + PCI_X_STATUS, &status);
		if (!(status & (PCI_X_STATUS_266MHZ | PCI_X_STATUS_533MHZ)))
			goto fail;
	}

928
	return pci_cfg_space_size_ext(dev);
L
Linus Torvalds 已提交
929 930 931 932 933 934 935 936 937 938

 fail:
	return PCI_CFG_SPACE_SIZE;
}

static void pci_release_bus_bridge_dev(struct device *dev)
{
	kfree(dev);
}

939 940 941 942 943 944 945 946 947 948 949 950 951 952
struct pci_dev *alloc_pci_dev(void)
{
	struct pci_dev *dev;

	dev = kzalloc(sizeof(struct pci_dev), GFP_KERNEL);
	if (!dev)
		return NULL;

	INIT_LIST_HEAD(&dev->bus_list);

	return dev;
}
EXPORT_SYMBOL(alloc_pci_dev);

L
Linus Torvalds 已提交
953 954 955 956
/*
 * Read the config data for a PCI device, sanity-check it
 * and fill in the dev structure...
 */
957
static struct pci_dev *pci_scan_device(struct pci_bus *bus, int devfn)
L
Linus Torvalds 已提交
958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978
{
	struct pci_dev *dev;
	u32 l;
	int delay = 1;

	if (pci_bus_read_config_dword(bus, devfn, PCI_VENDOR_ID, &l))
		return NULL;

	/* some broken boards return 0 or ~0 if a slot is empty: */
	if (l == 0xffffffff || l == 0x00000000 ||
	    l == 0x0000ffff || l == 0xffff0000)
		return NULL;

	/* Configuration request Retry Status */
	while (l == 0xffff0001) {
		msleep(delay);
		delay *= 2;
		if (pci_bus_read_config_dword(bus, devfn, PCI_VENDOR_ID, &l))
			return NULL;
		/* Card hasn't responded in 60 seconds?  Must be stuck. */
		if (delay > 60 * 1000) {
979
			printk(KERN_WARNING "pci %04x:%02x:%02x.%d: not "
L
Linus Torvalds 已提交
980 981 982 983 984 985 986
					"responding\n", pci_domain_nr(bus),
					bus->number, PCI_SLOT(devfn),
					PCI_FUNC(devfn));
			return NULL;
		}
	}

987
	dev = alloc_pci_dev();
L
Linus Torvalds 已提交
988 989 990 991 992 993 994
	if (!dev)
		return NULL;

	dev->bus = bus;
	dev->devfn = devfn;
	dev->vendor = l & 0xffff;
	dev->device = (l >> 16) & 0xffff;
995

Y
Yu Zhao 已提交
996
	if (pci_setup_device(dev)) {
L
Linus Torvalds 已提交
997 998 999 1000 1001 1002 1003
		kfree(dev);
		return NULL;
	}

	return dev;
}

1004 1005 1006 1007 1008
static void pci_init_capabilities(struct pci_dev *dev)
{
	/* MSI/MSI-X list */
	pci_msi_init_pci_dev(dev);

1009 1010 1011
	/* Buffers for saving PCIe and PCI-X capabilities */
	pci_allocate_cap_save_buffers(dev);

1012 1013
	/* Power Management */
	pci_pm_init(dev);
1014
	platform_pci_wakeup_init(dev);
1015 1016 1017

	/* Vital Product Data */
	pci_vpd_pci22_init(dev);
Y
Yu Zhao 已提交
1018 1019 1020

	/* Alternative Routing-ID Forwarding */
	pci_enable_ari(dev);
1021 1022 1023

	/* Single Root I/O Virtualization */
	pci_iov_init(dev);
1024 1025

	/* Enable ACS P2P upstream forwarding */
1026
	if (iommu_found() || xen_initial_domain())
1027
		pci_enable_acs(dev);
1028 1029
}

1030
void pci_device_add(struct pci_dev *dev, struct pci_bus *bus)
L
Linus Torvalds 已提交
1031
{
1032 1033 1034
	device_initialize(&dev->dev);
	dev->dev.release = pci_release_dev;
	pci_dev_get(dev);
L
Linus Torvalds 已提交
1035

1036
	dev->dev.dma_mask = &dev->dma_mask;
1037
	dev->dev.dma_parms = &dev->dma_parms;
1038
	dev->dev.coherent_dma_mask = 0xffffffffull;
L
Linus Torvalds 已提交
1039

1040
	pci_set_dma_max_seg_size(dev, 65536);
1041
	pci_set_dma_seg_boundary(dev, 0xffffffff);
1042

L
Linus Torvalds 已提交
1043 1044 1045
	/* Fix up broken headers */
	pci_fixup_device(pci_fixup_header, dev);

1046 1047 1048
	/* Clear the state_saved flag. */
	dev->state_saved = false;

1049 1050
	/* Initialize various capabilities */
	pci_init_capabilities(dev);
1051

L
Linus Torvalds 已提交
1052 1053 1054 1055
	/*
	 * Add the device to our list of discovered devices
	 * and the bus list for fixup functions, etc.
	 */
1056
	down_write(&pci_bus_sem);
L
Linus Torvalds 已提交
1057
	list_add_tail(&dev->bus_list, &bus->devices);
1058
	up_write(&pci_bus_sem);
1059 1060
}

1061
struct pci_dev *__ref pci_scan_single_device(struct pci_bus *bus, int devfn)
1062 1063 1064
{
	struct pci_dev *dev;

T
Trent Piepho 已提交
1065 1066 1067 1068 1069 1070
	dev = pci_get_slot(bus, devfn);
	if (dev) {
		pci_dev_put(dev);
		return dev;
	}

1071 1072 1073 1074 1075
	dev = pci_scan_device(bus, devfn);
	if (!dev)
		return NULL;

	pci_device_add(dev, bus);
L
Linus Torvalds 已提交
1076 1077 1078

	return dev;
}
1079
EXPORT_SYMBOL(pci_scan_single_device);
L
Linus Torvalds 已提交
1080 1081 1082 1083 1084 1085 1086 1087

/**
 * pci_scan_slot - scan a PCI slot on a bus for devices.
 * @bus: PCI bus to scan
 * @devfn: slot number to scan (must have zero function.)
 *
 * Scan a PCI slot on the specified PCI bus for devices, adding
 * discovered devices to the @bus->devices list.  New devices
1088
 * will not have is_added set.
1089 1090
 *
 * Returns the number of new devices found.
L
Linus Torvalds 已提交
1091
 */
1092
int pci_scan_slot(struct pci_bus *bus, int devfn)
L
Linus Torvalds 已提交
1093
{
1094 1095
	int fn, nr = 0;
	struct pci_dev *dev;
L
Linus Torvalds 已提交
1096

1097 1098 1099 1100
	dev = pci_scan_single_device(bus, devfn);
	if (dev && !dev->is_added)	/* new device? */
		nr++;

A
Alex Chiang 已提交
1101
	if (dev && dev->multifunction) {
1102 1103 1104 1105 1106 1107
		for (fn = 1; fn < 8; fn++) {
			dev = pci_scan_single_device(bus, devfn + fn);
			if (dev) {
				if (!dev->is_added)
					nr++;
				dev->multifunction = 1;
L
Linus Torvalds 已提交
1108 1109 1110
			}
		}
	}
S
Shaohua Li 已提交
1111

1112 1113
	/* only one slot has pcie device */
	if (bus->self && nr)
S
Shaohua Li 已提交
1114 1115
		pcie_aspm_init_link_state(bus->self);

L
Linus Torvalds 已提交
1116 1117 1118
	return nr;
}

1119
unsigned int __devinit pci_scan_child_bus(struct pci_bus *bus)
L
Linus Torvalds 已提交
1120 1121 1122 1123 1124 1125 1126 1127 1128 1129
{
	unsigned int devfn, pass, max = bus->secondary;
	struct pci_dev *dev;

	pr_debug("PCI: Scanning bus %04x:%02x\n", pci_domain_nr(bus), bus->number);

	/* Go find them, Rover! */
	for (devfn = 0; devfn < 0x100; devfn += 8)
		pci_scan_slot(bus, devfn);

1130 1131 1132
	/* Reserve buses for SR-IOV capability. */
	max += pci_iov_bus_range(bus);

L
Linus Torvalds 已提交
1133 1134 1135 1136
	/*
	 * After performing arch-dependent fixup of the bus, look behind
	 * all PCI-to-PCI bridges on this bus.
	 */
A
Alex Chiang 已提交
1137 1138 1139 1140 1141 1142 1143 1144
	if (!bus->is_added) {
		pr_debug("PCI: Fixups for bus %04x:%02x\n",
			 pci_domain_nr(bus), bus->number);
		pcibios_fixup_bus(bus);
		if (pci_is_root_bus(bus))
			bus->is_added = 1;
	}

L
Linus Torvalds 已提交
1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163
	for (pass=0; pass < 2; pass++)
		list_for_each_entry(dev, &bus->devices, bus_list) {
			if (dev->hdr_type == PCI_HEADER_TYPE_BRIDGE ||
			    dev->hdr_type == PCI_HEADER_TYPE_CARDBUS)
				max = pci_scan_bridge(bus, dev, max, pass);
		}

	/*
	 * We've scanned the bus and so we know all about what's on
	 * the other side of any bridges that may be on this bus plus
	 * any devices.
	 *
	 * Return how far we've got finding sub-buses.
	 */
	pr_debug("PCI: Bus scan for %04x:%02x returning with max=%02x\n",
		pci_domain_nr(bus), bus->number, max);
	return max;
}

1164
struct pci_bus * pci_create_bus(struct device *parent,
1165
		int bus, struct pci_ops *ops, void *sysdata)
L
Linus Torvalds 已提交
1166 1167 1168 1169 1170 1171 1172 1173 1174
{
	int error;
	struct pci_bus *b;
	struct device *dev;

	b = pci_alloc_bus();
	if (!b)
		return NULL;

1175
	dev = kzalloc(sizeof(*dev), GFP_KERNEL);
L
Linus Torvalds 已提交
1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188
	if (!dev){
		kfree(b);
		return NULL;
	}

	b->sysdata = sysdata;
	b->ops = ops;

	if (pci_find_bus(pci_domain_nr(b), bus)) {
		/* If we already got to this bus through a different bridge, ignore it */
		pr_debug("PCI: Bus %04x:%02x already known\n", pci_domain_nr(b), bus);
		goto err_out;
	}
1189 1190

	down_write(&pci_bus_sem);
L
Linus Torvalds 已提交
1191
	list_add_tail(&b->node, &pci_root_buses);
1192
	up_write(&pci_bus_sem);
L
Linus Torvalds 已提交
1193 1194 1195

	dev->parent = parent;
	dev->release = pci_release_bus_bridge_dev;
1196
	dev_set_name(dev, "pci%04x:%02x", pci_domain_nr(b), bus);
L
Linus Torvalds 已提交
1197 1198 1199 1200 1201
	error = device_register(dev);
	if (error)
		goto dev_reg_err;
	b->bridge = get_device(dev);

1202 1203 1204
	if (!parent)
		set_dev_node(b->bridge, pcibus_to_node(b));

1205 1206
	b->dev.class = &pcibus_class;
	b->dev.parent = b->bridge;
1207
	dev_set_name(&b->dev, "%04x:%02x", pci_domain_nr(b), bus);
1208
	error = device_register(&b->dev);
L
Linus Torvalds 已提交
1209 1210
	if (error)
		goto class_dev_reg_err;
1211
	error = device_create_file(&b->dev, &dev_attr_cpuaffinity);
L
Linus Torvalds 已提交
1212
	if (error)
1213
		goto dev_create_file_err;
L
Linus Torvalds 已提交
1214 1215 1216 1217 1218 1219 1220 1221 1222 1223

	/* Create legacy_io and legacy_mem files for this bus */
	pci_create_legacy_files(b);

	b->number = b->secondary = bus;
	b->resource[0] = &ioport_resource;
	b->resource[1] = &iomem_resource;

	return b;

1224 1225
dev_create_file_err:
	device_unregister(&b->dev);
L
Linus Torvalds 已提交
1226 1227 1228
class_dev_reg_err:
	device_unregister(dev);
dev_reg_err:
1229
	down_write(&pci_bus_sem);
L
Linus Torvalds 已提交
1230
	list_del(&b->node);
1231
	up_write(&pci_bus_sem);
L
Linus Torvalds 已提交
1232 1233 1234 1235 1236
err_out:
	kfree(dev);
	kfree(b);
	return NULL;
}
1237

1238
struct pci_bus * __devinit pci_scan_bus_parented(struct device *parent,
1239 1240 1241 1242 1243 1244 1245 1246 1247
		int bus, struct pci_ops *ops, void *sysdata)
{
	struct pci_bus *b;

	b = pci_create_bus(parent, bus, ops, sysdata);
	if (b)
		b->subordinate = pci_scan_child_bus(b);
	return b;
}
L
Linus Torvalds 已提交
1248 1249 1250
EXPORT_SYMBOL(pci_scan_bus_parented);

#ifdef CONFIG_HOTPLUG
A
Alex Chiang 已提交
1251 1252 1253 1254 1255 1256 1257 1258 1259
/**
 * pci_rescan_bus - scan a PCI bus for devices.
 * @bus: PCI bus to scan
 *
 * Scan a PCI bus and child buses for new devices, adds them,
 * and enables them.
 *
 * Returns the max number of subordinate bus discovered.
 */
1260
unsigned int __ref pci_rescan_bus(struct pci_bus *bus)
A
Alex Chiang 已提交
1261 1262 1263 1264 1265 1266
{
	unsigned int max;
	struct pci_dev *dev;

	max = pci_scan_child_bus(bus);

A
Alex Chiang 已提交
1267
	down_read(&pci_bus_sem);
A
Alex Chiang 已提交
1268 1269 1270 1271 1272
	list_for_each_entry(dev, &bus->devices, bus_list)
		if (dev->hdr_type == PCI_HEADER_TYPE_BRIDGE ||
		    dev->hdr_type == PCI_HEADER_TYPE_CARDBUS)
			if (dev->subordinate)
				pci_bus_size_bridges(dev->subordinate);
A
Alex Chiang 已提交
1273
	up_read(&pci_bus_sem);
A
Alex Chiang 已提交
1274 1275 1276 1277 1278 1279 1280 1281 1282

	pci_bus_assign_resources(bus);
	pci_enable_bridges(bus);
	pci_bus_add_devices(bus);

	return max;
}
EXPORT_SYMBOL_GPL(pci_rescan_bus);

L
Linus Torvalds 已提交
1283 1284 1285 1286 1287
EXPORT_SYMBOL(pci_add_new_bus);
EXPORT_SYMBOL(pci_scan_slot);
EXPORT_SYMBOL(pci_scan_bridge);
EXPORT_SYMBOL_GPL(pci_scan_child_bus);
#endif
1288

1289
static int __init pci_sort_bf_cmp(const struct device *d_a, const struct device *d_b)
1290
{
1291 1292 1293
	const struct pci_dev *a = to_pci_dev(d_a);
	const struct pci_dev *b = to_pci_dev(d_b);

1294 1295 1296 1297 1298 1299 1300 1301 1302 1303 1304 1305
	if      (pci_domain_nr(a->bus) < pci_domain_nr(b->bus)) return -1;
	else if (pci_domain_nr(a->bus) > pci_domain_nr(b->bus)) return  1;

	if      (a->bus->number < b->bus->number) return -1;
	else if (a->bus->number > b->bus->number) return  1;

	if      (a->devfn < b->devfn) return -1;
	else if (a->devfn > b->devfn) return  1;

	return 0;
}

1306
void __init pci_sort_breadthfirst(void)
1307
{
1308
	bus_sort_breadthfirst(&pci_bus_type, &pci_sort_bf_cmp);
1309
}