probe.c 51.0 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11
/*
 * probe.c - PCI detection and setup code
 */

#include <linux/kernel.h>
#include <linux/delay.h>
#include <linux/init.h>
#include <linux/pci.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <linux/cpumask.h>
S
Shaohua Li 已提交
12
#include <linux/pci-aspm.h>
13
#include <asm-generic/pci-bridge.h>
14
#include "pci.h"
L
Linus Torvalds 已提交
15 16 17 18

#define CARDBUS_LATENCY_TIMER	176	/* secondary latency timer */
#define CARDBUS_RESERVE_BUSNR	3

Y
Yinghai Lu 已提交
19 20 21 22 23 24 25
struct resource busn_resource = {
	.name	= "PCI busn",
	.start	= 0,
	.end	= 255,
	.flags	= IORESOURCE_BUS,
};

L
Linus Torvalds 已提交
26 27 28 29
/* Ugh.  Need to stop exporting this to modules. */
LIST_HEAD(pci_root_buses);
EXPORT_SYMBOL(pci_root_buses);

30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59
static LIST_HEAD(pci_domain_busn_res_list);

struct pci_domain_busn_res {
	struct list_head list;
	struct resource res;
	int domain_nr;
};

static struct resource *get_pci_domain_busn_res(int domain_nr)
{
	struct pci_domain_busn_res *r;

	list_for_each_entry(r, &pci_domain_busn_res_list, list)
		if (r->domain_nr == domain_nr)
			return &r->res;

	r = kzalloc(sizeof(*r), GFP_KERNEL);
	if (!r)
		return NULL;

	r->domain_nr = domain_nr;
	r->res.start = 0;
	r->res.end = 0xff;
	r->res.flags = IORESOURCE_BUS | IORESOURCE_PCI_FIXED;

	list_add_tail(&r->list, &pci_domain_busn_res_list);

	return &r->res;
}

60 61 62 63
static int find_anything(struct device *dev, void *data)
{
	return 1;
}
L
Linus Torvalds 已提交
64

Z
Zhang, Yanmin 已提交
65 66 67
/*
 * Some device drivers need know if pci is initiated.
 * Basically, we think pci is not initiated when there
68
 * is no device to be found on the pci_bus_type.
Z
Zhang, Yanmin 已提交
69 70 71
 */
int no_pci_devices(void)
{
72 73
	struct device *dev;
	int no_devices;
Z
Zhang, Yanmin 已提交
74

75 76 77 78 79
	dev = bus_find_device(&pci_bus_type, NULL, NULL, find_anything);
	no_devices = (dev == NULL);
	put_device(dev);
	return no_devices;
}
Z
Zhang, Yanmin 已提交
80 81
EXPORT_SYMBOL(no_pci_devices);

L
Linus Torvalds 已提交
82 83 84
/*
 * PCI Bus Class
 */
85
static void release_pcibus_dev(struct device *dev)
L
Linus Torvalds 已提交
86
{
87
	struct pci_bus *pci_bus = to_pci_bus(dev);
L
Linus Torvalds 已提交
88 89 90

	if (pci_bus->bridge)
		put_device(pci_bus->bridge);
91
	pci_bus_remove_resources(pci_bus);
92
	pci_release_bus_of_node(pci_bus);
L
Linus Torvalds 已提交
93 94 95 96 97
	kfree(pci_bus);
}

static struct class pcibus_class = {
	.name		= "pci_bus",
98
	.dev_release	= &release_pcibus_dev,
99
	.dev_attrs	= pcibus_dev_attrs,
L
Linus Torvalds 已提交
100 101 102 103 104 105 106 107
};

static int __init pcibus_class_init(void)
{
	return class_register(&pcibus_class);
}
postcore_initcall(pcibus_class_init);

108
static u64 pci_size(u64 base, u64 maxbase, u64 mask)
L
Linus Torvalds 已提交
109
{
110
	u64 size = mask & maxbase;	/* Find the significant bits */
L
Linus Torvalds 已提交
111 112 113 114 115 116 117 118 119 120 121 122 123 124 125
	if (!size)
		return 0;

	/* Get the lowest of them to find the decode size, and
	   from that the extent.  */
	size = (size & ~(size-1)) - 1;

	/* base == maxbase can be valid only if the BAR has
	   already been programmed with all 1s.  */
	if (base == maxbase && ((base | size) & mask) != mask)
		return 0;

	return size;
}

126
static inline unsigned long decode_bar(struct pci_dev *dev, u32 bar)
127
{
128
	u32 mem_type;
129
	unsigned long flags;
130

131
	if ((bar & PCI_BASE_ADDRESS_SPACE) == PCI_BASE_ADDRESS_SPACE_IO) {
132 133 134
		flags = bar & ~PCI_BASE_ADDRESS_IO_MASK;
		flags |= IORESOURCE_IO;
		return flags;
135
	}
136

137 138 139 140
	flags = bar & ~PCI_BASE_ADDRESS_MEM_MASK;
	flags |= IORESOURCE_MEM;
	if (flags & PCI_BASE_ADDRESS_MEM_PREFETCH)
		flags |= IORESOURCE_PREFETCH;
141

142 143 144 145 146
	mem_type = bar & PCI_BASE_ADDRESS_MEM_TYPE_MASK;
	switch (mem_type) {
	case PCI_BASE_ADDRESS_MEM_TYPE_32:
		break;
	case PCI_BASE_ADDRESS_MEM_TYPE_1M:
147
		/* 1M mem BAR treated as 32-bit BAR */
148 149
		break;
	case PCI_BASE_ADDRESS_MEM_TYPE_64:
150 151
		flags |= IORESOURCE_MEM_64;
		break;
152
	default:
153
		/* mem unknown type treated as 32-bit BAR */
154 155
		break;
	}
156
	return flags;
157 158
}

Y
Yu Zhao 已提交
159 160 161 162 163 164 165 166
/**
 * pci_read_base - read a PCI BAR
 * @dev: the PCI device
 * @type: type of the BAR
 * @res: resource buffer to be filled in
 * @pos: BAR position in the config space
 *
 * Returns 1 if the BAR is 64-bit, or 0 if 32-bit.
167
 */
Y
Yu Zhao 已提交
168
int __pci_read_base(struct pci_dev *dev, enum pci_bar_type type,
169
			struct resource *res, unsigned int pos)
170
{
171
	u32 l, sz, mask;
J
Jacob Pan 已提交
172
	u16 orig_cmd;
173
	struct pci_bus_region region, inverted_region;
174
	bool bar_too_big = false, bar_disabled = false;
175

176
	mask = type ? PCI_ROM_ADDRESS_MASK : ~0;
177

178
	/* No printks while decoding is disabled! */
J
Jacob Pan 已提交
179 180 181 182 183 184
	if (!dev->mmio_always_on) {
		pci_read_config_word(dev, PCI_COMMAND, &orig_cmd);
		pci_write_config_word(dev, PCI_COMMAND,
			orig_cmd & ~(PCI_COMMAND_MEMORY | PCI_COMMAND_IO));
	}

185 186 187
	res->name = pci_name(dev);

	pci_read_config_dword(dev, pos, &l);
188
	pci_write_config_dword(dev, pos, l | mask);
189 190 191 192 193
	pci_read_config_dword(dev, pos, &sz);
	pci_write_config_dword(dev, pos, l);

	/*
	 * All bits set in sz means the device isn't working properly.
194 195 196
	 * If the BAR isn't implemented, all bits must be 0.  If it's a
	 * memory BAR or a ROM, bit 0 must be clear; if it's an io BAR, bit
	 * 1 must be clear.
197
	 */
198
	if (!sz || sz == 0xffffffff)
199 200 201 202 203 204 205 206 207 208
		goto fail;

	/*
	 * I don't know how l can have all bits set.  Copied from old code.
	 * Maybe it fixes a bug on some ancient platform.
	 */
	if (l == 0xffffffff)
		l = 0;

	if (type == pci_bar_unknown) {
209 210 211
		res->flags = decode_bar(dev, l);
		res->flags |= IORESOURCE_SIZEALIGN;
		if (res->flags & IORESOURCE_IO) {
212
			l &= PCI_BASE_ADDRESS_IO_MASK;
213
			mask = PCI_BASE_ADDRESS_IO_MASK & (u32) IO_SPACE_LIMIT;
214 215 216 217 218 219 220 221 222 223
		} else {
			l &= PCI_BASE_ADDRESS_MEM_MASK;
			mask = (u32)PCI_BASE_ADDRESS_MEM_MASK;
		}
	} else {
		res->flags |= (l & IORESOURCE_ROM_ENABLE);
		l &= PCI_ROM_ADDRESS_MASK;
		mask = (u32)PCI_ROM_ADDRESS_MASK;
	}

224
	if (res->flags & IORESOURCE_MEM_64) {
225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241
		u64 l64 = l;
		u64 sz64 = sz;
		u64 mask64 = mask | (u64)~0 << 32;

		pci_read_config_dword(dev, pos + 4, &l);
		pci_write_config_dword(dev, pos + 4, ~0);
		pci_read_config_dword(dev, pos + 4, &sz);
		pci_write_config_dword(dev, pos + 4, l);

		l64 |= ((u64)l << 32);
		sz64 |= ((u64)sz << 32);

		sz64 = pci_size(l64, sz64, mask64);

		if (!sz64)
			goto fail;

242
		if ((sizeof(resource_size_t) < 8) && (sz64 > 0x100000000ULL)) {
243
			bar_too_big = true;
244
			goto fail;
245 246 247
		}

		if ((sizeof(resource_size_t) < 8) && l) {
248 249 250
			/* Address above 32-bit boundary; disable the BAR */
			pci_write_config_dword(dev, pos, 0);
			pci_write_config_dword(dev, pos + 4, 0);
251 252
			region.start = 0;
			region.end = sz64;
253
			bar_disabled = true;
254
		} else {
255 256
			region.start = l64;
			region.end = l64 + sz64;
257 258
		}
	} else {
259
		sz = pci_size(l, sz, mask);
260

261
		if (!sz)
262 263
			goto fail;

264 265
		region.start = l;
		region.end = l + sz;
266 267
	}

268
	pcibios_bus_to_resource(dev, res, &region);
269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288
	pcibios_resource_to_bus(dev, &inverted_region, res);

	/*
	 * If "A" is a BAR value (a bus address), "bus_to_resource(A)" is
	 * the corresponding resource address (the physical address used by
	 * the CPU.  Converting that resource address back to a bus address
	 * should yield the original BAR value:
	 *
	 *     resource_to_bus(bus_to_resource(A)) == A
	 *
	 * If it doesn't, CPU accesses to "bus_to_resource(A)" will not
	 * be claimed by the device.
	 */
	if (inverted_region.start != region.start) {
		dev_info(&dev->dev, "reg 0x%x: initial BAR value %pa invalid; forcing reassignment\n",
			 pos, &region.start);
		res->flags |= IORESOURCE_UNSET;
		res->end -= res->start;
		res->start = 0;
	}
289

290 291 292 293 294 295
	goto out;


fail:
	res->flags = 0;
out:
296 297 298
	if (!dev->mmio_always_on)
		pci_write_config_word(dev, PCI_COMMAND, orig_cmd);

299
	if (bar_too_big)
300
		dev_err(&dev->dev, "reg 0x%x: can't handle 64-bit BAR\n", pos);
301
	if (res->flags && !bar_disabled)
302
		dev_printk(KERN_DEBUG, &dev->dev, "reg 0x%x: %pR\n", pos, res);
303

304
	return (res->flags & IORESOURCE_MEM_64) ? 1 : 0;
305 306
}

L
Linus Torvalds 已提交
307 308
static void pci_read_bases(struct pci_dev *dev, unsigned int howmany, int rom)
{
309
	unsigned int pos, reg;
310

311 312
	for (pos = 0; pos < howmany; pos++) {
		struct resource *res = &dev->resource[pos];
L
Linus Torvalds 已提交
313
		reg = PCI_BASE_ADDRESS_0 + (pos << 2);
314
		pos += __pci_read_base(dev, pci_bar_unknown, res, reg);
L
Linus Torvalds 已提交
315
	}
316

L
Linus Torvalds 已提交
317
	if (rom) {
318
		struct resource *res = &dev->resource[PCI_ROM_RESOURCE];
L
Linus Torvalds 已提交
319
		dev->rom_base_reg = rom;
320 321 322 323
		res->flags = IORESOURCE_MEM | IORESOURCE_PREFETCH |
				IORESOURCE_READONLY | IORESOURCE_CACHEABLE |
				IORESOURCE_SIZEALIGN;
		__pci_read_base(dev, pci_bar_mem32, res, rom);
L
Linus Torvalds 已提交
324 325 326
	}
}

B
Bill Pemberton 已提交
327
static void pci_read_bridge_io(struct pci_bus *child)
L
Linus Torvalds 已提交
328 329 330
{
	struct pci_dev *dev = child->self;
	u8 io_base_lo, io_limit_lo;
331
	unsigned long io_mask, io_granularity, base, limit;
332
	struct pci_bus_region region;
333 334 335 336 337 338 339 340 341
	struct resource *res;

	io_mask = PCI_IO_RANGE_MASK;
	io_granularity = 0x1000;
	if (dev->io_window_1k) {
		/* Support 1K I/O space granularity */
		io_mask = PCI_IO_1K_RANGE_MASK;
		io_granularity = 0x400;
	}
L
Linus Torvalds 已提交
342 343 344 345

	res = child->resource[0];
	pci_read_config_byte(dev, PCI_IO_BASE, &io_base_lo);
	pci_read_config_byte(dev, PCI_IO_LIMIT, &io_limit_lo);
346 347
	base = (io_base_lo & io_mask) << 8;
	limit = (io_limit_lo & io_mask) << 8;
L
Linus Torvalds 已提交
348 349 350

	if ((io_base_lo & PCI_IO_RANGE_TYPE_MASK) == PCI_IO_RANGE_TYPE_32) {
		u16 io_base_hi, io_limit_hi;
351

L
Linus Torvalds 已提交
352 353
		pci_read_config_word(dev, PCI_IO_BASE_UPPER16, &io_base_hi);
		pci_read_config_word(dev, PCI_IO_LIMIT_UPPER16, &io_limit_hi);
354 355
		base |= ((unsigned long) io_base_hi << 16);
		limit |= ((unsigned long) io_limit_hi << 16);
L
Linus Torvalds 已提交
356 357
	}

358
	if (base <= limit) {
L
Linus Torvalds 已提交
359
		res->flags = (io_base_lo & PCI_IO_RANGE_TYPE_MASK) | IORESOURCE_IO;
360
		region.start = base;
361 362
		region.end = limit + io_granularity - 1;
		pcibios_bus_to_resource(dev, res, &region);
363
		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
L
Linus Torvalds 已提交
364
	}
365 366
}

B
Bill Pemberton 已提交
367
static void pci_read_bridge_mmio(struct pci_bus *child)
368 369 370 371
{
	struct pci_dev *dev = child->self;
	u16 mem_base_lo, mem_limit_lo;
	unsigned long base, limit;
372
	struct pci_bus_region region;
373
	struct resource *res;
L
Linus Torvalds 已提交
374 375 376 377

	res = child->resource[1];
	pci_read_config_word(dev, PCI_MEMORY_BASE, &mem_base_lo);
	pci_read_config_word(dev, PCI_MEMORY_LIMIT, &mem_limit_lo);
378 379
	base = ((unsigned long) mem_base_lo & PCI_MEMORY_RANGE_MASK) << 16;
	limit = ((unsigned long) mem_limit_lo & PCI_MEMORY_RANGE_MASK) << 16;
380
	if (base <= limit) {
L
Linus Torvalds 已提交
381
		res->flags = (mem_base_lo & PCI_MEMORY_RANGE_TYPE_MASK) | IORESOURCE_MEM;
382 383
		region.start = base;
		region.end = limit + 0xfffff;
384
		pcibios_bus_to_resource(dev, res, &region);
385
		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
L
Linus Torvalds 已提交
386
	}
387 388
}

B
Bill Pemberton 已提交
389
static void pci_read_bridge_mmio_pref(struct pci_bus *child)
390 391 392 393
{
	struct pci_dev *dev = child->self;
	u16 mem_base_lo, mem_limit_lo;
	unsigned long base, limit;
394
	struct pci_bus_region region;
395
	struct resource *res;
L
Linus Torvalds 已提交
396 397 398 399

	res = child->resource[2];
	pci_read_config_word(dev, PCI_PREF_MEMORY_BASE, &mem_base_lo);
	pci_read_config_word(dev, PCI_PREF_MEMORY_LIMIT, &mem_limit_lo);
400 401
	base = ((unsigned long) mem_base_lo & PCI_PREF_RANGE_MASK) << 16;
	limit = ((unsigned long) mem_limit_lo & PCI_PREF_RANGE_MASK) << 16;
L
Linus Torvalds 已提交
402 403 404

	if ((mem_base_lo & PCI_PREF_RANGE_TYPE_MASK) == PCI_PREF_RANGE_TYPE_64) {
		u32 mem_base_hi, mem_limit_hi;
405

L
Linus Torvalds 已提交
406 407 408 409 410 411 412 413 414 415
		pci_read_config_dword(dev, PCI_PREF_BASE_UPPER32, &mem_base_hi);
		pci_read_config_dword(dev, PCI_PREF_LIMIT_UPPER32, &mem_limit_hi);

		/*
		 * Some bridges set the base > limit by default, and some
		 * (broken) BIOSes do not initialize them.  If we find
		 * this, just assume they are not being used.
		 */
		if (mem_base_hi <= mem_limit_hi) {
#if BITS_PER_LONG == 64
416 417
			base |= ((unsigned long) mem_base_hi) << 32;
			limit |= ((unsigned long) mem_limit_hi) << 32;
L
Linus Torvalds 已提交
418 419
#else
			if (mem_base_hi || mem_limit_hi) {
420 421
				dev_err(&dev->dev, "can't handle 64-bit "
					"address space for bridge\n");
L
Linus Torvalds 已提交
422 423 424 425 426
				return;
			}
#endif
		}
	}
427
	if (base <= limit) {
428 429 430 431
		res->flags = (mem_base_lo & PCI_PREF_RANGE_TYPE_MASK) |
					 IORESOURCE_MEM | IORESOURCE_PREFETCH;
		if (res->flags & PCI_PREF_RANGE_TYPE_64)
			res->flags |= IORESOURCE_MEM_64;
432 433
		region.start = base;
		region.end = limit + 0xfffff;
434
		pcibios_bus_to_resource(dev, res, &region);
435
		dev_printk(KERN_DEBUG, &dev->dev, "  bridge window %pR\n", res);
L
Linus Torvalds 已提交
436 437 438
	}
}

B
Bill Pemberton 已提交
439
void pci_read_bridge_bases(struct pci_bus *child)
440 441
{
	struct pci_dev *dev = child->self;
442
	struct resource *res;
443 444 445 446 447
	int i;

	if (pci_is_root_bus(child))	/* It's a host bus, nothing to read */
		return;

448 449
	dev_info(&dev->dev, "PCI bridge to %pR%s\n",
		 &child->busn_res,
450 451
		 dev->transparent ? " (subtractive decode)" : "");

452 453 454 455
	pci_bus_remove_resources(child);
	for (i = 0; i < PCI_BRIDGE_RESOURCE_NUM; i++)
		child->resource[i] = &dev->resource[PCI_BRIDGE_RESOURCES+i];

456 457 458
	pci_read_bridge_io(child);
	pci_read_bridge_mmio(child);
	pci_read_bridge_mmio_pref(child);
459 460

	if (dev->transparent) {
461 462 463 464
		pci_bus_for_each_resource(child->parent, res, i) {
			if (res) {
				pci_bus_add_resource(child, res,
						     PCI_SUBTRACTIVE_DECODE);
465 466
				dev_printk(KERN_DEBUG, &dev->dev,
					   "  bridge window %pR (subtractive decode)\n",
467 468
					   res);
			}
469 470
		}
	}
471 472
}

473
static struct pci_bus *pci_alloc_bus(void)
L
Linus Torvalds 已提交
474 475 476
{
	struct pci_bus *b;

477
	b = kzalloc(sizeof(*b), GFP_KERNEL);
478 479 480 481 482 483 484 485 486 487
	if (!b)
		return NULL;

	INIT_LIST_HEAD(&b->node);
	INIT_LIST_HEAD(&b->children);
	INIT_LIST_HEAD(&b->devices);
	INIT_LIST_HEAD(&b->slots);
	INIT_LIST_HEAD(&b->resources);
	b->max_bus_speed = PCI_SPEED_UNKNOWN;
	b->cur_bus_speed = PCI_SPEED_UNKNOWN;
L
Linus Torvalds 已提交
488 489 490
	return b;
}

491 492 493 494 495 496 497 498 499 500 501 502
static void pci_release_host_bridge_dev(struct device *dev)
{
	struct pci_host_bridge *bridge = to_pci_host_bridge(dev);

	if (bridge->release_fn)
		bridge->release_fn(bridge);

	pci_free_resource_list(&bridge->windows);

	kfree(bridge);
}

503 504 505 506 507
static struct pci_host_bridge *pci_alloc_host_bridge(struct pci_bus *b)
{
	struct pci_host_bridge *bridge;

	bridge = kzalloc(sizeof(*bridge), GFP_KERNEL);
508 509
	if (!bridge)
		return NULL;
510

511 512
	INIT_LIST_HEAD(&bridge->windows);
	bridge->bus = b;
513 514 515
	return bridge;
}

516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534
static unsigned char pcix_bus_speed[] = {
	PCI_SPEED_UNKNOWN,		/* 0 */
	PCI_SPEED_66MHz_PCIX,		/* 1 */
	PCI_SPEED_100MHz_PCIX,		/* 2 */
	PCI_SPEED_133MHz_PCIX,		/* 3 */
	PCI_SPEED_UNKNOWN,		/* 4 */
	PCI_SPEED_66MHz_PCIX_ECC,	/* 5 */
	PCI_SPEED_100MHz_PCIX_ECC,	/* 6 */
	PCI_SPEED_133MHz_PCIX_ECC,	/* 7 */
	PCI_SPEED_UNKNOWN,		/* 8 */
	PCI_SPEED_66MHz_PCIX_266,	/* 9 */
	PCI_SPEED_100MHz_PCIX_266,	/* A */
	PCI_SPEED_133MHz_PCIX_266,	/* B */
	PCI_SPEED_UNKNOWN,		/* C */
	PCI_SPEED_66MHz_PCIX_533,	/* D */
	PCI_SPEED_100MHz_PCIX_533,	/* E */
	PCI_SPEED_133MHz_PCIX_533	/* F */
};

535 536 537 538
static unsigned char pcie_link_speed[] = {
	PCI_SPEED_UNKNOWN,		/* 0 */
	PCIE_SPEED_2_5GT,		/* 1 */
	PCIE_SPEED_5_0GT,		/* 2 */
539
	PCIE_SPEED_8_0GT,		/* 3 */
540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555
	PCI_SPEED_UNKNOWN,		/* 4 */
	PCI_SPEED_UNKNOWN,		/* 5 */
	PCI_SPEED_UNKNOWN,		/* 6 */
	PCI_SPEED_UNKNOWN,		/* 7 */
	PCI_SPEED_UNKNOWN,		/* 8 */
	PCI_SPEED_UNKNOWN,		/* 9 */
	PCI_SPEED_UNKNOWN,		/* A */
	PCI_SPEED_UNKNOWN,		/* B */
	PCI_SPEED_UNKNOWN,		/* C */
	PCI_SPEED_UNKNOWN,		/* D */
	PCI_SPEED_UNKNOWN,		/* E */
	PCI_SPEED_UNKNOWN		/* F */
};

void pcie_update_link_speed(struct pci_bus *bus, u16 linksta)
{
556
	bus->cur_bus_speed = pcie_link_speed[linksta & PCI_EXP_LNKSTA_CLS];
557 558 559
}
EXPORT_SYMBOL_GPL(pcie_update_link_speed);

560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591
static unsigned char agp_speeds[] = {
	AGP_UNKNOWN,
	AGP_1X,
	AGP_2X,
	AGP_4X,
	AGP_8X
};

static enum pci_bus_speed agp_speed(int agp3, int agpstat)
{
	int index = 0;

	if (agpstat & 4)
		index = 3;
	else if (agpstat & 2)
		index = 2;
	else if (agpstat & 1)
		index = 1;
	else
		goto out;
	
	if (agp3) {
		index += 2;
		if (index == 5)
			index = 0;
	}

 out:
	return agp_speeds[index];
}


592 593 594 595 596
static void pci_set_bus_speed(struct pci_bus *bus)
{
	struct pci_dev *bridge = bus->self;
	int pos;

597 598 599 600 601 602 603 604 605 606 607 608 609
	pos = pci_find_capability(bridge, PCI_CAP_ID_AGP);
	if (!pos)
		pos = pci_find_capability(bridge, PCI_CAP_ID_AGP3);
	if (pos) {
		u32 agpstat, agpcmd;

		pci_read_config_dword(bridge, pos + PCI_AGP_STATUS, &agpstat);
		bus->max_bus_speed = agp_speed(agpstat & 8, agpstat & 7);

		pci_read_config_dword(bridge, pos + PCI_AGP_COMMAND, &agpcmd);
		bus->cur_bus_speed = agp_speed(agpstat & 8, agpcmd & 7);
	}

610 611 612 613 614
	pos = pci_find_capability(bridge, PCI_CAP_ID_PCIX);
	if (pos) {
		u16 status;
		enum pci_bus_speed max;

615 616 617 618
		pci_read_config_word(bridge, pos + PCI_X_BRIDGE_SSTATUS,
				     &status);

		if (status & PCI_X_SSTATUS_533MHZ) {
619
			max = PCI_SPEED_133MHz_PCIX_533;
620
		} else if (status & PCI_X_SSTATUS_266MHZ) {
621
			max = PCI_SPEED_133MHz_PCIX_266;
622 623
		} else if (status & PCI_X_SSTATUS_133MHZ) {
			if ((status & PCI_X_SSTATUS_VERS) == PCI_X_SSTATUS_V2) {
624 625 626 627 628 629 630 631 632
				max = PCI_SPEED_133MHz_PCIX_ECC;
			} else {
				max = PCI_SPEED_133MHz_PCIX;
			}
		} else {
			max = PCI_SPEED_66MHz_PCIX;
		}

		bus->max_bus_speed = max;
633 634
		bus->cur_bus_speed = pcix_bus_speed[
			(status & PCI_X_SSTATUS_FREQ) >> 6];
635 636 637 638 639 640 641 642 643

		return;
	}

	pos = pci_find_capability(bridge, PCI_CAP_ID_EXP);
	if (pos) {
		u32 linkcap;
		u16 linksta;

644
		pcie_capability_read_dword(bridge, PCI_EXP_LNKCAP, &linkcap);
645
		bus->max_bus_speed = pcie_link_speed[linkcap & PCI_EXP_LNKCAP_SLS];
646

647
		pcie_capability_read_word(bridge, PCI_EXP_LNKSTA, &linksta);
648 649 650 651 652
		pcie_update_link_speed(bus, linksta);
	}
}


653 654
static struct pci_bus *pci_alloc_child_bus(struct pci_bus *parent,
					   struct pci_dev *bridge, int busnr)
L
Linus Torvalds 已提交
655 656 657
{
	struct pci_bus *child;
	int i;
658
	int ret;
L
Linus Torvalds 已提交
659 660 661 662 663 664 665 666 667 668 669

	/*
	 * Allocate a new bus, and inherit stuff from the parent..
	 */
	child = pci_alloc_bus();
	if (!child)
		return NULL;

	child->parent = parent;
	child->ops = parent->ops;
	child->sysdata = parent->sysdata;
670
	child->bus_flags = parent->bus_flags;
L
Linus Torvalds 已提交
671

672
	/* initialize some portions of the bus device, but don't register it
673
	 * now as the parent is not properly set up yet.
674 675
	 */
	child->dev.class = &pcibus_class;
676
	dev_set_name(&child->dev, "%04x:%02x", pci_domain_nr(child), busnr);
L
Linus Torvalds 已提交
677 678 679 680 681

	/*
	 * Set up the primary, secondary and subordinate
	 * bus numbers.
	 */
682 683 684
	child->number = child->busn_res.start = busnr;
	child->primary = parent->busn_res.start;
	child->busn_res.end = 0xff;
L
Linus Torvalds 已提交
685

686 687 688 689
	if (!bridge) {
		child->dev.parent = parent->bridge;
		goto add_dev;
	}
690 691 692

	child->self = bridge;
	child->bridge = get_device(&bridge->dev);
693
	child->dev.parent = child->bridge;
694
	pci_set_bus_of_node(child);
695 696
	pci_set_bus_speed(child);

L
Linus Torvalds 已提交
697
	/* Set up default resource pointers and names.. */
698
	for (i = 0; i < PCI_BRIDGE_RESOURCE_NUM; i++) {
L
Linus Torvalds 已提交
699 700 701 702 703
		child->resource[i] = &bridge->resource[PCI_BRIDGE_RESOURCES+i];
		child->resource[i]->name = child->name;
	}
	bridge->subordinate = child;

704 705 706 707
add_dev:
	ret = device_register(&child->dev);
	WARN_ON(ret < 0);

708 709
	pcibios_add_bus(child);

710 711 712
	/* Create legacy_io and legacy_mem files for this bus */
	pci_create_legacy_files(child);

L
Linus Torvalds 已提交
713 714 715
	return child;
}

716
struct pci_bus *__ref pci_add_new_bus(struct pci_bus *parent, struct pci_dev *dev, int busnr)
L
Linus Torvalds 已提交
717 718 719 720
{
	struct pci_bus *child;

	child = pci_alloc_child_bus(parent, dev, busnr);
721
	if (child) {
722
		down_write(&pci_bus_sem);
L
Linus Torvalds 已提交
723
		list_add_tail(&child->node, &parent->children);
724
		up_write(&pci_bus_sem);
725
	}
L
Linus Torvalds 已提交
726 727 728
	return child;
}

729
static void pci_fixup_parent_subordinate_busnr(struct pci_bus *child, int max)
730 731
{
	struct pci_bus *parent = child->parent;
732 733 734 735 736 737

	/* Attempts to fix that up are really dangerous unless
	   we're going to re-assign all bus numbers. */
	if (!pcibios_assign_all_busses())
		return;

738 739
	while (parent->parent && parent->busn_res.end < max) {
		parent->busn_res.end = max;
740 741 742 743 744
		pci_write_config_byte(parent->self, PCI_SUBORDINATE_BUS, max);
		parent = parent->parent;
	}
}

L
Linus Torvalds 已提交
745 746 747 748 749 750 751 752 753 754
/*
 * If it's a bridge, configure it and scan the bus behind it.
 * For CardBus bridges, we don't scan behind as the devices will
 * be handled by the bridge driver itself.
 *
 * We need to process bridges in two passes -- first we scan those
 * already configured by the BIOS and after we are done with all of
 * them, we proceed to assigning numbers to the remaining buses in
 * order to avoid overlaps between old and new bus numbers.
 */
B
Bill Pemberton 已提交
755
int pci_scan_bridge(struct pci_bus *bus, struct pci_dev *dev, int max, int pass)
L
Linus Torvalds 已提交
756 757 758
{
	struct pci_bus *child;
	int is_cardbus = (dev->hdr_type == PCI_HEADER_TYPE_CARDBUS);
759
	u32 buses, i, j = 0;
L
Linus Torvalds 已提交
760
	u16 bctl;
761
	u8 primary, secondary, subordinate;
762
	int broken = 0;
L
Linus Torvalds 已提交
763 764

	pci_read_config_dword(dev, PCI_PRIMARY_BUS, &buses);
765 766 767
	primary = buses & 0xFF;
	secondary = (buses >> 8) & 0xFF;
	subordinate = (buses >> 16) & 0xFF;
L
Linus Torvalds 已提交
768

769 770
	dev_dbg(&dev->dev, "scanning [bus %02x-%02x] behind bridge, pass %d\n",
		secondary, subordinate, pass);
L
Linus Torvalds 已提交
771

772 773 774 775 776
	if (!primary && (primary != bus->number) && secondary && subordinate) {
		dev_warn(&dev->dev, "Primary bus is hard wired to 0\n");
		primary = bus->number;
	}

777 778
	/* Check if setup is sensible at all */
	if (!pass &&
779 780 781 782
	    (primary != bus->number || secondary <= bus->number ||
	     secondary > subordinate)) {
		dev_info(&dev->dev, "bridge configuration invalid ([bus %02x-%02x]), reconfiguring\n",
			 secondary, subordinate);
783 784 785
		broken = 1;
	}

L
Linus Torvalds 已提交
786 787 788 789 790 791
	/* Disable MasterAbortMode during probing to avoid reporting
	   of bus errors (in some architectures) */ 
	pci_read_config_word(dev, PCI_BRIDGE_CONTROL, &bctl);
	pci_write_config_word(dev, PCI_BRIDGE_CONTROL,
			      bctl & ~PCI_BRIDGE_CTL_MASTER_ABORT);

792 793 794
	if ((secondary || subordinate) && !pcibios_assign_all_busses() &&
	    !is_cardbus && !broken) {
		unsigned int cmax;
L
Linus Torvalds 已提交
795 796 797 798 799
		/*
		 * Bus already configured by firmware, process it in the first
		 * pass and just note the configuration.
		 */
		if (pass)
800
			goto out;
L
Linus Torvalds 已提交
801 802 803

		/*
		 * If we already got to this bus through a different bridge,
A
Alex Chiang 已提交
804 805 806 807
		 * don't re-add it. This can happen with the i450NX chipset.
		 *
		 * However, we continue to descend down the hierarchy and
		 * scan remaining child buses.
L
Linus Torvalds 已提交
808
		 */
809
		child = pci_find_bus(pci_domain_nr(bus), secondary);
A
Alex Chiang 已提交
810
		if (!child) {
811
			child = pci_add_new_bus(bus, dev, secondary);
A
Alex Chiang 已提交
812 813
			if (!child)
				goto out;
814
			child->primary = primary;
Y
Yinghai Lu 已提交
815
			pci_bus_insert_busn_res(child, secondary, subordinate);
A
Alex Chiang 已提交
816
			child->bridge_ctl = bctl;
L
Linus Torvalds 已提交
817 818 819 820 821
		}

		cmax = pci_scan_child_bus(child);
		if (cmax > max)
			max = cmax;
822 823
		if (child->busn_res.end > max)
			max = child->busn_res.end;
L
Linus Torvalds 已提交
824 825 826 827 828
	} else {
		/*
		 * We need to assign a number to this bus which we always
		 * do in the second pass.
		 */
829
		if (!pass) {
830
			if (pcibios_assign_all_busses() || broken)
831 832 833 834 835 836 837 838
				/* Temporarily disable forwarding of the
				   configuration cycles on all bridges in
				   this bus segment to avoid possible
				   conflicts in the second pass between two
				   bridges programmed with overlapping
				   bus ranges. */
				pci_write_config_dword(dev, PCI_PRIMARY_BUS,
						       buses & ~0xffffff);
839
			goto out;
840
		}
L
Linus Torvalds 已提交
841 842 843 844

		/* Clear errors */
		pci_write_config_word(dev, PCI_STATUS, 0xffff);

845
		/* Prevent assigning a bus number that already exists.
846 847 848 849 850 851 852
		 * This can happen when a bridge is hot-plugged, so in
		 * this case we only re-scan this bus. */
		child = pci_find_bus(pci_domain_nr(bus), max+1);
		if (!child) {
			child = pci_add_new_bus(bus, dev, ++max);
			if (!child)
				goto out;
Y
Yinghai Lu 已提交
853
			pci_bus_insert_busn_res(child, max, 0xff);
854
		}
L
Linus Torvalds 已提交
855 856
		buses = (buses & 0xff000000)
		      | ((unsigned int)(child->primary)     <<  0)
857 858
		      | ((unsigned int)(child->busn_res.start)   <<  8)
		      | ((unsigned int)(child->busn_res.end) << 16);
L
Linus Torvalds 已提交
859 860 861 862 863 864 865 866 867

		/*
		 * yenta.c forces a secondary latency timer of 176.
		 * Copy that behaviour here.
		 */
		if (is_cardbus) {
			buses &= ~0xff000000;
			buses |= CARDBUS_LATENCY_TIMER << 24;
		}
868

L
Linus Torvalds 已提交
869 870 871 872 873 874
		/*
		 * We need to blast all three values with a single write.
		 */
		pci_write_config_dword(dev, PCI_PRIMARY_BUS, buses);

		if (!is_cardbus) {
875
			child->bridge_ctl = bctl;
876 877 878 879 880 881 882
			/*
			 * Adjust subordinate busnr in parent buses.
			 * We do this before scanning for children because
			 * some devices may not be detected if the bios
			 * was lazy.
			 */
			pci_fixup_parent_subordinate_busnr(child, max);
L
Linus Torvalds 已提交
883 884
			/* Now we can scan all subordinate buses... */
			max = pci_scan_child_bus(child);
885 886 887 888 889
			/*
			 * now fix it up again since we have found
			 * the real value of max.
			 */
			pci_fixup_parent_subordinate_busnr(child, max);
L
Linus Torvalds 已提交
890 891 892 893 894 895
		} else {
			/*
			 * For CardBus bridges, we leave 4 bus numbers
			 * as cards with a PCI-to-PCI bridge can be
			 * inserted later.
			 */
896 897
			for (i=0; i<CARDBUS_RESERVE_BUSNR; i++) {
				struct pci_bus *parent = bus;
898 899 900
				if (pci_find_bus(pci_domain_nr(bus),
							max+i+1))
					break;
901 902
				while (parent->parent) {
					if ((!pcibios_assign_all_busses()) &&
903 904
					    (parent->busn_res.end > max) &&
					    (parent->busn_res.end <= max+i)) {
905 906 907 908 909 910 911 912 913 914 915 916 917 918
						j = 1;
					}
					parent = parent->parent;
				}
				if (j) {
					/*
					 * Often, there are two cardbus bridges
					 * -- try to leave one valid bus number
					 * for each one.
					 */
					i /= 2;
					break;
				}
			}
919
			max += i;
920
			pci_fixup_parent_subordinate_busnr(child, max);
L
Linus Torvalds 已提交
921 922 923 924
		}
		/*
		 * Set the subordinate bus number to its real value.
		 */
Y
Yinghai Lu 已提交
925
		pci_bus_update_busn_res_end(child, max);
L
Linus Torvalds 已提交
926 927 928
		pci_write_config_byte(dev, PCI_SUBORDINATE_BUS, max);
	}

929 930 931
	sprintf(child->name,
		(is_cardbus ? "PCI CardBus %04x:%02x" : "PCI Bus %04x:%02x"),
		pci_domain_nr(bus), child->number);
L
Linus Torvalds 已提交
932

933
	/* Has only triggered on CardBus, fixup is in yenta_socket */
934
	while (bus->parent) {
935 936
		if ((child->busn_res.end > bus->busn_res.end) ||
		    (child->number > bus->busn_res.end) ||
937
		    (child->number < bus->number) ||
938 939 940 941 942 943
		    (child->busn_res.end < bus->number)) {
			dev_info(&child->dev, "%pR %s "
				"hidden behind%s bridge %s %pR\n",
				&child->busn_res,
				(bus->number > child->busn_res.end &&
				 bus->busn_res.end < child->number) ?
944 945
					"wholly" : "partially",
				bus->self->transparent ? " transparent" : "",
946
				dev_name(&bus->dev),
947
				&bus->busn_res);
948 949 950 951
		}
		bus = bus->parent;
	}

952 953 954
out:
	pci_write_config_word(dev, PCI_BRIDGE_CONTROL, bctl);

L
Linus Torvalds 已提交
955 956 957 958 959 960 961 962 963 964 965 966
	return max;
}

/*
 * Read interrupt line and base address registers.
 * The architecture-dependent code can tweak these, of course.
 */
static void pci_read_irq(struct pci_dev *dev)
{
	unsigned char irq;

	pci_read_config_byte(dev, PCI_INTERRUPT_PIN, &irq);
967
	dev->pin = irq;
L
Linus Torvalds 已提交
968 969 970 971 972
	if (irq)
		pci_read_config_byte(dev, PCI_INTERRUPT_LINE, &irq);
	dev->irq = irq;
}

973
void set_pcie_port_type(struct pci_dev *pdev)
Y
Yu Zhao 已提交
974 975 976 977 978 979 980 981
{
	int pos;
	u16 reg16;

	pos = pci_find_capability(pdev, PCI_CAP_ID_EXP);
	if (!pos)
		return;
	pdev->is_pcie = 1;
982
	pdev->pcie_cap = pos;
Y
Yu Zhao 已提交
983
	pci_read_config_word(pdev, pos + PCI_EXP_FLAGS, &reg16);
984
	pdev->pcie_flags_reg = reg16;
985 986
	pci_read_config_word(pdev, pos + PCI_EXP_DEVCAP, &reg16);
	pdev->pcie_mpss = reg16 & PCI_EXP_DEVCAP_PAYLOAD;
Y
Yu Zhao 已提交
987 988
}

989
void set_pcie_hotplug_bridge(struct pci_dev *pdev)
990 991 992
{
	u32 reg32;

993
	pcie_capability_read_dword(pdev, PCI_EXP_SLTCAP, &reg32);
994 995 996 997
	if (reg32 & PCI_EXP_SLTCAP_HPC)
		pdev->is_hotplug_bridge = 1;
}

998
#define LEGACY_IO_RESOURCE	(IORESOURCE_IO | IORESOURCE_PCI_FIXED)
999

L
Linus Torvalds 已提交
1000 1001 1002 1003 1004 1005 1006
/**
 * pci_setup_device - fill in class and map information of a device
 * @dev: the device structure to fill
 *
 * Initialize the device structure with information about the device's 
 * vendor,class,memory and IO-space addresses,IRQ lines etc.
 * Called at initialisation of the PCI subsystem and by CardBus services.
Y
Yu Zhao 已提交
1007 1008
 * Returns 0 on success and negative if unknown type of device (not normal,
 * bridge or CardBus).
L
Linus Torvalds 已提交
1009
 */
Y
Yu Zhao 已提交
1010
int pci_setup_device(struct pci_dev *dev)
L
Linus Torvalds 已提交
1011 1012
{
	u32 class;
Y
Yu Zhao 已提交
1013 1014
	u8 hdr_type;
	struct pci_slot *slot;
1015
	int pos = 0;
1016 1017
	struct pci_bus_region region;
	struct resource *res;
Y
Yu Zhao 已提交
1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036

	if (pci_read_config_byte(dev, PCI_HEADER_TYPE, &hdr_type))
		return -EIO;

	dev->sysdata = dev->bus->sysdata;
	dev->dev.parent = dev->bus->bridge;
	dev->dev.bus = &pci_bus_type;
	dev->hdr_type = hdr_type & 0x7f;
	dev->multifunction = !!(hdr_type & 0x80);
	dev->error_state = pci_channel_io_normal;
	set_pcie_port_type(dev);

	list_for_each_entry(slot, &dev->bus->slots, list)
		if (PCI_SLOT(dev->devfn) == slot->number)
			dev->slot = slot;

	/* Assume 32-bit PCI; let 64-bit PCI cards (which are far rarer)
	   set this higher, assuming the system even supports it.  */
	dev->dma_mask = 0xffffffff;
L
Linus Torvalds 已提交
1037

1038 1039 1040
	dev_set_name(&dev->dev, "%04x:%02x:%02x.%d", pci_domain_nr(dev->bus),
		     dev->bus->number, PCI_SLOT(dev->devfn),
		     PCI_FUNC(dev->devfn));
L
Linus Torvalds 已提交
1041 1042

	pci_read_config_dword(dev, PCI_CLASS_REVISION, &class);
A
Auke Kok 已提交
1043
	dev->revision = class & 0xff;
Y
Yinghai Lu 已提交
1044
	dev->class = class >> 8;		    /* upper 3 bytes */
L
Linus Torvalds 已提交
1045

Y
Yinghai Lu 已提交
1046 1047
	dev_printk(KERN_DEBUG, &dev->dev, "[%04x:%04x] type %02x class %#08x\n",
		   dev->vendor, dev->device, dev->hdr_type, dev->class);
L
Linus Torvalds 已提交
1048

1049 1050 1051
	/* need to have dev->class ready */
	dev->cfg_size = pci_cfg_space_size(dev);

L
Linus Torvalds 已提交
1052
	/* "Unknown power state" */
1053
	dev->current_state = PCI_UNKNOWN;
L
Linus Torvalds 已提交
1054 1055 1056

	/* Early fixups, before probing the BARs */
	pci_fixup_device(pci_fixup_early, dev);
1057 1058
	/* device class may be changed after fixup */
	class = dev->class >> 8;
L
Linus Torvalds 已提交
1059 1060 1061 1062 1063 1064 1065 1066 1067

	switch (dev->hdr_type) {		    /* header type */
	case PCI_HEADER_TYPE_NORMAL:		    /* standard header */
		if (class == PCI_CLASS_BRIDGE_PCI)
			goto bad;
		pci_read_irq(dev);
		pci_read_bases(dev, 6, PCI_ROM_ADDRESS);
		pci_read_config_word(dev, PCI_SUBSYSTEM_VENDOR_ID, &dev->subsystem_vendor);
		pci_read_config_word(dev, PCI_SUBSYSTEM_ID, &dev->subsystem_device);
1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078

		/*
		 *	Do the ugly legacy mode stuff here rather than broken chip
		 *	quirk code. Legacy mode ATA controllers have fixed
		 *	addresses. These are not always echoed in BAR0-3, and
		 *	BAR0-3 in a few cases contain junk!
		 */
		if (class == PCI_CLASS_STORAGE_IDE) {
			u8 progif;
			pci_read_config_byte(dev, PCI_CLASS_PROG, &progif);
			if ((progif & 1) == 0) {
1079 1080 1081 1082
				region.start = 0x1F0;
				region.end = 0x1F7;
				res = &dev->resource[0];
				res->flags = LEGACY_IO_RESOURCE;
1083
				pcibios_bus_to_resource(dev, res, &region);
1084 1085 1086 1087
				region.start = 0x3F6;
				region.end = 0x3F6;
				res = &dev->resource[1];
				res->flags = LEGACY_IO_RESOURCE;
1088
				pcibios_bus_to_resource(dev, res, &region);
1089 1090
			}
			if ((progif & 4) == 0) {
1091 1092 1093 1094
				region.start = 0x170;
				region.end = 0x177;
				res = &dev->resource[2];
				res->flags = LEGACY_IO_RESOURCE;
1095
				pcibios_bus_to_resource(dev, res, &region);
1096 1097 1098 1099
				region.start = 0x376;
				region.end = 0x376;
				res = &dev->resource[3];
				res->flags = LEGACY_IO_RESOURCE;
1100
				pcibios_bus_to_resource(dev, res, &region);
1101 1102
			}
		}
L
Linus Torvalds 已提交
1103 1104 1105 1106 1107 1108 1109 1110
		break;

	case PCI_HEADER_TYPE_BRIDGE:		    /* bridge header */
		if (class != PCI_CLASS_BRIDGE_PCI)
			goto bad;
		/* The PCI-to-PCI bridge spec requires that subtractive
		   decoding (i.e. transparent) bridge must have programming
		   interface code of 0x01. */ 
1111
		pci_read_irq(dev);
L
Linus Torvalds 已提交
1112 1113
		dev->transparent = ((dev->class & 0xff) == 1);
		pci_read_bases(dev, 2, PCI_ROM_ADDRESS1);
1114
		set_pcie_hotplug_bridge(dev);
1115 1116 1117 1118 1119
		pos = pci_find_capability(dev, PCI_CAP_ID_SSVID);
		if (pos) {
			pci_read_config_word(dev, pos + PCI_SSVID_VENDOR_ID, &dev->subsystem_vendor);
			pci_read_config_word(dev, pos + PCI_SSVID_DEVICE_ID, &dev->subsystem_device);
		}
L
Linus Torvalds 已提交
1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131
		break;

	case PCI_HEADER_TYPE_CARDBUS:		    /* CardBus bridge header */
		if (class != PCI_CLASS_BRIDGE_CARDBUS)
			goto bad;
		pci_read_irq(dev);
		pci_read_bases(dev, 1, 0);
		pci_read_config_word(dev, PCI_CB_SUBSYSTEM_VENDOR_ID, &dev->subsystem_vendor);
		pci_read_config_word(dev, PCI_CB_SUBSYSTEM_ID, &dev->subsystem_device);
		break;

	default:				    /* unknown header */
1132 1133
		dev_err(&dev->dev, "unknown header type %02x, "
			"ignoring device\n", dev->hdr_type);
Y
Yu Zhao 已提交
1134
		return -EIO;
L
Linus Torvalds 已提交
1135 1136

	bad:
Y
Yinghai Lu 已提交
1137 1138
		dev_err(&dev->dev, "ignoring class %#08x (doesn't match header "
			"type %02x)\n", dev->class, dev->hdr_type);
L
Linus Torvalds 已提交
1139 1140 1141 1142 1143 1144 1145
		dev->class = PCI_CLASS_NOT_DEFINED;
	}

	/* We found a fine healthy device, go go go... */
	return 0;
}

1146 1147 1148
static void pci_release_capabilities(struct pci_dev *dev)
{
	pci_vpd_release(dev);
1149
	pci_iov_release(dev);
1150
	pci_free_cap_save_buffers(dev);
1151 1152
}

L
Linus Torvalds 已提交
1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164
/**
 * pci_release_dev - free a pci device structure when all users of it are finished.
 * @dev: device that's been disconnected
 *
 * Will be called only by the device core when all users of this pci device are
 * done.
 */
static void pci_release_dev(struct device *dev)
{
	struct pci_dev *pci_dev;

	pci_dev = to_pci_dev(dev);
1165
	pci_release_capabilities(pci_dev);
1166
	pci_release_of_node(pci_dev);
1167
	pcibios_release_device(pci_dev);
1168
	pci_bus_put(pci_dev->bus);
L
Linus Torvalds 已提交
1169 1170 1171 1172 1173
	kfree(pci_dev);
}

/**
 * pci_cfg_space_size - get the configuration space size of the PCI device.
R
Randy Dunlap 已提交
1174
 * @dev: PCI device
L
Linus Torvalds 已提交
1175 1176 1177 1178 1179 1180 1181 1182
 *
 * Regular PCI devices have 256 bytes, but PCI-X 2 and PCI Express devices
 * have 4096 bytes.  Even if the device is capable, that doesn't mean we can
 * access it.  Maybe we don't have a way to generate extended config space
 * accesses, or the device is behind a reverse Express bridge.  So we try
 * reading the dword at 0x100 which must either be 0 or a valid extended
 * capability header.
 */
1183
int pci_cfg_space_size_ext(struct pci_dev *dev)
L
Linus Torvalds 已提交
1184 1185
{
	u32 status;
1186
	int pos = PCI_CFG_SPACE_SIZE;
L
Linus Torvalds 已提交
1187

1188
	if (pci_read_config_dword(dev, pos, &status) != PCIBIOS_SUCCESSFUL)
1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202
		goto fail;
	if (status == 0xffffffff)
		goto fail;

	return PCI_CFG_SPACE_EXP_SIZE;

 fail:
	return PCI_CFG_SPACE_SIZE;
}

int pci_cfg_space_size(struct pci_dev *dev)
{
	int pos;
	u32 status;
1203 1204 1205 1206 1207
	u16 class;

	class = dev->class >> 8;
	if (class == PCI_CLASS_BRIDGE_HOST)
		return pci_cfg_space_size_ext(dev);
1208

1209
	if (!pci_is_pcie(dev)) {
L
Linus Torvalds 已提交
1210 1211 1212 1213 1214 1215 1216 1217 1218
		pos = pci_find_capability(dev, PCI_CAP_ID_PCIX);
		if (!pos)
			goto fail;

		pci_read_config_dword(dev, pos + PCI_X_STATUS, &status);
		if (!(status & (PCI_X_STATUS_266MHZ | PCI_X_STATUS_533MHZ)))
			goto fail;
	}

1219
	return pci_cfg_space_size_ext(dev);
L
Linus Torvalds 已提交
1220 1221 1222 1223 1224

 fail:
	return PCI_CFG_SPACE_SIZE;
}

1225
struct pci_dev *pci_alloc_dev(struct pci_bus *bus)
1226 1227 1228 1229 1230 1231 1232 1233
{
	struct pci_dev *dev;

	dev = kzalloc(sizeof(struct pci_dev), GFP_KERNEL);
	if (!dev)
		return NULL;

	INIT_LIST_HEAD(&dev->bus_list);
1234
	dev->dev.type = &pci_dev_type;
1235
	dev->bus = pci_bus_get(bus);
1236 1237 1238

	return dev;
}
1239 1240 1241 1242 1243 1244
EXPORT_SYMBOL(pci_alloc_dev);

struct pci_dev *alloc_pci_dev(void)
{
	return pci_alloc_dev(NULL);
}
1245 1246
EXPORT_SYMBOL(alloc_pci_dev);

1247 1248
bool pci_bus_read_dev_vendor_id(struct pci_bus *bus, int devfn, u32 *l,
				 int crs_timeout)
L
Linus Torvalds 已提交
1249 1250 1251
{
	int delay = 1;

1252 1253
	if (pci_bus_read_config_dword(bus, devfn, PCI_VENDOR_ID, l))
		return false;
L
Linus Torvalds 已提交
1254 1255

	/* some broken boards return 0 or ~0 if a slot is empty: */
1256 1257 1258
	if (*l == 0xffffffff || *l == 0x00000000 ||
	    *l == 0x0000ffff || *l == 0xffff0000)
		return false;
L
Linus Torvalds 已提交
1259 1260

	/* Configuration request Retry Status */
1261 1262 1263 1264
	while (*l == 0xffff0001) {
		if (!crs_timeout)
			return false;

L
Linus Torvalds 已提交
1265 1266
		msleep(delay);
		delay *= 2;
1267 1268
		if (pci_bus_read_config_dword(bus, devfn, PCI_VENDOR_ID, l))
			return false;
L
Linus Torvalds 已提交
1269
		/* Card hasn't responded in 60 seconds?  Must be stuck. */
1270
		if (delay > crs_timeout) {
1271
			printk(KERN_WARNING "pci %04x:%02x:%02x.%d: not "
L
Linus Torvalds 已提交
1272 1273 1274
					"responding\n", pci_domain_nr(bus),
					bus->number, PCI_SLOT(devfn),
					PCI_FUNC(devfn));
1275
			return false;
L
Linus Torvalds 已提交
1276 1277 1278
		}
	}

1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294
	return true;
}
EXPORT_SYMBOL(pci_bus_read_dev_vendor_id);

/*
 * Read the config data for a PCI device, sanity-check it
 * and fill in the dev structure...
 */
static struct pci_dev *pci_scan_device(struct pci_bus *bus, int devfn)
{
	struct pci_dev *dev;
	u32 l;

	if (!pci_bus_read_dev_vendor_id(bus, devfn, &l, 60*1000))
		return NULL;

1295
	dev = pci_alloc_dev(bus);
L
Linus Torvalds 已提交
1296 1297 1298 1299 1300 1301
	if (!dev)
		return NULL;

	dev->devfn = devfn;
	dev->vendor = l & 0xffff;
	dev->device = (l >> 16) & 0xffff;
1302

1303 1304
	pci_set_of_node(dev);

Y
Yu Zhao 已提交
1305
	if (pci_setup_device(dev)) {
1306
		pci_bus_put(dev->bus);
L
Linus Torvalds 已提交
1307 1308 1309 1310 1311 1312 1313
		kfree(dev);
		return NULL;
	}

	return dev;
}

1314 1315 1316 1317 1318
static void pci_init_capabilities(struct pci_dev *dev)
{
	/* MSI/MSI-X list */
	pci_msi_init_pci_dev(dev);

1319 1320 1321
	/* Buffers for saving PCIe and PCI-X capabilities */
	pci_allocate_cap_save_buffers(dev);

1322 1323 1324 1325 1326
	/* Power Management */
	pci_pm_init(dev);

	/* Vital Product Data */
	pci_vpd_pci22_init(dev);
Y
Yu Zhao 已提交
1327 1328

	/* Alternative Routing-ID Forwarding */
1329
	pci_configure_ari(dev);
1330 1331 1332

	/* Single Root I/O Virtualization */
	pci_iov_init(dev);
1333 1334

	/* Enable ACS P2P upstream forwarding */
C
Chris Wright 已提交
1335
	pci_enable_acs(dev);
1336 1337
}

1338
void pci_device_add(struct pci_dev *dev, struct pci_bus *bus)
L
Linus Torvalds 已提交
1339
{
1340 1341
	int ret;

1342 1343
	device_initialize(&dev->dev);
	dev->dev.release = pci_release_dev;
L
Linus Torvalds 已提交
1344

1345
	set_dev_node(&dev->dev, pcibus_to_node(bus));
1346
	dev->dev.dma_mask = &dev->dma_mask;
1347
	dev->dev.dma_parms = &dev->dma_parms;
1348
	dev->dev.coherent_dma_mask = 0xffffffffull;
L
Linus Torvalds 已提交
1349

1350
	pci_set_dma_max_seg_size(dev, 65536);
1351
	pci_set_dma_seg_boundary(dev, 0xffffffff);
1352

L
Linus Torvalds 已提交
1353 1354 1355
	/* Fix up broken headers */
	pci_fixup_device(pci_fixup_header, dev);

1356 1357 1358
	/* moved out from quirk header fixup code */
	pci_reassigndev_resource_alignment(dev);

1359 1360 1361
	/* Clear the state_saved flag. */
	dev->state_saved = false;

1362 1363
	/* Initialize various capabilities */
	pci_init_capabilities(dev);
1364

L
Linus Torvalds 已提交
1365 1366 1367 1368
	/*
	 * Add the device to our list of discovered devices
	 * and the bus list for fixup functions, etc.
	 */
1369
	down_write(&pci_bus_sem);
L
Linus Torvalds 已提交
1370
	list_add_tail(&dev->bus_list, &bus->devices);
1371
	up_write(&pci_bus_sem);
1372 1373 1374 1375 1376 1377 1378 1379 1380 1381

	ret = pcibios_add_device(dev);
	WARN_ON(ret < 0);

	/* Notifier could use PCI capabilities */
	dev->match_driver = false;
	ret = device_add(&dev->dev);
	WARN_ON(ret < 0);

	pci_proc_attach_device(dev);
1382 1383
}

1384
struct pci_dev *__ref pci_scan_single_device(struct pci_bus *bus, int devfn)
1385 1386 1387
{
	struct pci_dev *dev;

T
Trent Piepho 已提交
1388 1389 1390 1391 1392 1393
	dev = pci_get_slot(bus, devfn);
	if (dev) {
		pci_dev_put(dev);
		return dev;
	}

1394 1395 1396 1397 1398
	dev = pci_scan_device(bus, devfn);
	if (!dev)
		return NULL;

	pci_device_add(dev, bus);
L
Linus Torvalds 已提交
1399 1400 1401

	return dev;
}
1402
EXPORT_SYMBOL(pci_scan_single_device);
L
Linus Torvalds 已提交
1403

1404
static unsigned next_fn(struct pci_bus *bus, struct pci_dev *dev, unsigned fn)
M
Matthew Wilcox 已提交
1405
{
1406 1407 1408
	int pos;
	u16 cap = 0;
	unsigned next_fn;
1409

1410 1411 1412 1413 1414 1415
	if (pci_ari_enabled(bus)) {
		if (!dev)
			return 0;
		pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_ARI);
		if (!pos)
			return 0;
1416

1417 1418 1419 1420
		pci_read_config_word(dev, pos + PCI_ARI_CAP, &cap);
		next_fn = PCI_ARI_CAP_NFN(cap);
		if (next_fn <= fn)
			return 0;	/* protect against malformed list */
M
Matthew Wilcox 已提交
1421

1422 1423 1424 1425 1426 1427
		return next_fn;
	}

	/* dev may be NULL for non-contiguous multifunction devices */
	if (!dev || dev->multifunction)
		return (fn + 1) % 8;
M
Matthew Wilcox 已提交
1428 1429 1430 1431 1432 1433 1434

	return 0;
}

static int only_one_child(struct pci_bus *bus)
{
	struct pci_dev *parent = bus->self;
1435

M
Matthew Wilcox 已提交
1436 1437
	if (!parent || !pci_is_pcie(parent))
		return 0;
1438
	if (pci_pcie_type(parent) == PCI_EXP_TYPE_ROOT_PORT)
1439
		return 1;
1440
	if (pci_pcie_type(parent) == PCI_EXP_TYPE_DOWNSTREAM &&
1441
	    !pci_has_flag(PCI_SCAN_ALL_PCIE_DEVS))
M
Matthew Wilcox 已提交
1442 1443 1444 1445
		return 1;
	return 0;
}

L
Linus Torvalds 已提交
1446 1447 1448 1449 1450 1451 1452
/**
 * pci_scan_slot - scan a PCI slot on a bus for devices.
 * @bus: PCI bus to scan
 * @devfn: slot number to scan (must have zero function.)
 *
 * Scan a PCI slot on the specified PCI bus for devices, adding
 * discovered devices to the @bus->devices list.  New devices
1453
 * will not have is_added set.
1454 1455
 *
 * Returns the number of new devices found.
L
Linus Torvalds 已提交
1456
 */
1457
int pci_scan_slot(struct pci_bus *bus, int devfn)
L
Linus Torvalds 已提交
1458
{
M
Matthew Wilcox 已提交
1459
	unsigned fn, nr = 0;
1460
	struct pci_dev *dev;
M
Matthew Wilcox 已提交
1461 1462 1463

	if (only_one_child(bus) && (devfn > 0))
		return 0; /* Already scanned the entire slot */
L
Linus Torvalds 已提交
1464

1465
	dev = pci_scan_single_device(bus, devfn);
1466 1467 1468
	if (!dev)
		return 0;
	if (!dev->is_added)
1469 1470
		nr++;

1471
	for (fn = next_fn(bus, dev, 0); fn > 0; fn = next_fn(bus, dev, fn)) {
M
Matthew Wilcox 已提交
1472 1473 1474 1475 1476
		dev = pci_scan_single_device(bus, devfn + fn);
		if (dev) {
			if (!dev->is_added)
				nr++;
			dev->multifunction = 1;
L
Linus Torvalds 已提交
1477 1478
		}
	}
S
Shaohua Li 已提交
1479

1480 1481
	/* only one slot has pcie device */
	if (bus->self && nr)
S
Shaohua Li 已提交
1482 1483
		pcie_aspm_init_link_state(bus->self);

L
Linus Torvalds 已提交
1484 1485 1486
	return nr;
}

1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509
static int pcie_find_smpss(struct pci_dev *dev, void *data)
{
	u8 *smpss = data;

	if (!pci_is_pcie(dev))
		return 0;

	/* For PCIE hotplug enabled slots not connected directly to a
	 * PCI-E root port, there can be problems when hotplugging
	 * devices.  This is due to the possibility of hotplugging a
	 * device into the fabric with a smaller MPS that the devices
	 * currently running have configured.  Modifying the MPS on the
	 * running devices could cause a fatal bus error due to an
	 * incoming frame being larger than the newly configured MPS.
	 * To work around this, the MPS for the entire fabric must be
	 * set to the minimum size.  Any devices hotplugged into this
	 * fabric will have the minimum MPS set.  If the PCI hotplug
	 * slot is directly connected to the root port and there are not
	 * other devices on the fabric (which seems to be the most
	 * common case), then this is not an issue and MPS discovery
	 * will occur as normal.
	 */
	if (dev->is_hotplug_bridge && (!list_is_singular(&dev->bus->devices) ||
1510
	     (dev->bus->self &&
1511
	      pci_pcie_type(dev->bus->self) != PCI_EXP_TYPE_ROOT_PORT)))
1512 1513 1514 1515 1516 1517 1518 1519 1520 1521
		*smpss = 0;

	if (*smpss > dev->pcie_mpss)
		*smpss = dev->pcie_mpss;

	return 0;
}

static void pcie_write_mps(struct pci_dev *dev, int mps)
{
1522
	int rc;
1523 1524

	if (pcie_bus_config == PCIE_BUS_PERFORMANCE) {
1525
		mps = 128 << dev->pcie_mpss;
1526

1527 1528
		if (pci_pcie_type(dev) != PCI_EXP_TYPE_ROOT_PORT &&
		    dev->bus->self)
1529
			/* For "Performance", the assumption is made that
1530 1531 1532 1533 1534
			 * downstream communication will never be larger than
			 * the MRRS.  So, the MPS only needs to be configured
			 * for the upstream communication.  This being the case,
			 * walk from the top down and set the MPS of the child
			 * to that of the parent bus.
1535 1536 1537 1538 1539
			 *
			 * Configure the device MPS with the smaller of the
			 * device MPSS or the bridge MPS (which is assumed to be
			 * properly configured at this point to the largest
			 * allowable MPS based on its parent bus).
1540
			 */
1541
			mps = min(mps, pcie_get_mps(dev->bus->self));
1542 1543 1544 1545 1546 1547 1548
	}

	rc = pcie_set_mps(dev, mps);
	if (rc)
		dev_err(&dev->dev, "Failed attempting to set the MPS\n");
}

1549
static void pcie_write_mrrs(struct pci_dev *dev)
1550
{
1551
	int rc, mrrs;
1552

1553 1554 1555 1556 1557 1558 1559 1560
	/* In the "safe" case, do not configure the MRRS.  There appear to be
	 * issues with setting MRRS to 0 on a number of devices.
	 */
	if (pcie_bus_config != PCIE_BUS_PERFORMANCE)
		return;

	/* For Max performance, the MRRS must be set to the largest supported
	 * value.  However, it cannot be configured larger than the MPS the
1561 1562
	 * device or the bus can support.  This should already be properly
	 * configured by a prior call to pcie_write_mps.
1563
	 */
1564
	mrrs = pcie_get_mps(dev);
1565 1566

	/* MRRS is a R/W register.  Invalid values can be written, but a
1567
	 * subsequent read will verify if the value is acceptable or not.
1568 1569 1570 1571 1572
	 * If the MRRS value provided is not acceptable (e.g., too large),
	 * shrink the value until it is acceptable to the HW.
 	 */
	while (mrrs != pcie_get_readrq(dev) && mrrs >= 128) {
		rc = pcie_set_readrq(dev, mrrs);
1573 1574
		if (!rc)
			break;
1575

1576
		dev_warn(&dev->dev, "Failed attempting to set the MRRS\n");
1577 1578
		mrrs /= 2;
	}
1579 1580 1581 1582 1583

	if (mrrs < 128)
		dev_err(&dev->dev, "MRRS was unable to be configured with a "
			"safe value.  If problems are experienced, try running "
			"with pci=pcie_bus_safe.\n");
1584 1585 1586 1587
}

static int pcie_bus_configure_set(struct pci_dev *dev, void *data)
{
J
Jon Mason 已提交
1588
	int mps, orig_mps;
1589 1590 1591 1592

	if (!pci_is_pcie(dev))
		return 0;

J
Jon Mason 已提交
1593 1594
	mps = 128 << *(u8 *)data;
	orig_mps = pcie_get_mps(dev);
1595 1596

	pcie_write_mps(dev, mps);
1597
	pcie_write_mrrs(dev);
1598

1599
	dev_info(&dev->dev, "Max Payload Size set to %4d/%4d (was %4d), "
J
Jon Mason 已提交
1600 1601
		 "Max Read Rq %4d\n", pcie_get_mps(dev), 128 << dev->pcie_mpss,
		 orig_mps, pcie_get_readrq(dev));
1602 1603 1604 1605

	return 0;
}

J
Jon Mason 已提交
1606
/* pcie_bus_configure_settings requires that pci_walk_bus work in a top-down,
1607 1608 1609
 * parents then children fashion.  If this changes, then this code will not
 * work as designed.
 */
1610
void pcie_bus_configure_settings(struct pci_bus *bus)
1611
{
1612
	u8 smpss;
1613

1614 1615 1616
	if (!bus->self)
		return;

1617 1618 1619
	if (!pci_is_pcie(bus->self))
		return;

1620 1621 1622 1623 1624 1625 1626 1627 1628 1629
	if (pcie_bus_config == PCIE_BUS_TUNE_OFF)
		return;

	/* FIXME - Peer to peer DMA is possible, though the endpoint would need
	 * to be aware to the MPS of the destination.  To work around this,
	 * simply force the MPS of the entire system to the smallest possible.
	 */
	if (pcie_bus_config == PCIE_BUS_PEER2PEER)
		smpss = 0;

1630
	if (pcie_bus_config == PCIE_BUS_SAFE) {
1631
		smpss = bus->self->pcie_mpss;
1632

1633 1634 1635 1636 1637 1638 1639
		pcie_find_smpss(bus->self, &smpss);
		pci_walk_bus(bus, pcie_find_smpss, &smpss);
	}

	pcie_bus_configure_set(bus->self, &smpss);
	pci_walk_bus(bus, pcie_bus_configure_set, &smpss);
}
1640
EXPORT_SYMBOL_GPL(pcie_bus_configure_settings);
1641

B
Bill Pemberton 已提交
1642
unsigned int pci_scan_child_bus(struct pci_bus *bus)
L
Linus Torvalds 已提交
1643
{
1644
	unsigned int devfn, pass, max = bus->busn_res.start;
L
Linus Torvalds 已提交
1645 1646
	struct pci_dev *dev;

B
Bjorn Helgaas 已提交
1647
	dev_dbg(&bus->dev, "scanning bus\n");
L
Linus Torvalds 已提交
1648 1649 1650 1651 1652

	/* Go find them, Rover! */
	for (devfn = 0; devfn < 0x100; devfn += 8)
		pci_scan_slot(bus, devfn);

1653 1654 1655
	/* Reserve buses for SR-IOV capability. */
	max += pci_iov_bus_range(bus);

L
Linus Torvalds 已提交
1656 1657 1658 1659
	/*
	 * After performing arch-dependent fixup of the bus, look behind
	 * all PCI-to-PCI bridges on this bus.
	 */
A
Alex Chiang 已提交
1660
	if (!bus->is_added) {
B
Bjorn Helgaas 已提交
1661
		dev_dbg(&bus->dev, "fixups for bus\n");
A
Alex Chiang 已提交
1662
		pcibios_fixup_bus(bus);
1663
		bus->is_added = 1;
A
Alex Chiang 已提交
1664 1665
	}

L
Linus Torvalds 已提交
1666 1667 1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678 1679
	for (pass=0; pass < 2; pass++)
		list_for_each_entry(dev, &bus->devices, bus_list) {
			if (dev->hdr_type == PCI_HEADER_TYPE_BRIDGE ||
			    dev->hdr_type == PCI_HEADER_TYPE_CARDBUS)
				max = pci_scan_bridge(bus, dev, max, pass);
		}

	/*
	 * We've scanned the bus and so we know all about what's on
	 * the other side of any bridges that may be on this bus plus
	 * any devices.
	 *
	 * Return how far we've got finding sub-buses.
	 */
B
Bjorn Helgaas 已提交
1680
	dev_dbg(&bus->dev, "bus scan returning with max=%02x\n", max);
L
Linus Torvalds 已提交
1681 1682 1683
	return max;
}

1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695
/**
 * pcibios_root_bridge_prepare - Platform-specific host bridge setup.
 * @bridge: Host bridge to set up.
 *
 * Default empty implementation.  Replace with an architecture-specific setup
 * routine, if necessary.
 */
int __weak pcibios_root_bridge_prepare(struct pci_host_bridge *bridge)
{
	return 0;
}

1696 1697 1698 1699 1700 1701 1702 1703
void __weak pcibios_add_bus(struct pci_bus *bus)
{
}

void __weak pcibios_remove_bus(struct pci_bus *bus)
{
}

1704 1705
struct pci_bus *pci_create_root_bus(struct device *parent, int bus,
		struct pci_ops *ops, void *sysdata, struct list_head *resources)
L
Linus Torvalds 已提交
1706
{
1707
	int error;
1708
	struct pci_host_bridge *bridge;
B
Bjorn Helgaas 已提交
1709
	struct pci_bus *b, *b2;
1710
	struct pci_host_bridge_window *window, *n;
1711
	struct resource *res;
1712 1713 1714
	resource_size_t offset;
	char bus_addr[64];
	char *fmt;
L
Linus Torvalds 已提交
1715 1716 1717

	b = pci_alloc_bus();
	if (!b)
1718
		return NULL;
L
Linus Torvalds 已提交
1719 1720 1721

	b->sysdata = sysdata;
	b->ops = ops;
1722
	b->number = b->busn_res.start = bus;
B
Bjorn Helgaas 已提交
1723 1724
	b2 = pci_find_bus(pci_domain_nr(b), bus);
	if (b2) {
L
Linus Torvalds 已提交
1725
		/* If we already got to this bus through a different bridge, ignore it */
B
Bjorn Helgaas 已提交
1726
		dev_dbg(&b2->dev, "bus already known\n");
L
Linus Torvalds 已提交
1727 1728
		goto err_out;
	}
1729

1730 1731 1732 1733 1734
	bridge = pci_alloc_host_bridge(b);
	if (!bridge)
		goto err_out;

	bridge->dev.parent = parent;
1735
	bridge->dev.release = pci_release_host_bridge_dev;
1736
	dev_set_name(&bridge->dev, "pci%04x:%02x", pci_domain_nr(b), bus);
1737
	error = pcibios_root_bridge_prepare(bridge);
1738 1739 1740 1741
	if (error) {
		kfree(bridge);
		goto err_out;
	}
1742

1743
	error = device_register(&bridge->dev);
1744 1745 1746 1747
	if (error) {
		put_device(&bridge->dev);
		goto err_out;
	}
1748
	b->bridge = get_device(&bridge->dev);
1749
	device_enable_async_suspend(b->bridge);
1750
	pci_set_bus_of_node(b);
L
Linus Torvalds 已提交
1751

1752 1753 1754
	if (!parent)
		set_dev_node(b->bridge, pcibus_to_node(b));

1755 1756
	b->dev.class = &pcibus_class;
	b->dev.parent = b->bridge;
1757
	dev_set_name(&b->dev, "%04x:%02x", pci_domain_nr(b), bus);
1758
	error = device_register(&b->dev);
L
Linus Torvalds 已提交
1759 1760 1761
	if (error)
		goto class_dev_reg_err;

1762 1763
	pcibios_add_bus(b);

L
Linus Torvalds 已提交
1764 1765 1766
	/* Create legacy_io and legacy_mem files for this bus */
	pci_create_legacy_files(b);

1767 1768 1769 1770 1771
	if (parent)
		dev_info(parent, "PCI host bridge to bus %s\n", dev_name(&b->dev));
	else
		printk(KERN_INFO "PCI host bridge to bus %s\n", dev_name(&b->dev));

1772 1773 1774 1775 1776
	/* Add initial resources to the bus */
	list_for_each_entry_safe(window, n, resources, list) {
		list_move_tail(&window->list, &bridge->windows);
		res = window->res;
		offset = window->offset;
1777 1778 1779 1780
		if (res->flags & IORESOURCE_BUS)
			pci_bus_insert_busn_res(b, bus, res->end);
		else
			pci_bus_add_resource(b, res, 0);
1781 1782 1783 1784 1785 1786 1787 1788 1789 1790 1791
		if (offset) {
			if (resource_type(res) == IORESOURCE_IO)
				fmt = " (bus address [%#06llx-%#06llx])";
			else
				fmt = " (bus address [%#010llx-%#010llx])";
			snprintf(bus_addr, sizeof(bus_addr), fmt,
				 (unsigned long long) (res->start - offset),
				 (unsigned long long) (res->end - offset));
		} else
			bus_addr[0] = '\0';
		dev_info(&b->dev, "root bus resource %pR%s\n", res, bus_addr);
1792 1793
	}

1794 1795 1796 1797
	down_write(&pci_bus_sem);
	list_add_tail(&b->node, &pci_root_buses);
	up_write(&pci_bus_sem);

L
Linus Torvalds 已提交
1798 1799 1800
	return b;

class_dev_reg_err:
1801 1802
	put_device(&bridge->dev);
	device_unregister(&bridge->dev);
L
Linus Torvalds 已提交
1803 1804 1805 1806
err_out:
	kfree(b);
	return NULL;
}
1807

1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820 1821 1822 1823 1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844 1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867 1868 1869 1870
int pci_bus_insert_busn_res(struct pci_bus *b, int bus, int bus_max)
{
	struct resource *res = &b->busn_res;
	struct resource *parent_res, *conflict;

	res->start = bus;
	res->end = bus_max;
	res->flags = IORESOURCE_BUS;

	if (!pci_is_root_bus(b))
		parent_res = &b->parent->busn_res;
	else {
		parent_res = get_pci_domain_busn_res(pci_domain_nr(b));
		res->flags |= IORESOURCE_PCI_FIXED;
	}

	conflict = insert_resource_conflict(parent_res, res);

	if (conflict)
		dev_printk(KERN_DEBUG, &b->dev,
			   "busn_res: can not insert %pR under %s%pR (conflicts with %s %pR)\n",
			    res, pci_is_root_bus(b) ? "domain " : "",
			    parent_res, conflict->name, conflict);

	return conflict == NULL;
}

int pci_bus_update_busn_res_end(struct pci_bus *b, int bus_max)
{
	struct resource *res = &b->busn_res;
	struct resource old_res = *res;
	resource_size_t size;
	int ret;

	if (res->start > bus_max)
		return -EINVAL;

	size = bus_max - res->start + 1;
	ret = adjust_resource(res, res->start, size);
	dev_printk(KERN_DEBUG, &b->dev,
			"busn_res: %pR end %s updated to %02x\n",
			&old_res, ret ? "can not be" : "is", bus_max);

	if (!ret && !res->parent)
		pci_bus_insert_busn_res(b, res->start, res->end);

	return ret;
}

void pci_bus_release_busn_res(struct pci_bus *b)
{
	struct resource *res = &b->busn_res;
	int ret;

	if (!res->flags || !res->parent)
		return;

	ret = release_resource(res);
	dev_printk(KERN_DEBUG, &b->dev,
			"busn_res: %pR %s released\n",
			res, ret ? "can not be" : "is");
}

B
Bill Pemberton 已提交
1871
struct pci_bus *pci_scan_root_bus(struct device *parent, int bus,
1872 1873
		struct pci_ops *ops, void *sysdata, struct list_head *resources)
{
1874 1875
	struct pci_host_bridge_window *window;
	bool found = false;
1876
	struct pci_bus *b;
1877 1878 1879 1880 1881 1882 1883
	int max;

	list_for_each_entry(window, resources, list)
		if (window->res->flags & IORESOURCE_BUS) {
			found = true;
			break;
		}
1884 1885 1886 1887 1888

	b = pci_create_root_bus(parent, bus, ops, sysdata, resources);
	if (!b)
		return NULL;

1889 1890 1891 1892 1893 1894 1895 1896 1897 1898 1899 1900
	if (!found) {
		dev_info(&b->dev,
		 "No busn resource found for root bus, will use [bus %02x-ff]\n",
			bus);
		pci_bus_insert_busn_res(b, bus, 255);
	}

	max = pci_scan_child_bus(b);

	if (!found)
		pci_bus_update_busn_res_end(b, max);

1901 1902 1903 1904 1905
	pci_bus_add_devices(b);
	return b;
}
EXPORT_SYMBOL(pci_scan_root_bus);

1906
/* Deprecated; use pci_scan_root_bus() instead */
B
Bill Pemberton 已提交
1907
struct pci_bus *pci_scan_bus_parented(struct device *parent,
1908 1909
		int bus, struct pci_ops *ops, void *sysdata)
{
1910
	LIST_HEAD(resources);
1911 1912
	struct pci_bus *b;

1913 1914
	pci_add_resource(&resources, &ioport_resource);
	pci_add_resource(&resources, &iomem_resource);
1915
	pci_add_resource(&resources, &busn_resource);
1916
	b = pci_create_root_bus(parent, bus, ops, sysdata, &resources);
1917
	if (b)
1918
		pci_scan_child_bus(b);
1919 1920
	else
		pci_free_resource_list(&resources);
1921 1922
	return b;
}
L
Linus Torvalds 已提交
1923 1924
EXPORT_SYMBOL(pci_scan_bus_parented);

B
Bill Pemberton 已提交
1925
struct pci_bus *pci_scan_bus(int bus, struct pci_ops *ops,
1926 1927 1928 1929 1930 1931 1932
					void *sysdata)
{
	LIST_HEAD(resources);
	struct pci_bus *b;

	pci_add_resource(&resources, &ioport_resource);
	pci_add_resource(&resources, &iomem_resource);
1933
	pci_add_resource(&resources, &busn_resource);
1934 1935
	b = pci_create_root_bus(NULL, bus, ops, sysdata, &resources);
	if (b) {
1936
		pci_scan_child_bus(b);
1937 1938 1939 1940 1941 1942 1943 1944
		pci_bus_add_devices(b);
	} else {
		pci_free_resource_list(&resources);
	}
	return b;
}
EXPORT_SYMBOL(pci_scan_bus);

1945 1946 1947 1948 1949 1950 1951 1952 1953 1954 1955 1956 1957 1958 1959 1960 1961 1962 1963 1964 1965 1966 1967 1968 1969
/**
 * pci_rescan_bus_bridge_resize - scan a PCI bus for devices.
 * @bridge: PCI bridge for the bus to scan
 *
 * Scan a PCI bus and child buses for new devices, add them,
 * and enable them, resizing bridge mmio/io resource if necessary
 * and possible.  The caller must ensure the child devices are already
 * removed for resizing to occur.
 *
 * Returns the max number of subordinate bus discovered.
 */
unsigned int __ref pci_rescan_bus_bridge_resize(struct pci_dev *bridge)
{
	unsigned int max;
	struct pci_bus *bus = bridge->subordinate;

	max = pci_scan_child_bus(bus);

	pci_assign_unassigned_bridge_resources(bridge);

	pci_bus_add_devices(bus);

	return max;
}

1970 1971 1972 1973 1974 1975 1976 1977 1978 1979 1980 1981 1982 1983 1984
/**
 * pci_rescan_bus - scan a PCI bus for devices.
 * @bus: PCI bus to scan
 *
 * Scan a PCI bus and child buses for new devices, adds them,
 * and enables them.
 *
 * Returns the max number of subordinate bus discovered.
 */
unsigned int __ref pci_rescan_bus(struct pci_bus *bus)
{
	unsigned int max;

	max = pci_scan_child_bus(bus);
	pci_assign_unassigned_bus_resources(bus);
1985
	pci_enable_bridges(bus);
1986 1987 1988 1989 1990 1991
	pci_bus_add_devices(bus);

	return max;
}
EXPORT_SYMBOL_GPL(pci_rescan_bus);

L
Linus Torvalds 已提交
1992 1993 1994 1995
EXPORT_SYMBOL(pci_add_new_bus);
EXPORT_SYMBOL(pci_scan_slot);
EXPORT_SYMBOL(pci_scan_bridge);
EXPORT_SYMBOL_GPL(pci_scan_child_bus);
1996

1997
static int __init pci_sort_bf_cmp(const struct device *d_a, const struct device *d_b)
1998
{
1999 2000 2001
	const struct pci_dev *a = to_pci_dev(d_a);
	const struct pci_dev *b = to_pci_dev(d_b);

2002 2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013
	if      (pci_domain_nr(a->bus) < pci_domain_nr(b->bus)) return -1;
	else if (pci_domain_nr(a->bus) > pci_domain_nr(b->bus)) return  1;

	if      (a->bus->number < b->bus->number) return -1;
	else if (a->bus->number > b->bus->number) return  1;

	if      (a->devfn < b->devfn) return -1;
	else if (a->devfn > b->devfn) return  1;

	return 0;
}

2014
void __init pci_sort_breadthfirst(void)
2015
{
2016
	bus_sort_breadthfirst(&pci_bus_type, &pci_sort_bf_cmp);
2017
}