mmconfig-shared.c 18.4 KB
Newer Older
1 2 3 4 5
/*
 * mmconfig-shared.c - Low-level direct PCI config space access via
 *                     MMCONFIG - common code between i386 and x86-64.
 *
 * This code does:
6
 * - known chipset handling
7 8 9 10 11 12 13 14
 * - ACPI decoding and validation
 *
 * Per-architecture code takes care of the mappings and accesses
 * themselves.
 */

#include <linux/pci.h>
#include <linux/init.h>
F
Feng Tang 已提交
15
#include <linux/sfi_acpi.h>
16
#include <linux/bitmap.h>
B
Bjorn Helgaas 已提交
17
#include <linux/dmi.h>
18
#include <linux/slab.h>
19 20
#include <linux/mutex.h>
#include <linux/rculist.h>
21
#include <asm/e820.h>
22
#include <asm/pci_x86.h>
F
Feng Tang 已提交
23
#include <asm/acpi.h>
24

25
#define PREFIX "PCI: "
26

27
/* Indicate if the mmcfg resources have been placed into the resource table. */
28
static bool pci_mmcfg_running_state;
29
static bool pci_mmcfg_arch_init_failed;
30
static DEFINE_MUTEX(pci_mmcfg_lock);
31

32 33
LIST_HEAD(pci_mmcfg_list);

34 35 36 37 38 39 40 41
static __init void pci_mmconfig_remove(struct pci_mmcfg_region *cfg)
{
	if (cfg->res.parent)
		release_resource(&cfg->res);
	list_del(&cfg->list);
	kfree(cfg);
}

42 43
static __init void free_all_mmcfg(void)
{
44
	struct pci_mmcfg_region *cfg, *tmp;
45

46
	pci_mmcfg_arch_free();
47 48
	list_for_each_entry_safe(cfg, tmp, &pci_mmcfg_list, list)
		pci_mmconfig_remove(cfg);
49 50
}

51
static void list_add_sorted(struct pci_mmcfg_region *new)
52 53 54 55
{
	struct pci_mmcfg_region *cfg;

	/* keep list sorted by segment and starting bus number */
56
	list_for_each_entry_rcu(cfg, &pci_mmcfg_list, list) {
57 58 59
		if (cfg->segment > new->segment ||
		    (cfg->segment == new->segment &&
		     cfg->start_bus >= new->start_bus)) {
60
			list_add_tail_rcu(&new->list, &cfg->list);
61 62 63
			return;
		}
	}
64
	list_add_tail_rcu(&new->list, &pci_mmcfg_list);
65 66
}

67 68
static struct pci_mmcfg_region *pci_mmconfig_alloc(int segment, int start,
						   int end, u64 addr)
69
{
70
	struct pci_mmcfg_region *new;
71
	struct resource *res;
72

73 74 75
	if (addr == 0)
		return NULL;

76
	new = kzalloc(sizeof(*new), GFP_KERNEL);
77
	if (!new)
78
		return NULL;
79

80 81 82 83
	new->address = addr;
	new->segment = segment;
	new->start_bus = start;
	new->end_bus = end;
84

85 86
	res = &new->res;
	res->start = addr + PCI_MMCFG_BUS_OFFSET(start);
87
	res->end = addr + PCI_MMCFG_BUS_OFFSET(end + 1) - 1;
88 89 90 91 92
	res->flags = IORESOURCE_MEM | IORESOURCE_BUSY;
	snprintf(new->name, PCI_MMCFG_RESOURCE_NAME_LEN,
		 "PCI MMCONFIG %04x [bus %02x-%02x]", segment, start, end);
	res->name = new->name;

93
	return new;
94 95
}

96 97 98 99 100 101
static __init struct pci_mmcfg_region *pci_mmconfig_add(int segment, int start,
							int end, u64 addr)
{
	struct pci_mmcfg_region *new;

	new = pci_mmconfig_alloc(segment, start, end, addr);
102 103
	if (new) {
		mutex_lock(&pci_mmcfg_lock);
104
		list_add_sorted(new);
105
		mutex_unlock(&pci_mmcfg_lock);
106

107
		pr_info(PREFIX
108 109 110
		       "MMCONFIG for domain %04x [bus %02x-%02x] at %pR "
		       "(base %#lx)\n",
		       segment, start, end, &new->res, (unsigned long)addr);
111
	}
112 113 114 115

	return new;
}

116 117 118 119
struct pci_mmcfg_region *pci_mmconfig_lookup(int segment, int bus)
{
	struct pci_mmcfg_region *cfg;

120
	list_for_each_entry_rcu(cfg, &pci_mmcfg_list, list)
121 122 123 124 125 126 127
		if (cfg->segment == segment &&
		    cfg->start_bus <= bus && bus <= cfg->end_bus)
			return cfg;

	return NULL;
}

128
static const char __init *pci_mmcfg_e7520(void)
129 130
{
	u32 win;
131
	raw_pci_ops->read(0, 0, PCI_DEVFN(0, 0), 0xce, 2, &win);
132

133
	win = win & 0xf000;
134 135 136
	if (win == 0x0000 || win == 0xf000)
		return NULL;

137
	if (pci_mmconfig_add(0, 0, 255, win << 16) == NULL)
138 139
		return NULL;

140 141 142
	return "Intel Corporation E7520 Memory Controller Hub";
}

143
static const char __init *pci_mmcfg_intel_945(void)
144 145 146
{
	u32 pciexbar, mask = 0, len = 0;

147
	raw_pci_ops->read(0, 0, PCI_DEVFN(0, 0), 0x48, 4, &pciexbar);
148 149 150

	/* Enable bit */
	if (!(pciexbar & 1))
151
		return NULL;
152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167

	/* Size bits */
	switch ((pciexbar >> 1) & 3) {
	case 0:
		mask = 0xf0000000U;
		len  = 0x10000000U;
		break;
	case 1:
		mask = 0xf8000000U;
		len  = 0x08000000U;
		break;
	case 2:
		mask = 0xfc000000U;
		len  = 0x04000000U;
		break;
	default:
168
		return NULL;
169 170 171 172 173 174
	}

	/* Errata #2, things break when not aligned on a 256Mb boundary */
	/* Can only happen in 64M/128M mode */

	if ((pciexbar & mask) & 0x0fffffffU)
175
		return NULL;
176

177 178
	/* Don't hit the APIC registers and their friends */
	if ((pciexbar & mask) >= 0xf0000000U)
179 180
		return NULL;

181
	if (pci_mmconfig_add(0, 0, (len >> 20) - 1, pciexbar & mask) == NULL)
182 183
		return NULL;

184 185 186
	return "Intel Corporation 945G/GZ/P/PL Express Memory Controller Hub";
}

187 188 189 190 191
static const char __init *pci_mmcfg_amd_fam10h(void)
{
	u32 low, high, address;
	u64 base, msr;
	int i;
192
	unsigned segnbits = 0, busnbits, end_bus;
193

194 195 196
	if (!(pci_probe & PCI_CHECK_ENABLE_AMD_MMCONF))
		return NULL;

197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225
	address = MSR_FAM10H_MMIO_CONF_BASE;
	if (rdmsr_safe(address, &low, &high))
		return NULL;

	msr = high;
	msr <<= 32;
	msr |= low;

	/* mmconfig is not enable */
	if (!(msr & FAM10H_MMIO_CONF_ENABLE))
		return NULL;

	base = msr & (FAM10H_MMIO_CONF_BASE_MASK<<FAM10H_MMIO_CONF_BASE_SHIFT);

	busnbits = (msr >> FAM10H_MMIO_CONF_BUSRANGE_SHIFT) &
			 FAM10H_MMIO_CONF_BUSRANGE_MASK;

	/*
	 * only handle bus 0 ?
	 * need to skip it
	 */
	if (!busnbits)
		return NULL;

	if (busnbits > 8) {
		segnbits = busnbits - 8;
		busnbits = 8;
	}

226
	end_bus = (1 << busnbits) - 1;
227
	for (i = 0; i < (1 << segnbits); i++)
228 229 230 231 232
		if (pci_mmconfig_add(i, 0, end_bus,
				     base + (1<<28) * i) == NULL) {
			free_all_mmcfg();
			return NULL;
		}
233 234 235 236

	return "AMD Family 10h NB";
}

237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256
static bool __initdata mcp55_checked;
static const char __init *pci_mmcfg_nvidia_mcp55(void)
{
	int bus;
	int mcp55_mmconf_found = 0;

	static const u32 extcfg_regnum		= 0x90;
	static const u32 extcfg_regsize		= 4;
	static const u32 extcfg_enable_mask	= 1<<31;
	static const u32 extcfg_start_mask	= 0xff<<16;
	static const int extcfg_start_shift	= 16;
	static const u32 extcfg_size_mask	= 0x3<<28;
	static const int extcfg_size_shift	= 28;
	static const int extcfg_sizebus[]	= {0x100, 0x80, 0x40, 0x20};
	static const u32 extcfg_base_mask[]	= {0x7ff8, 0x7ffc, 0x7ffe, 0x7fff};
	static const int extcfg_base_lshift	= 25;

	/*
	 * do check if amd fam10h already took over
	 */
257
	if (!acpi_disabled || !list_empty(&pci_mmcfg_list) || mcp55_checked)
258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285
		return NULL;

	mcp55_checked = true;
	for (bus = 0; bus < 256; bus++) {
		u64 base;
		u32 l, extcfg;
		u16 vendor, device;
		int start, size_index, end;

		raw_pci_ops->read(0, bus, PCI_DEVFN(0, 0), 0, 4, &l);
		vendor = l & 0xffff;
		device = (l >> 16) & 0xffff;

		if (PCI_VENDOR_ID_NVIDIA != vendor || 0x0369 != device)
			continue;

		raw_pci_ops->read(0, bus, PCI_DEVFN(0, 0), extcfg_regnum,
				  extcfg_regsize, &extcfg);

		if (!(extcfg & extcfg_enable_mask))
			continue;

		size_index = (extcfg & extcfg_size_mask) >> extcfg_size_shift;
		base = extcfg & extcfg_base_mask[size_index];
		/* base could > 4G */
		base <<= extcfg_base_lshift;
		start = (extcfg & extcfg_start_mask) >> extcfg_start_shift;
		end = start + extcfg_sizebus[size_index] - 1;
286 287
		if (pci_mmconfig_add(0, start, end, base) == NULL)
			continue;
288 289 290 291 292 293 294 295 296
		mcp55_mmconf_found++;
	}

	if (!mcp55_mmconf_found)
		return NULL;

	return "nVidia MCP55";
}

297
struct pci_mmcfg_hostbridge_probe {
298 299
	u32 bus;
	u32 devfn;
300 301 302 303 304
	u32 vendor;
	u32 device;
	const char *(*probe)(void);
};

305
static struct pci_mmcfg_hostbridge_probe pci_mmcfg_probes[] __initdata = {
306 307 308 309 310 311 312 313
	{ 0, PCI_DEVFN(0, 0), PCI_VENDOR_ID_INTEL,
	  PCI_DEVICE_ID_INTEL_E7520_MCH, pci_mmcfg_e7520 },
	{ 0, PCI_DEVFN(0, 0), PCI_VENDOR_ID_INTEL,
	  PCI_DEVICE_ID_INTEL_82945G_HB, pci_mmcfg_intel_945 },
	{ 0, PCI_DEVFN(0x18, 0), PCI_VENDOR_ID_AMD,
	  0x1200, pci_mmcfg_amd_fam10h },
	{ 0xff, PCI_DEVFN(0, 0), PCI_VENDOR_ID_AMD,
	  0x1200, pci_mmcfg_amd_fam10h },
314 315
	{ 0, PCI_DEVFN(0, 0), PCI_VENDOR_ID_NVIDIA,
	  0x0369, pci_mmcfg_nvidia_mcp55 },
316 317
};

318 319
static void __init pci_mmcfg_check_end_bus_number(void)
{
320
	struct pci_mmcfg_region *cfg, *cfgx;
321

322
	/* Fixup overlaps */
323
	list_for_each_entry(cfg, &pci_mmcfg_list, list) {
324 325
		if (cfg->end_bus < cfg->start_bus)
			cfg->end_bus = 255;
326

327 328 329 330
		/* Don't access the list head ! */
		if (cfg->list.next == &pci_mmcfg_list)
			break;

331
		cfgx = list_entry(cfg->list.next, typeof(*cfg), list);
332
		if (cfg->end_bus >= cfgx->start_bus)
333
			cfg->end_bus = cfgx->start_bus - 1;
334 335 336
	}
}

337 338 339
static int __init pci_mmcfg_check_hostbridge(void)
{
	u32 l;
340
	u32 bus, devfn;
341 342 343 344
	u16 vendor, device;
	int i;
	const char *name;

345 346 347
	if (!raw_pci_ops)
		return 0;

348
	free_all_mmcfg();
349

350
	for (i = 0; i < ARRAY_SIZE(pci_mmcfg_probes); i++) {
351 352
		bus =  pci_mmcfg_probes[i].bus;
		devfn = pci_mmcfg_probes[i].devfn;
353
		raw_pci_ops->read(0, bus, devfn, 0, 4, &l);
354 355 356
		vendor = l & 0xffff;
		device = (l >> 16) & 0xffff;

357
		name = NULL;
358 359
		if (pci_mmcfg_probes[i].vendor == vendor &&
		    pci_mmcfg_probes[i].device == device)
360 361
			name = pci_mmcfg_probes[i].probe();

362
		if (name)
363
			pr_info(PREFIX "%s with MMCONFIG support\n", name);
364 365
	}

366 367 368
	/* some end_bus_number is crazy, fix it */
	pci_mmcfg_check_end_bus_number();

369
	return !list_empty(&pci_mmcfg_list);
370 371
}

372
static acpi_status check_mcfg_resource(struct acpi_resource *res, void *data)
373 374 375 376 377 378 379 380 381 382 383
{
	struct resource *mcfg_res = data;
	struct acpi_resource_address64 address;
	acpi_status status;

	if (res->type == ACPI_RESOURCE_TYPE_FIXED_MEMORY32) {
		struct acpi_resource_fixed_memory32 *fixmem32 =
			&res->data.fixed_memory32;
		if (!fixmem32)
			return AE_OK;
		if ((mcfg_res->start >= fixmem32->address) &&
384
		    (mcfg_res->end < (fixmem32->address +
385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400
				      fixmem32->address_length))) {
			mcfg_res->flags = 1;
			return AE_CTRL_TERMINATE;
		}
	}
	if ((res->type != ACPI_RESOURCE_TYPE_ADDRESS32) &&
	    (res->type != ACPI_RESOURCE_TYPE_ADDRESS64))
		return AE_OK;

	status = acpi_resource_to_address64(res, &address);
	if (ACPI_FAILURE(status) ||
	   (address.address_length <= 0) ||
	   (address.resource_type != ACPI_MEMORY_RANGE))
		return AE_OK;

	if ((mcfg_res->start >= address.minimum) &&
401
	    (mcfg_res->end < (address.minimum + address.address_length))) {
402 403 404 405 406 407
		mcfg_res->flags = 1;
		return AE_CTRL_TERMINATE;
	}
	return AE_OK;
}

408 409
static acpi_status find_mboard_resource(acpi_handle handle, u32 lvl,
					void *context, void **rv)
410 411 412 413 414 415 416 417 418 419 420 421
{
	struct resource *mcfg_res = context;

	acpi_walk_resources(handle, METHOD_NAME__CRS,
			    check_mcfg_resource, context);

	if (mcfg_res->flags)
		return AE_CTRL_TERMINATE;

	return AE_OK;
}

422
static int is_acpi_reserved(u64 start, u64 end, unsigned not_used)
423 424 425 426
{
	struct resource mcfg_res;

	mcfg_res.start = start;
427
	mcfg_res.end = end - 1;
428 429 430 431 432 433 434 435 436 437 438
	mcfg_res.flags = 0;

	acpi_get_devices("PNP0C01", find_mboard_resource, &mcfg_res, NULL);

	if (!mcfg_res.flags)
		acpi_get_devices("PNP0C02", find_mboard_resource, &mcfg_res,
				 NULL);

	return mcfg_res.flags;
}

439 440
typedef int (*check_reserved_t)(u64 start, u64 end, unsigned type);

441 442 443
static int __ref is_mmconf_reserved(check_reserved_t is_reserved,
				    struct pci_mmcfg_region *cfg,
				    struct device *dev, int with_e820)
444
{
445 446
	u64 addr = cfg->res.start;
	u64 size = resource_size(&cfg->res);
447
	u64 old_size = size;
448 449
	int num_buses;
	char *method = with_e820 ? "E820" : "ACPI motherboard resources";
450

451
	while (!is_reserved(addr, addr + size, E820_RESERVED)) {
452 453 454 455 456
		size >>= 1;
		if (size < (16UL<<20))
			break;
	}

457 458 459 460 461 462 463
	if (size < (16UL<<20) && size != old_size)
		return 0;

	if (dev)
		dev_info(dev, "MMCONFIG at %pR reserved in %s\n",
			 &cfg->res, method);
	else
464
		pr_info(PREFIX "MMCONFIG at %pR reserved in %s\n",
465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482
		       &cfg->res, method);

	if (old_size != size) {
		/* update end_bus */
		cfg->end_bus = cfg->start_bus + ((size>>20) - 1);
		num_buses = cfg->end_bus - cfg->start_bus + 1;
		cfg->res.end = cfg->res.start +
		    PCI_MMCFG_BUS_OFFSET(num_buses) - 1;
		snprintf(cfg->name, PCI_MMCFG_RESOURCE_NAME_LEN,
			 "PCI MMCONFIG %04x [bus %02x-%02x]",
			 cfg->segment, cfg->start_bus, cfg->end_bus);

		if (dev)
			dev_info(dev,
				"MMCONFIG "
				"at %pR (base %#lx) (size reduced!)\n",
				&cfg->res, (unsigned long) cfg->address);
		else
483
			pr_info(PREFIX
484 485 486 487
				"MMCONFIG for %04x [bus%02x-%02x] "
				"at %pR (base %#lx) (size reduced!)\n",
				cfg->segment, cfg->start_bus, cfg->end_bus,
				&cfg->res, (unsigned long) cfg->address);
488 489
	}

490
	return 1;
491 492
}

493 494
static int __ref pci_mmcfg_check_reserved(struct device *dev,
		  struct pci_mmcfg_region *cfg, int early)
495 496
{
	if (!early && !acpi_disabled) {
497
		if (is_mmconf_reserved(is_acpi_reserved, cfg, dev, 0))
498
			return 1;
499 500 501 502 503 504

		if (dev)
			dev_info(dev, FW_INFO
				 "MMCONFIG at %pR not reserved in "
				 "ACPI motherboard resources\n",
				 &cfg->res);
505
		else
506
			pr_info(FW_INFO PREFIX
507 508 509 510 511
			       "MMCONFIG at %pR not reserved in "
			       "ACPI motherboard resources\n",
			       &cfg->res);
	}

512 513 514 515 516 517 518 519 520
	/*
	 * e820_all_mapped() is marked as __init.
	 * All entries from ACPI MCFG table have been checked at boot time.
	 * For MCFG information constructed from hotpluggable host bridge's
	 * _CBA method, just assume it's reserved.
	 */
	if (pci_mmcfg_running_state)
		return 1;

521 522 523
	/* Don't try to do this check unless configuration
	   type 1 is available. how about type 2 ?*/
	if (raw_pci_ops)
524
		return is_mmconf_reserved(e820_all_mapped, cfg, dev, 1);
525 526 527 528

	return 0;
}

529
static void __init pci_mmcfg_reject_broken(int early)
530
{
531
	struct pci_mmcfg_region *cfg;
532

533
	list_for_each_entry(cfg, &pci_mmcfg_list, list) {
534
		if (pci_mmcfg_check_reserved(NULL, cfg, early) == 0) {
535
			pr_info(PREFIX "not using MMCONFIG\n");
536 537
			free_all_mmcfg();
			return;
538
		}
539 540 541
	}
}

B
Bjorn Helgaas 已提交
542 543
static int __init acpi_mcfg_check_entry(struct acpi_table_mcfg *mcfg,
					struct acpi_mcfg_allocation *cfg)
544
{
B
Bjorn Helgaas 已提交
545 546 547 548 549
	int year;

	if (cfg->address < 0xFFFFFFFF)
		return 0;

550
	if (!strncmp(mcfg->header.oem_id, "SGI", 3))
B
Bjorn Helgaas 已提交
551
		return 0;
552

B
Bjorn Helgaas 已提交
553 554 555 556 557 558
	if (mcfg->header.revision >= 1) {
		if (dmi_get_date(DMI_BIOS_DATE, &year, NULL, NULL) &&
		    year >= 2010)
			return 0;
	}

559
	pr_err(PREFIX "MCFG region for %04x [bus %02x-%02x] at %#llx "
B
Bjorn Helgaas 已提交
560 561 562
	       "is above 4GB, ignored\n", cfg->pci_segment,
	       cfg->start_bus_number, cfg->end_bus_number, cfg->address);
	return -EINVAL;
563 564 565 566 567
}

static int __init pci_parse_mcfg(struct acpi_table_header *header)
{
	struct acpi_table_mcfg *mcfg;
568
	struct acpi_mcfg_allocation *cfg_table, *cfg;
569
	unsigned long i;
570
	int entries;
571 572 573 574 575 576 577

	if (!header)
		return -EINVAL;

	mcfg = (struct acpi_table_mcfg *)header;

	/* how many config structures do we have */
578
	free_all_mmcfg();
579
	entries = 0;
580 581
	i = header->length - sizeof(struct acpi_table_mcfg);
	while (i >= sizeof(struct acpi_mcfg_allocation)) {
582
		entries++;
583
		i -= sizeof(struct acpi_mcfg_allocation);
584
	}
585
	if (entries == 0) {
586
		pr_err(PREFIX "MMCONFIG has no entries\n");
587 588 589
		return -ENODEV;
	}

590
	cfg_table = (struct acpi_mcfg_allocation *) &mcfg[1];
591
	for (i = 0; i < entries; i++) {
592 593
		cfg = &cfg_table[i];
		if (acpi_mcfg_check_entry(mcfg, cfg)) {
594
			free_all_mmcfg();
595 596
			return -ENODEV;
		}
597 598 599

		if (pci_mmconfig_add(cfg->pci_segment, cfg->start_bus_number,
				   cfg->end_bus_number, cfg->address) == NULL) {
600
			pr_warn(PREFIX "no memory for MCFG entries\n");
601 602 603
			free_all_mmcfg();
			return -ENOMEM;
		}
604 605 606 607 608
	}

	return 0;
}

609
static void __init __pci_mmcfg_init(int early)
610
{
611
	pci_mmcfg_reject_broken(early);
612
	if (list_empty(&pci_mmcfg_list))
613 614
		return;

615 616 617 618 619 620 621 622 623 624
	if (pcibios_last_bus < 0) {
		const struct pci_mmcfg_region *cfg;

		list_for_each_entry(cfg, &pci_mmcfg_list, list) {
			if (cfg->segment)
				break;
			pcibios_last_bus = cfg->end_bus;
		}
	}

625
	if (pci_mmcfg_arch_init())
626
		pci_probe = (pci_probe & ~PCI_PROBE_MASK) | PCI_PROBE_MMCONF;
627
	else {
628
		free_all_mmcfg();
629
		pci_mmcfg_arch_init_failed = true;
630 631
	}
}
632

633 634
static int __initdata known_bridge;

635
void __init pci_mmcfg_early_init(void)
Y
Yinghai Lu 已提交
636
{
637 638 639 640 641 642 643
	if (pci_probe & PCI_PROBE_MMCONF) {
		if (pci_mmcfg_check_hostbridge())
			known_bridge = 1;
		else
			acpi_sfi_table_parse(ACPI_SIG_MCFG, pci_parse_mcfg);
		__pci_mmcfg_init(1);
	}
Y
Yinghai Lu 已提交
644 645 646 647
}

void __init pci_mmcfg_late_init(void)
{
648 649 650 651 652 653 654 655 656 657 658 659
	/* MMCONFIG disabled */
	if ((pci_probe & PCI_PROBE_MMCONF) == 0)
		return;

	if (known_bridge)
		return;

	/* MMCONFIG hasn't been enabled yet, try again */
	if (pci_probe & PCI_PROBE_MASK & ~PCI_PROBE_MMCONF) {
		acpi_sfi_table_parse(ACPI_SIG_MCFG, pci_parse_mcfg);
		__pci_mmcfg_init(0);
	}
Y
Yinghai Lu 已提交
660 661
}

662 663
static int __init pci_mmcfg_late_insert_resources(void)
{
664 665
	struct pci_mmcfg_region *cfg;

666 667
	pci_mmcfg_running_state = true;

668 669
	/* If we are not using MMCONFIG, don't insert the resources. */
	if ((pci_probe & PCI_PROBE_MMCONF) == 0)
670 671 672 673 674 675 676
		return 1;

	/*
	 * Attempt to insert the mmcfg resources but not with the busy flag
	 * marked so it won't cause request errors when __request_region is
	 * called.
	 */
677 678 679
	list_for_each_entry(cfg, &pci_mmcfg_list, list)
		if (!cfg->res.parent)
			insert_resource(&iomem_resource, &cfg->res);
680 681 682 683 684 685 686 687 688 689

	return 0;
}

/*
 * Perform MMCONFIG resource insertion after PCI initialization to allow for
 * misprogrammed MCFG tables that state larger sizes but actually conflict
 * with other system resources.
 */
late_initcall(pci_mmcfg_late_insert_resources);
690 691

/* Add MMCFG information for host bridges */
692 693
int pci_mmconfig_insert(struct device *dev, u16 seg, u8 start, u8 end,
			phys_addr_t addr)
694 695 696 697 698 699 700 701
{
	int rc;
	struct resource *tmp = NULL;
	struct pci_mmcfg_region *cfg;

	if (!(pci_probe & PCI_PROBE_MMCONF) || pci_mmcfg_arch_init_failed)
		return -ENODEV;

702
	if (start > end)
703 704 705 706 707 708 709 710 711 712 713 714 715 716 717
		return -EINVAL;

	mutex_lock(&pci_mmcfg_lock);
	cfg = pci_mmconfig_lookup(seg, start);
	if (cfg) {
		if (cfg->end_bus < end)
			dev_info(dev, FW_INFO
				 "MMCONFIG for "
				 "domain %04x [bus %02x-%02x] "
				 "only partially covers this bridge\n",
				  cfg->segment, cfg->start_bus, cfg->end_bus);
		mutex_unlock(&pci_mmcfg_lock);
		return -EEXIST;
	}

718 719 720 721 722
	if (!addr) {
		mutex_unlock(&pci_mmcfg_lock);
		return -EINVAL;
	}

723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786
	rc = -EBUSY;
	cfg = pci_mmconfig_alloc(seg, start, end, addr);
	if (cfg == NULL) {
		dev_warn(dev, "fail to add MMCONFIG (out of memory)\n");
		rc = -ENOMEM;
	} else if (!pci_mmcfg_check_reserved(dev, cfg, 0)) {
		dev_warn(dev, FW_BUG "MMCONFIG %pR isn't reserved\n",
			 &cfg->res);
	} else {
		/* Insert resource if it's not in boot stage */
		if (pci_mmcfg_running_state)
			tmp = insert_resource_conflict(&iomem_resource,
						       &cfg->res);

		if (tmp) {
			dev_warn(dev,
				 "MMCONFIG %pR conflicts with "
				 "%s %pR\n",
				 &cfg->res, tmp->name, tmp);
		} else if (pci_mmcfg_arch_map(cfg)) {
			dev_warn(dev, "fail to map MMCONFIG %pR.\n",
				 &cfg->res);
		} else {
			list_add_sorted(cfg);
			dev_info(dev, "MMCONFIG at %pR (base %#lx)\n",
				 &cfg->res, (unsigned long)addr);
			cfg = NULL;
			rc = 0;
		}
	}

	if (cfg) {
		if (cfg->res.parent)
			release_resource(&cfg->res);
		kfree(cfg);
	}

	mutex_unlock(&pci_mmcfg_lock);

	return rc;
}

/* Delete MMCFG information for host bridges */
int pci_mmconfig_delete(u16 seg, u8 start, u8 end)
{
	struct pci_mmcfg_region *cfg;

	mutex_lock(&pci_mmcfg_lock);
	list_for_each_entry_rcu(cfg, &pci_mmcfg_list, list)
		if (cfg->segment == seg && cfg->start_bus == start &&
		    cfg->end_bus == end) {
			list_del_rcu(&cfg->list);
			synchronize_rcu();
			pci_mmcfg_arch_unmap(cfg);
			if (cfg->res.parent)
				release_resource(&cfg->res);
			mutex_unlock(&pci_mmcfg_lock);
			kfree(cfg);
			return 0;
		}
	mutex_unlock(&pci_mmcfg_lock);

	return -ENOENT;
}