acpi.c 25.7 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 *  acpi.c - Architecture-Specific Low-Level ACPI Support
 *
 *  Copyright (C) 1999 VA Linux Systems
 *  Copyright (C) 1999,2000 Walt Drummond <drummond@valinux.com>
 *  Copyright (C) 2000, 2002-2003 Hewlett-Packard Co.
 *	David Mosberger-Tang <davidm@hpl.hp.com>
 *  Copyright (C) 2000 Intel Corp.
 *  Copyright (C) 2000,2001 J.I. Lee <jung-ik.lee@intel.com>
 *  Copyright (C) 2001 Paul Diefenbaugh <paul.s.diefenbaugh@intel.com>
 *  Copyright (C) 2001 Jenna Hall <jenna.s.hall@intel.com>
 *  Copyright (C) 2001 Takayoshi Kochi <t-kochi@bq.jp.nec.com>
 *  Copyright (C) 2002 Erich Focht <efocht@ess.nec.de>
14
 *  Copyright (C) 2004 Ashok Raj <ashok.raj@intel.com>
L
Linus Torvalds 已提交
15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46
 *
 * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; either version 2 of the License, or
 *  (at your option) any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, write to the Free Software
 *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 *
 * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 */

#include <linux/module.h>
#include <linux/init.h>
#include <linux/kernel.h>
#include <linux/sched.h>
#include <linux/smp.h>
#include <linux/string.h>
#include <linux/types.h>
#include <linux/irq.h>
#include <linux/acpi.h>
#include <linux/efi.h>
#include <linux/mmzone.h>
#include <linux/nodemask.h>
47
#include <linux/slab.h>
48
#include <acpi/processor.h>
L
Linus Torvalds 已提交
49 50 51 52 53 54 55 56
#include <asm/io.h>
#include <asm/iosapic.h>
#include <asm/machvec.h>
#include <asm/page.h>
#include <asm/system.h>
#include <asm/numa.h>
#include <asm/sal.h>
#include <asm/cyclone.h>
57
#include <asm/xen/hypervisor.h>
L
Linus Torvalds 已提交
58 59 60

/*
 * BAD_MADT_ENTRY - sanity-check a MADT subtable entry before it is used.
 * @entry: pointer to the typed subtable structure (may be NULL)
 * @end:   address just past the end of the table, as an unsigned long
 *
 * Evaluates to non-zero when @entry is NULL, when the structure would run
 * past @end, or when the length stored in the subtable header is smaller
 * than the structure the caller is about to read.
 *
 * Both arguments are parenthesised so that arbitrary expressions (for
 * example a conditional expression for @end) expand correctly.  Note that
 * @entry is still evaluated more than once: do not pass an expression with
 * side effects.
 */
#define BAD_MADT_ENTRY(entry, end) (                                        \
		(!(entry)) ||                                               \
		(unsigned long)(entry) + sizeof(*(entry)) > (end) ||        \
		((struct acpi_subtable_header *)(entry))->length < sizeof(*(entry)))
L
Linus Torvalds 已提交
62 63 64

#define PREFIX			"ACPI: "

65
u32 acpi_rsdt_forced;
66 67 68
unsigned int acpi_cpei_override;
unsigned int acpi_cpei_phys_cpuid;

69 70
unsigned long acpi_wakeup_address = 0;

71 72 73 74 75 76 77 78 79 80 81 82 83
#ifdef CONFIG_IA64_GENERIC
/*
 * Look up the ACPI 2.0 RSDP in the EFI table addresses.
 *
 * Returns the physical address stored in efi.acpi20, or 0 when that entry
 * is invalid.  If only the older efi.acpi entry is valid a warning is
 * printed and 0 is still returned.
 */
static unsigned long __init acpi_find_rsdp(void)
{
	if (efi.acpi20 != EFI_INVALID_TABLE_ADDR)
		return efi.acpi20;

	if (efi.acpi != EFI_INVALID_TABLE_ADDR)
		printk(KERN_WARNING PREFIX
		       "v1.0/r0.71 tables no longer supported\n");

	return 0;
}

84 85
/*
 * Choose a platform name string from the ACPI tables.
 *
 * The RSDP and XSDT signatures are validated first; any failure falls back
 * to "dig".  After that the XSDT header's OEM id selects "hpzx1", "uv",
 * "sn2" or "xen".  With CONFIG_INTEL_IOMMU, the presence of a DMAR table
 * among the XSDT entries selects "dig_vtd".  Otherwise "dig" is returned.
 */
const char __init *
acpi_get_sysname(void)
{
	struct acpi_table_rsdp *root;
	struct acpi_table_xsdt *xsdt;
	struct acpi_table_header *tbl;
	unsigned long root_phys;
#ifdef CONFIG_INTEL_IOMMU
	u64 idx, count;
#endif

	root_phys = acpi_find_rsdp();
	if (!root_phys) {
		printk(KERN_ERR
		       "ACPI 2.0 RSDP not found, default to \"dig\"\n");
		return "dig";
	}

	root = (struct acpi_table_rsdp *)__va(root_phys);
	if (strncmp(root->signature, ACPI_SIG_RSDP,
		    sizeof(ACPI_SIG_RSDP) - 1) != 0) {
		printk(KERN_ERR
		       "ACPI 2.0 RSDP signature incorrect, default to \"dig\"\n");
		return "dig";
	}

	xsdt = (struct acpi_table_xsdt *)__va(root->xsdt_physical_address);
	tbl = &xsdt->header;
	if (strncmp(tbl->signature, ACPI_SIG_XSDT,
		    sizeof(ACPI_SIG_XSDT) - 1) != 0) {
		printk(KERN_ERR
		       "ACPI 2.0 XSDT signature incorrect, default to \"dig\"\n");
		return "dig";
	}

	/* Vendor-specific platforms, keyed on the XSDT OEM id. */
	if (strcmp(tbl->oem_id, "HP") == 0)
		return "hpzx1";

	if (strcmp(tbl->oem_id, "SGI") == 0)
		return strcmp(tbl->oem_table_id + 4, "UV") == 0 ? "uv" : "sn2";

	if (xen_pv_domain() && strcmp(tbl->oem_id, "XEN") == 0)
		return "xen";

#ifdef CONFIG_INTEL_IOMMU
	/* Look for Intel IOMMU */
	count = (tbl->length - sizeof(*tbl)) /
			 sizeof(xsdt->table_offset_entry[0]);
	for (idx = 0; idx < count; idx++) {
		tbl = __va(xsdt->table_offset_entry[idx]);
		if (!strncmp(tbl->signature, ACPI_SIG_DMAR,
			     sizeof(ACPI_SIG_DMAR) - 1))
			return "dig_vtd";
	}
#endif

	return "dig";
}
142
#endif /* CONFIG_IA64_GENERIC */
L
Linus Torvalds 已提交
143 144 145 146 147 148 149 150 151 152 153 154 155 156

/* Number of slots in platform_intr_list[]; valid interrupt types are 0..255. */
#define ACPI_MAX_PLATFORM_INTERRUPTS	256

/*
 * Array to record platform interrupt vectors for generic interrupt routing.
 * Indexed by platform interrupt type; every slot starts out as -1 and is
 * filled in by acpi_parse_plat_int_src().
 */
int platform_intr_list[ACPI_MAX_PLATFORM_INTERRUPTS] = {
	[0 ... ACPI_MAX_PLATFORM_INTERRUPTS - 1] = -1
};

/* Interrupt model in use; acpi_register_gsi() special-cases ACPI_IRQ_MODEL_PLATFORM. */
enum acpi_irq_model_id acpi_irq_model = ACPI_IRQ_MODEL_IOSAPIC;

/*
 * Interrupt routing API for device drivers.  Provides interrupt vector for
 * a generic platform event.  Currently only CPEI is implemented.
 */
L
Len Brown 已提交
157
/*
 * Return the vector recorded in platform_intr_list[] for @int_type.
 *
 * Returns -1 (after logging an error) when @int_type is outside the table;
 * a slot that was never filled in also reads back as -1.
 */
int acpi_request_vector(u32 int_type)
{
	if (int_type >= ACPI_MAX_PLATFORM_INTERRUPTS) {
		printk(KERN_ERR
		       "acpi_request_vector(): invalid interrupt type\n");
		return -1;
	}

	/* corrected platform error interrupt */
	return platform_intr_list[int_type];
}

170
/*
 * Translate the physical address of an ACPI table into a kernel virtual
 * address with __va().  @size is not used.
 */
char *__init __acpi_map_table(unsigned long phys_addr, unsigned long size)
{
	char *virt = __va(phys_addr);

	return virt;
}

Y
Yinghai Lu 已提交
175
/* Counterpart of __acpi_map_table(); intentionally does nothing. */
void __init __acpi_unmap_table(char *map, unsigned long size)
{
	/* __acpi_map_table() only applies __va(), so nothing is released here. */
}

L
Linus Torvalds 已提交
179 180 181 182
/* --------------------------------------------------------------------------
                            Boot-time Table Parsing
   -------------------------------------------------------------------------- */

L
Len Brown 已提交
183 184 185
/* Count of enabled local SAPIC entries seen by acpi_parse_lsapic(). */
static int available_cpus __initdata;
/* The MADT, as recorded by acpi_parse_madt(). */
struct acpi_table_madt *acpi_madt __initdata;
/* Set in acpi_parse_madt(); not __initdata because it is read after free_initmem(). */
static u8 has_8259;
L
Linus Torvalds 已提交
186 187

static int __init
188
acpi_parse_lapic_addr_ovr(struct acpi_subtable_header * header,
L
Len Brown 已提交
189
			  const unsigned long end)
L
Linus Torvalds 已提交
190
{
191
	struct acpi_madt_local_apic_override *lapic;
L
Linus Torvalds 已提交
192

193
	lapic = (struct acpi_madt_local_apic_override *)header;
L
Linus Torvalds 已提交
194 195 196 197 198 199 200 201 202 203 204 205

	if (BAD_MADT_ENTRY(lapic, end))
		return -EINVAL;

	if (lapic->address) {
		iounmap(ipi_base_addr);
		ipi_base_addr = ioremap(lapic->address, 0);
	}
	return 0;
}

static int __init
206
acpi_parse_lsapic(struct acpi_subtable_header * header, const unsigned long end)
L
Linus Torvalds 已提交
207
{
208
	struct acpi_madt_local_sapic *lsapic;
L
Linus Torvalds 已提交
209

210
	lsapic = (struct acpi_madt_local_sapic *)header;
L
Linus Torvalds 已提交
211

212
	/*Skip BAD_MADT_ENTRY check, as lsapic size could vary */
L
Linus Torvalds 已提交
213

214
	if (lsapic->lapic_flags & ACPI_MADT_ENABLED) {
L
Linus Torvalds 已提交
215
#ifdef CONFIG_SMP
L
Len Brown 已提交
216 217
		smp_boot_data.cpu_phys_id[available_cpus] =
		    (lsapic->id << 8) | lsapic->eid;
L
Linus Torvalds 已提交
218 219 220 221 222 223 224 225 226
#endif
		++available_cpus;
	}

	total_cpus++;
	return 0;
}

static int __init
227
acpi_parse_lapic_nmi(struct acpi_subtable_header * header, const unsigned long end)
L
Linus Torvalds 已提交
228
{
229
	struct acpi_madt_local_apic_nmi *lacpi_nmi;
L
Linus Torvalds 已提交
230

231
	lacpi_nmi = (struct acpi_madt_local_apic_nmi *)header;
L
Linus Torvalds 已提交
232 233 234 235 236 237 238 239 240

	if (BAD_MADT_ENTRY(lacpi_nmi, end))
		return -EINVAL;

	/* TBD: Support lapic_nmi entries */
	return 0;
}

static int __init
241
acpi_parse_iosapic(struct acpi_subtable_header * header, const unsigned long end)
L
Linus Torvalds 已提交
242
{
243
	struct acpi_madt_io_sapic *iosapic;
L
Linus Torvalds 已提交
244

245
	iosapic = (struct acpi_madt_io_sapic *)header;
L
Linus Torvalds 已提交
246 247 248 249

	if (BAD_MADT_ENTRY(iosapic, end))
		return -EINVAL;

250
	return iosapic_init(iosapic->address, iosapic->global_irq_base);
L
Linus Torvalds 已提交
251 252
}

L
Len Brown 已提交
253 254
/* Revision field of the MADT header, stored by acpi_parse_madt(). */
static unsigned int __initdata acpi_madt_rev;

L
Linus Torvalds 已提交
255
static int __init
256
acpi_parse_plat_int_src(struct acpi_subtable_header * header,
L
Len Brown 已提交
257
			const unsigned long end)
L
Linus Torvalds 已提交
258
{
259
	struct acpi_madt_interrupt_source *plintsrc;
L
Linus Torvalds 已提交
260 261
	int vector;

262
	plintsrc = (struct acpi_madt_interrupt_source *)header;
L
Linus Torvalds 已提交
263 264 265 266 267 268 269 270 271 272

	if (BAD_MADT_ENTRY(plintsrc, end))
		return -EINVAL;

	/*
	 * Get vector assignment for this interrupt, set attributes,
	 * and program the IOSAPIC routing table.
	 */
	vector = iosapic_register_platform_intr(plintsrc->type,
						plintsrc->global_irq,
273
						plintsrc->io_sapic_vector,
L
Linus Torvalds 已提交
274 275
						plintsrc->eid,
						plintsrc->id,
276 277 278 279 280 281
						((plintsrc->inti_flags & ACPI_MADT_POLARITY_MASK) ==
						 ACPI_MADT_POLARITY_ACTIVE_HIGH) ?
						IOSAPIC_POL_HIGH : IOSAPIC_POL_LOW,
						((plintsrc->inti_flags & ACPI_MADT_TRIGGER_MASK) ==
						 ACPI_MADT_TRIGGER_EDGE) ?
						IOSAPIC_EDGE : IOSAPIC_LEVEL);
L
Linus Torvalds 已提交
282 283

	platform_intr_list[plintsrc->type] = vector;
284
	if (acpi_madt_rev > 1) {
285
		acpi_cpei_override = plintsrc->flags & ACPI_MADT_CPEI_OVERRIDE;
286 287 288 289 290 291 292
	}

	/*
	 * Save the physical id, so we can check when its being removed
	 */
	acpi_cpei_phys_cpuid = ((plintsrc->id << 8) | (plintsrc->eid)) & 0xffff;

L
Linus Torvalds 已提交
293 294 295
	return 0;
}

296
#ifdef CONFIG_HOTPLUG_CPU
297 298 299
unsigned int can_cpei_retarget(void)
{
	extern int cpe_vector;
A
Ashok Raj 已提交
300
	extern unsigned int force_cpei_retarget;
301 302 303 304 305 306

	/*
	 * Only if CPEI is supported and the override flag
	 * is present, otherwise return that its re-targettable
	 * if we are in polling mode.
	 */
A
Ashok Raj 已提交
307 308 309 310 311 312 313
	if (cpe_vector > 0) {
		if (acpi_cpei_override || force_cpei_retarget)
			return 1;
		else
			return 0;
	}
	return 1;
314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331
}

/*
 * Return 1 when logical CPU @cpu is the one whose physical id is stored
 * in acpi_cpei_phys_cpuid, 0 otherwise.
 */
unsigned int is_cpu_cpei_target(unsigned int cpu)
{
	unsigned int target = cpu_logical_id(acpi_cpei_phys_cpuid);

	return target == cpu;
}

/* Record the physical id of logical CPU @cpu as the CPEI target. */
void set_cpei_target_cpu(unsigned int cpu)
{
	acpi_cpei_phys_cpuid = cpu_physical_id(cpu);
}
332
#endif
333 334 335 336 337 338

/* Return the stored CPEI target; note this is a physical CPU id, not a logical one. */
unsigned int get_cpei_target_cpu(void)
{
	return acpi_cpei_phys_cpuid;
}

L
Linus Torvalds 已提交
339
static int __init
340
acpi_parse_int_src_ovr(struct acpi_subtable_header * header,
L
Len Brown 已提交
341
		       const unsigned long end)
L
Linus Torvalds 已提交
342
{
343
	struct acpi_madt_interrupt_override *p;
L
Linus Torvalds 已提交
344

345
	p = (struct acpi_madt_interrupt_override *)header;
L
Linus Torvalds 已提交
346 347 348 349

	if (BAD_MADT_ENTRY(p, end))
		return -EINVAL;

350 351
	iosapic_override_isa_irq(p->source_irq, p->global_irq,
				 ((p->inti_flags & ACPI_MADT_POLARITY_MASK) ==
352 353
				  ACPI_MADT_POLARITY_ACTIVE_LOW) ?
				 IOSAPIC_POL_LOW : IOSAPIC_POL_HIGH,
354
				 ((p->inti_flags & ACPI_MADT_TRIGGER_MASK) ==
355 356
				 ACPI_MADT_TRIGGER_LEVEL) ?
				 IOSAPIC_LEVEL : IOSAPIC_EDGE);
L
Linus Torvalds 已提交
357 358 359 360
	return 0;
}

static int __init
361
acpi_parse_nmi_src(struct acpi_subtable_header * header, const unsigned long end)
L
Linus Torvalds 已提交
362
{
363
	struct acpi_madt_nmi_source *nmi_src;
L
Linus Torvalds 已提交
364

365
	nmi_src = (struct acpi_madt_nmi_source *)header;
L
Linus Torvalds 已提交
366 367 368 369 370 371 372 373

	if (BAD_MADT_ENTRY(nmi_src, end))
		return -EINVAL;

	/* TBD: Support nimsrc entries */
	return 0;
}

L
Len Brown 已提交
374
/*
 * Apply an OEM quirk based on the MADT header: when the OEM id starts
 * with "IBM" and the OEM table id starts with "SERMOW", set the ITC drift
 * platform feature and call cyclone_setup().
 */
static void __init acpi_madt_oem_check(char *oem_id, char *oem_table_id)
{
	if (strncmp(oem_id, "IBM", 3) != 0)
		return;
	if (strncmp(oem_table_id, "SERMOW", 6) != 0)
		return;

	/*
	 * Unfortunately ITC_DRIFT is not yet part of the
	 * official SAL spec, so the ITC_DRIFT bit is not
	 * set by the BIOS on this hardware.
	 */
	sal_platform_features |= IA64_SAL_PLATFORM_FEATURE_ITC_DRIFT;

	cyclone_setup();
}

389
/*
 * Table handler for the MADT.
 *
 * Stores the table pointer and its revision, determines has_8259 and
 * passes it to iosapic_system_init(), maps the address given in the MADT
 * into ipi_base_addr when it is non-zero, and runs the OEM quirk check.
 * Returns -EINVAL when @table is NULL, 0 otherwise.
 */
static int __init acpi_parse_madt(struct acpi_table_header *table)
{
	struct acpi_table_madt *madt;

	if (!table)
		return -EINVAL;

	madt = (struct acpi_table_madt *)table;
	acpi_madt = madt;
	acpi_madt_rev = madt->header.revision;

	/* remember the value for reference after free_initmem() */
#ifdef CONFIG_ITANIUM
	has_8259 = 1;		/* Firmware on old Itanium systems is broken */
#else
	has_8259 = madt->flags & ACPI_MADT_PCAT_COMPAT;
#endif
	iosapic_system_init(has_8259);

	/* Get base address of IPI Message Block */
	if (madt->address)
		ipi_base_addr = ioremap(madt->address, 0);

	printk(KERN_INFO PREFIX "Local APIC address %p\n", ipi_base_addr);

	acpi_madt_oem_check(madt->header.oem_id, madt->header.oem_table_id);

	return 0;
}

#ifdef CONFIG_ACPI_NUMA

#undef SLIT_DEBUG

#define PXM_FLAG_LEN ((MAX_PXM_DOMAINS + 1)/32)

L
Len Brown 已提交
425
static int __initdata srat_num_cpus;	/* number of cpus */
L
Linus Torvalds 已提交
426 427 428 429
static u32 __devinitdata pxm_flag[PXM_FLAG_LEN];
#define pxm_bit_set(bit)	(set_bit(bit,(void *)pxm_flag))
#define pxm_bit_test(bit)	(test_bit(bit,(void *)pxm_flag))
static struct acpi_table_slit __initdata *slit_table;
430
cpumask_t early_cpu_possible_map = CPU_MASK_NONE;
L
Linus Torvalds 已提交
431

432 433
/*
 * Extract the proximity domain from an SRAT cpu affinity entry.
 *
 * The low byte is always used; the first high byte is added on "sn2"
 * platforms or when the SRAT revision is 2 or later.
 */
static int __init
get_processor_proximity_domain(struct acpi_srat_cpu_affinity *pa)
{
	int domain = pa->proximity_domain_lo;

	if (!ia64_platform_is("sn2") && acpi_srat_revision < 2)
		return domain;

	return domain + (pa->proximity_domain_hi[0] << 8);
}

443 444
/*
 * Extract the proximity domain from an SRAT memory affinity entry.
 *
 * The value is truncated to its low 8 bits unless the platform is "sn2"
 * or the SRAT revision is 2 or later.
 */
static int __init
get_memory_proximity_domain(struct acpi_srat_mem_affinity *ma)
{
	int domain = ma->proximity_domain;
	int narrow = !ia64_platform_is("sn2") && acpi_srat_revision <= 1;

	return narrow ? (domain & 0xff) : domain;
}

L
Linus Torvalds 已提交
455 456 457 458
/*
 * ACPI 2.0 SLIT (System Locality Information Table)
 * http://devresource.hp.com/devresource/Docs/TechPapers/IA64/slit.pdf
 */
L
Len Brown 已提交
459
/*
 * Accept a SLIT for later use by acpi_numa_arch_fixup().
 *
 * The table is only remembered when its header length equals the size
 * implied by locality_count (header + 8 + count * count); otherwise an
 * error is logged and the table is ignored.
 */
void __init acpi_numa_slit_init(struct acpi_table_slit *slit)
{
	u32 expected = sizeof(struct acpi_table_header) + 8
	    + slit->locality_count * slit->locality_count;

	if (slit->header.length == expected) {
		slit_table = slit;
		return;
	}

	printk(KERN_ERR
	       "ACPI 2.0 SLIT: size mismatch: %d expected, %d actual\n",
	       expected, slit->header.length);
}

void __init
475
acpi_numa_processor_affinity_init(struct acpi_srat_cpu_affinity *pa)
L
Linus Torvalds 已提交
476
{
477 478
	int pxm;

479
	if (!(pa->flags & ACPI_SRAT_CPU_ENABLED))
480 481
		return;

482 483
	if (srat_num_cpus >= ARRAY_SIZE(node_cpuid)) {
		printk_once(KERN_WARNING
484
			    "node_cpuid[%ld] is too small, may not be able to use all cpus\n",
485 486 487
			    ARRAY_SIZE(node_cpuid));
		return;
	}
488 489
	pxm = get_processor_proximity_domain(pa);

L
Linus Torvalds 已提交
490
	/* record this node in proximity bitmap */
491
	pxm_bit_set(pxm);
L
Linus Torvalds 已提交
492

L
Len Brown 已提交
493
	node_cpuid[srat_num_cpus].phys_id =
494
	    (pa->apic_id << 8) | (pa->local_sapic_eid);
L
Linus Torvalds 已提交
495
	/* nid should be overridden as logical node id later */
496
	node_cpuid[srat_num_cpus].nid = pxm;
497
	cpu_set(srat_num_cpus, early_cpu_possible_map);
L
Linus Torvalds 已提交
498 499 500 501
	srat_num_cpus++;
}

void __init
502
acpi_numa_memory_affinity_init(struct acpi_srat_mem_affinity *ma)
L
Linus Torvalds 已提交
503 504
{
	unsigned long paddr, size;
505
	int pxm;
L
Linus Torvalds 已提交
506 507
	struct node_memblk_s *p, *q, *pend;

508
	pxm = get_memory_proximity_domain(ma);
L
Linus Torvalds 已提交
509 510

	/* fill node memory chunk structure */
511 512
	paddr = ma->base_address;
	size = ma->length;
L
Linus Torvalds 已提交
513 514

	/* Ignore disabled entries */
515
	if (!(ma->flags & ACPI_SRAT_MEM_ENABLED))
L
Linus Torvalds 已提交
516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536
		return;

	/* record this node in proximity bitmap */
	pxm_bit_set(pxm);

	/* Insertion sort based on base address */
	pend = &node_memblk[num_node_memblks];
	for (p = &node_memblk[0]; p < pend; p++) {
		if (paddr < p->start_paddr)
			break;
	}
	if (p < pend) {
		for (q = pend - 1; q >= p; q--)
			*(q + 1) = *q;
	}
	p->start_paddr = paddr;
	p->size = size;
	p->nid = pxm;
	num_node_memblks++;
}

L
Len Brown 已提交
537
/*
 * Finish NUMA setup once the SRAT/SLIT handlers have run.
 *
 * Brings online the nodes for every proximity domain that was seen,
 * rewrites the proximity domains stored in node_memblk[] and node_cpuid[]
 * into logical node ids, numbers the memory banks on each node, and fills
 * in the node distance matrix, from the SLIT when one was accepted and
 * with LOCAL/REMOTE defaults otherwise.
 */
void __init acpi_numa_arch_fixup(void)
{
	int i, j, node_from, node_to;

	/* If there's no SRAT, fix the phys_id and mark node 0 online */
	if (!srat_num_cpus) {
		node_set_online(0);
		node_cpuid[0].phys_id = hard_smp_processor_id();
		return;
	}

	/*
	 * MCD - This can probably be dropped now.  No need for pxm ID to node ID
	 * mapping with sparse node numbering iff MAX_PXM_DOMAINS <= MAX_NUMNODES.
	 */
	nodes_clear(node_online_map);
	for (i = 0; i < MAX_PXM_DOMAINS; i++) {
		int nid;

		if (!pxm_bit_test(i))
			continue;
		nid = acpi_map_pxm_to_node(i);
		node_set_online(nid);
	}

	/* set logical node id in memory chunk structure */
	for (i = 0; i < num_node_memblks; i++)
		node_memblk[i].nid = pxm_to_node(node_memblk[i].nid);

	/* assign memory bank numbers for each chunk on each node */
	for_each_online_node(i) {
		int bank = 0;

		for (j = 0; j < num_node_memblks; j++) {
			if (node_memblk[j].nid != i)
				continue;
			node_memblk[j].bank = bank++;
		}
	}

	/* set logical node id in cpu structure */
	for_each_possible_early_cpu(i)
		node_cpuid[i].nid = pxm_to_node(node_cpuid[i].nid);

	printk(KERN_INFO "Number of logical nodes in system = %d\n",
	       num_online_nodes());
	printk(KERN_INFO "Number of memory chunks in system = %d\n",
	       num_node_memblks);

	/* No SLIT: fall back to a uniform local/remote distance matrix. */
	if (!slit_table) {
		for (i = 0; i < MAX_NUMNODES; i++) {
			for (j = 0; j < MAX_NUMNODES; j++) {
				if (i == j)
					node_distance(i, j) = LOCAL_DISTANCE;
				else
					node_distance(i, j) = REMOTE_DISTANCE;
			}
		}
		return;
	}

	/* Copy the SLIT entries for the proximity domains that are in use. */
	memset(numa_slit, -1, sizeof(numa_slit));
	for (i = 0; i < slit_table->locality_count; i++) {
		if (!pxm_bit_test(i))
			continue;
		node_from = pxm_to_node(i);
		for (j = 0; j < slit_table->locality_count; j++) {
			if (!pxm_bit_test(j))
				continue;
			node_to = pxm_to_node(j);
			node_distance(node_from, node_to) =
			    slit_table->entry[i * slit_table->locality_count + j];
		}
	}

#ifdef SLIT_DEBUG
	printk("ACPI 2.0 SLIT locality table:\n");
	for_each_online_node(i) {
		for_each_online_node(j)
		    printk("%03d ", node_distance(i, j));
		printk("\n");
	}
#endif
}
L
Len Brown 已提交
614
#endif				/* CONFIG_ACPI_NUMA */
L
Linus Torvalds 已提交
615

616 617 618 619
/*
 * success: return IRQ number (>=0)
 * failure: return < 0
 */
620
/*
 * Register a GSI and return the IRQ to use for it.
 *
 * With the platform IRQ model the GSI is returned unchanged.  When an
 * 8259 is present, GSIs below 16 are translated with
 * isa_irq_to_vector().  Everything else is registered with the IOSAPIC
 * using the requested polarity and trigger mode.  @dev is not used.
 */
int acpi_register_gsi(struct device *dev, u32 gsi, int triggering, int polarity)
{
	int active_high = polarity == ACPI_ACTIVE_HIGH;
	int edge = triggering == ACPI_EDGE_SENSITIVE;

	if (acpi_irq_model == ACPI_IRQ_MODEL_PLATFORM)
		return gsi;

	if (has_8259 && gsi < 16)
		return isa_irq_to_vector(gsi);

	return iosapic_register_intr(gsi,
				     active_high ?
				     IOSAPIC_POL_HIGH : IOSAPIC_POL_LOW,
				     edge ?
				     IOSAPIC_EDGE : IOSAPIC_LEVEL);
}
L
Len Brown 已提交
636 637

/*
 * Undo acpi_register_gsi().  Nothing is done for the cases in which
 * acpi_register_gsi() did not go through the IOSAPIC: the platform IRQ
 * model, and GSIs below 16 when an 8259 is present.
 */
void acpi_unregister_gsi(u32 gsi)
{
	int skip = acpi_irq_model == ACPI_IRQ_MODEL_PLATFORM ||
		   (has_8259 && gsi < 16);

	if (!skip)
		iosapic_unregister_intr(gsi);
}
L
Len Brown 已提交
647

648
/*
 * Table handler for the FADT: registers the SCI interrupt as a
 * level-triggered, active-low GSI.
 *
 * Returns -EINVAL when @table is NULL, -ENODEV when the table revision
 * is not 3, and 0 otherwise.
 */
static int __init acpi_parse_fadt(struct acpi_table_header *table)
{
	struct acpi_table_fadt *fadt;

	if (!table)
		return -EINVAL;

	if (table->revision != 3)
		return -ENODEV;	/* Only deal with ACPI 2.0 FADT */

	fadt = (struct acpi_table_fadt *)table;
	acpi_register_gsi(NULL, fadt->sci_interrupt, ACPI_LEVEL_SENSITIVE,
			  ACPI_ACTIVE_LOW);
	return 0;
}

667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685
/*
 * Early pass over the MADT that only counts CPUs.
 *
 * Parses the MADT header and its local SAPIC entries, which fills in
 * available_cpus, total_cpus and (on SMP) smp_boot_data.  When no enabled
 * CPU was found on an SMP kernel, the boot CPU is recorded as the only
 * one.  Always returns 0.
 */
int __init early_acpi_boot_init(void)
{
	int nr_lsapic;

	/*
	 * do a partial walk of MADT to determine how many CPUs
	 * we have including offline CPUs
	 */
	if (acpi_table_parse(ACPI_SIG_MADT, acpi_parse_madt) != 0) {
		printk(KERN_ERR PREFIX "Can't find MADT\n");
		return 0;
	}

	nr_lsapic = acpi_table_parse_madt(ACPI_MADT_TYPE_LOCAL_SAPIC,
					  acpi_parse_lsapic, NR_CPUS);
	if (nr_lsapic < 1)
		printk(KERN_ERR PREFIX
		       "Error parsing MADT - no LAPIC entries\n");

#ifdef CONFIG_SMP
	if (!available_cpus) {
		printk(KERN_INFO "ACPI: Found 0 CPUS; assuming 1\n");
		printk(KERN_INFO "CPU 0 (0x%04x)", hard_smp_processor_id());
		/* available_cpus is 0 here, so this fills the first slot. */
		smp_boot_data.cpu_phys_id[0] = hard_smp_processor_id();
		available_cpus = 1;	/* We've got at least one of these, no? */
	}
	smp_boot_data.cpu_count = available_cpus;
#endif
	/* Make boot-up look pretty */
	printk(KERN_INFO "%d CPUs available, %d CPUs total\n", available_cpus,
	       total_cpus);

	return 0;
}

L
Len Brown 已提交
703
int __init acpi_boot_init(void)
L
Linus Torvalds 已提交
704 705 706 707 708 709 710 711 712 713
{

	/*
	 * MADT
	 * ----
	 * Parse the Multiple APIC Description Table (MADT), if exists.
	 * Note that this table provides platform SMP configuration
	 * information -- the successor to MPS tables.
	 */

714
	if (acpi_table_parse(ACPI_SIG_MADT, acpi_parse_madt)) {
L
Linus Torvalds 已提交
715 716 717 718 719 720
		printk(KERN_ERR PREFIX "Can't find MADT\n");
		goto skip_madt;
	}

	/* Local APIC */

L
Len Brown 已提交
721
	if (acpi_table_parse_madt
722
	    (ACPI_MADT_TYPE_LOCAL_APIC_OVERRIDE, acpi_parse_lapic_addr_ovr, 0) < 0)
L
Len Brown 已提交
723 724
		printk(KERN_ERR PREFIX
		       "Error parsing LAPIC address override entry\n");
L
Linus Torvalds 已提交
725

726
	if (acpi_table_parse_madt(ACPI_MADT_TYPE_LOCAL_APIC_NMI, acpi_parse_lapic_nmi, 0)
L
Len Brown 已提交
727
	    < 0)
L
Linus Torvalds 已提交
728 729 730 731
		printk(KERN_ERR PREFIX "Error parsing LAPIC NMI entry\n");

	/* I/O APIC */

L
Len Brown 已提交
732
	if (acpi_table_parse_madt
733 734 735 736 737
	    (ACPI_MADT_TYPE_IO_SAPIC, acpi_parse_iosapic, NR_IOSAPICS) < 1) {
		if (!ia64_platform_is("sn2"))
			printk(KERN_ERR PREFIX
			       "Error parsing MADT - no IOSAPIC entries\n");
	}
L
Linus Torvalds 已提交
738 739 740

	/* System-Level Interrupt Routing */

L
Len Brown 已提交
741
	if (acpi_table_parse_madt
742
	    (ACPI_MADT_TYPE_INTERRUPT_SOURCE, acpi_parse_plat_int_src,
L
Len Brown 已提交
743 744 745
	     ACPI_MAX_PLATFORM_INTERRUPTS) < 0)
		printk(KERN_ERR PREFIX
		       "Error parsing platform interrupt source entry\n");
L
Linus Torvalds 已提交
746

L
Len Brown 已提交
747
	if (acpi_table_parse_madt
748
	    (ACPI_MADT_TYPE_INTERRUPT_OVERRIDE, acpi_parse_int_src_ovr, 0) < 0)
L
Len Brown 已提交
749 750
		printk(KERN_ERR PREFIX
		       "Error parsing interrupt source overrides entry\n");
L
Linus Torvalds 已提交
751

752
	if (acpi_table_parse_madt(ACPI_MADT_TYPE_NMI_SOURCE, acpi_parse_nmi_src, 0) < 0)
L
Linus Torvalds 已提交
753
		printk(KERN_ERR PREFIX "Error parsing NMI SRC entry\n");
L
Len Brown 已提交
754
      skip_madt:
L
Linus Torvalds 已提交
755 756 757 758 759 760 761

	/*
	 * FADT says whether a legacy keyboard controller is present.
	 * The FADT also contains an SCI_INT line, by which the system
	 * gets interrupts such as power and sleep buttons.  If it's not
	 * on a Legacy interrupt, it needs to be setup.
	 */
762
	if (acpi_table_parse(ACPI_SIG_FADT, acpi_parse_fadt))
L
Linus Torvalds 已提交
763 764
		printk(KERN_ERR PREFIX "Can't find FADT\n");

T
Tejun Heo 已提交
765
#ifdef CONFIG_ACPI_NUMA
L
Linus Torvalds 已提交
766 767 768 769
#ifdef CONFIG_SMP
	if (srat_num_cpus == 0) {
		int cpu, i = 1;
		for (cpu = 0; cpu < smp_boot_data.cpu_count; cpu++)
L
Len Brown 已提交
770 771 772 773
			if (smp_boot_data.cpu_phys_id[cpu] !=
			    hard_smp_processor_id())
				node_cpuid[i++].phys_id =
				    smp_boot_data.cpu_phys_id[cpu];
L
Linus Torvalds 已提交
774
	}
T
Tony Luck 已提交
775 776
#endif
	build_cpu_to_node_map();
L
Linus Torvalds 已提交
777 778 779 780
#endif
	return 0;
}

L
Len Brown 已提交
781
/*
 * Translate @gsi into an IRQ number stored through @irq.
 *
 * GSIs below 16 go through isa_irq_to_vector() when an 8259 is present;
 * all others use gsi_to_irq().  Returns 0 on success and -1 (leaving
 * *@irq untouched) when gsi_to_irq() reports -1.
 */
int acpi_gsi_to_irq(u32 gsi, unsigned int *irq)
{
	int mapped;

	if (has_8259 && gsi < 16) {
		*irq = isa_irq_to_vector(gsi);
		return 0;
	}

	mapped = gsi_to_irq(gsi);
	if (mapped == -1)
		return -1;

	*irq = mapped;
	return 0;
}

796 797 798 799 800 801 802 803
/*
 * Map an ISA IRQ (0..15) to its GSI, which is the same number.
 * Returns 0 on success, or -1 without touching *@gsi for any other IRQ.
 */
int acpi_isa_irq_to_gsi(unsigned isa_irq, u32 *gsi)
{
	if (isa_irq < 16) {
		*gsi = isa_irq;
		return 0;
	}

	return -1;
}

L
Linus Torvalds 已提交
804 805 806 807
/*
 *  ACPI based hotplug CPU support
 */
#ifdef CONFIG_ACPI_HOTPLUG_CPU
808
static __cpuinit
809
int acpi_map_cpu2node(acpi_handle handle, int cpu, int physid)
L
Linus Torvalds 已提交
810 811
{
#ifdef CONFIG_ACPI_NUMA
L
Len Brown 已提交
812
	int pxm_id;
813
	int nid;
L
Linus Torvalds 已提交
814 815 816

	pxm_id = acpi_get_pxm(handle);
	/*
817 818 819 820 821
	 * We don't have cpu-only-node hotadd. But if the system equips
	 * SRAT table, pxm is already found and node is ready.
  	 * So, just pxm_to_nid(pxm) is OK.
	 * This code here is for the system which doesn't have full SRAT
  	 * table for possible cpus.
L
Linus Torvalds 已提交
822
	 */
823
	nid = acpi_map_pxm_to_node(pxm_id);
L
Len Brown 已提交
824
	node_cpuid[cpu].phys_id = physid;
825
	node_cpuid[cpu].nid = nid;
L
Linus Torvalds 已提交
826
#endif
L
Len Brown 已提交
827
	return (0);
L
Linus Torvalds 已提交
828 829
}

830 831 832 833 834 835 836 837 838 839 840 841 842
/* Number of extra hotplug CPUs to allow; -1 means "not given, derive it". */
int additional_cpus __initdata = -1;

/*
 * Parse the "additional_cpus=" early parameter.  A missing value leaves
 * the default in place.  Always returns 0.
 */
static __init int setup_additional_cpus(char *s)
{
	if (!s)
		return 0;

	additional_cpus = simple_strtol(s, NULL, 0);
	return 0;
}

early_param("additional_cpus", setup_additional_cpus);

/*
 * cpu_possible_map should be static, it cannot change as CPUs
 * are onlined, or offlined. The reason is per-cpu data-structures
 * are allocated by some modules at init time, and don't expect to
 * do this dynamically on cpu arrival/departure.
 * cpu_present_map on the other hand can change dynamically.
 * In case when cpu_hotplug is not compiled, then we resort to current
 * behaviour, which is cpu_possible == cpu_present.
 * - Ashok Raj
 *
 * Three ways to find out the number of additional hotplug CPUs:
 * - If the BIOS specified disabled CPUs in ACPI/mptables use that.
 * - The user can override it with additional_cpus=NUM
 * - Otherwise don't reserve additional CPUs.
 */
__init void prefill_possible_map(void)
{
	int i;
	int possible, disabled_cpus;

	disabled_cpus = total_cpus - available_cpus;
863

864
 	if (additional_cpus == -1) {
865
 		if (disabled_cpus > 0)
866
			additional_cpus = disabled_cpus;
867
 		else
868
			additional_cpus = 0;
869 870 871 872
 	}

	possible = available_cpus + additional_cpus;

873 874
	if (possible > nr_cpu_ids)
		possible = nr_cpu_ids;
875 876

	printk(KERN_INFO "SMP: Allowing %d CPUs, %d hotplug CPUs\n",
877
		possible, max((possible - available_cpus), 0));
878 879

	for (i = 0; i < possible; i++)
880
		set_cpu_possible(i, true);
881 882
}

883
/*
 * Bring a hot-added CPU described by @handle into the present map.
 *
 * Evaluates the object's _MAT method, which must return a buffer holding
 * an enabled local SAPIC entry.  The first CPU number that is not yet
 * present is then assigned to it: its node_cpuid[] slot and SAPIC id are
 * filled in, it is marked present, and its number is stored in *@pcpu.
 *
 * Returns 0 on success, or -EINVAL when _MAT fails, returns unusable
 * data, or no CPU number is free.
 */
static int __cpuinit _acpi_map_lsapic(acpi_handle handle, int *pcpu)
{
	struct acpi_buffer buffer = { ACPI_ALLOCATE_BUFFER, NULL };
	union acpi_object *obj;
	struct acpi_madt_local_sapic *lsapic;
	cpumask_t not_present;
	int cpu, physid;

	if (ACPI_FAILURE(acpi_evaluate_object(handle, "_MAT", NULL, &buffer)))
		return -EINVAL;

	if (!buffer.length || !buffer.pointer)
		return -EINVAL;

	obj = buffer.pointer;
	if (obj->type != ACPI_TYPE_BUFFER)
		goto bad_mat;

	lsapic = (struct acpi_madt_local_sapic *)obj->buffer.pointer;
	if (lsapic->header.type != ACPI_MADT_TYPE_LOCAL_SAPIC)
		goto bad_mat;
	if (!(lsapic->lapic_flags & ACPI_MADT_ENABLED))
		goto bad_mat;

	physid = ((lsapic->id << 8) | (lsapic->eid));

	/* Everything needed has been copied out of the _MAT result. */
	kfree(buffer.pointer);
	buffer.length = ACPI_ALLOCATE_BUFFER;
	buffer.pointer = NULL;

	/* Pick the lowest CPU number that is not present yet. */
	cpumask_complement(&not_present, cpu_present_mask);
	cpu = cpumask_first(&not_present);
	if (cpu >= nr_cpu_ids)
		return -EINVAL;

	acpi_map_cpu2node(handle, cpu, physid);

	cpu_set(cpu, cpu_present_map);
	ia64_cpu_to_sapicid[cpu] = physid;

	acpi_processor_set_pdc(handle);

	*pcpu = cpu;
	return 0;

bad_mat:
	kfree(buffer.pointer);
	return -EINVAL;
}

934 935 936 937 938
/*
 * Exported entry point for _acpi_map_lsapic().  The extra __ref wrapper
 * only exists to silence a section mismatch warning.
 */
int __ref acpi_map_lsapic(acpi_handle handle, int *pcpu)
{
	int rc = _acpi_map_lsapic(handle, pcpu);

	return rc;
}
EXPORT_SYMBOL(acpi_map_lsapic);
L
Linus Torvalds 已提交
940

L
Len Brown 已提交
941
int acpi_unmap_lsapic(int cpu)
L
Linus Torvalds 已提交
942 943
{
	ia64_cpu_to_sapicid[cpu] = -1;
L
Len Brown 已提交
944
	cpu_clear(cpu, cpu_present_map);
L
Linus Torvalds 已提交
945 946 947 948 949

#ifdef CONFIG_ACPI_NUMA
	/* NUMA specific cleanup's */
#endif

L
Len Brown 已提交
950
	return (0);
L
Linus Torvalds 已提交
951
}
L
Len Brown 已提交
952

L
Linus Torvalds 已提交
953
EXPORT_SYMBOL(acpi_unmap_lsapic);
L
Len Brown 已提交
954
#endif				/* CONFIG_ACPI_HOTPLUG_CPU */
L
Linus Torvalds 已提交
955 956

#ifdef CONFIG_ACPI_NUMA
957
static acpi_status __devinit
L
Len Brown 已提交
958
acpi_map_iosapic(acpi_handle handle, u32 depth, void *context, void **ret)
L
Linus Torvalds 已提交
959
{
L
Len Brown 已提交
960
	struct acpi_buffer buffer = { ACPI_ALLOCATE_BUFFER, NULL };
L
Linus Torvalds 已提交
961
	union acpi_object *obj;
962
	struct acpi_madt_io_sapic *iosapic;
L
Linus Torvalds 已提交
963
	unsigned int gsi_base;
A
Alex Williamson 已提交
964
	int pxm, node;
L
Linus Torvalds 已提交
965 966 967 968 969 970 971 972 973 974 975

	/* Only care about objects w/ a method that returns the MADT */
	if (ACPI_FAILURE(acpi_evaluate_object(handle, "_MAT", NULL, &buffer)))
		return AE_OK;

	if (!buffer.length || !buffer.pointer)
		return AE_OK;

	obj = buffer.pointer;
	if (obj->type != ACPI_TYPE_BUFFER ||
	    obj->buffer.length < sizeof(*iosapic)) {
976
		kfree(buffer.pointer);
L
Linus Torvalds 已提交
977 978 979
		return AE_OK;
	}

980
	iosapic = (struct acpi_madt_io_sapic *)obj->buffer.pointer;
L
Linus Torvalds 已提交
981

982
	if (iosapic->header.type != ACPI_MADT_TYPE_IO_SAPIC) {
983
		kfree(buffer.pointer);
L
Linus Torvalds 已提交
984 985 986 987 988
		return AE_OK;
	}

	gsi_base = iosapic->global_irq_base;

989
	kfree(buffer.pointer);
L
Linus Torvalds 已提交
990 991

	/*
A
Alex Williamson 已提交
992
	 * OK, it's an IOSAPIC MADT entry, look for a _PXM value to tell
L
Linus Torvalds 已提交
993 994
	 * us which node to associate this with.
	 */
A
Alex Williamson 已提交
995 996
	pxm = acpi_get_pxm(handle);
	if (pxm < 0)
L
Linus Torvalds 已提交
997 998
		return AE_OK;

999
	node = pxm_to_node(pxm);
L
Linus Torvalds 已提交
1000 1001

	if (node >= MAX_NUMNODES || !node_online(node) ||
1002
	    cpumask_empty(cpumask_of_node(node)))
L
Linus Torvalds 已提交
1003 1004 1005 1006 1007 1008
		return AE_OK;

	/* We know a gsi to node mapping! */
	map_iosapic_to_node(gsi_base, node);
	return AE_OK;
}
1009 1010 1011 1012 1013 1014 1015 1016 1017 1018

/*
 * Initcall that runs acpi_map_iosapic() on the devices found by
 * acpi_get_devices().  The result of the walk is ignored; always
 * returns 0.
 */
static int __init
acpi_map_iosapics (void)
{
	acpi_get_devices(NULL, acpi_map_iosapic, NULL, NULL);
	return 0;
}

fs_initcall(acpi_map_iosapics);
#endif				/* CONFIG_ACPI_NUMA */
1019

1020
/*
 * Register an IOSAPIC at @phys_addr with GSI base @gsi_base and, with
 * CONFIG_ACPI_NUMA, try to associate it with a node.
 *
 * Returns the error from iosapic_init() when that fails, 0 otherwise.
 */
int __ref acpi_register_ioapic(acpi_handle handle, u64 phys_addr, u32 gsi_base)
{
	int err = iosapic_init(phys_addr, gsi_base);

	if (err)
		return err;

#ifdef CONFIG_ACPI_NUMA
	acpi_map_iosapic(handle, 0, NULL, NULL);
#endif				/* CONFIG_ACPI_NUMA */

	return 0;
}

EXPORT_SYMBOL(acpi_register_ioapic);

L
Len Brown 已提交
1036
/*
 * Remove the IOSAPIC with GSI base @gsi_base and return the result of
 * iosapic_remove().  @handle is not used.
 */
int acpi_unregister_ioapic(acpi_handle handle, u32 gsi_base)
{
	int rc = iosapic_remove(gsi_base);

	return rc;
}

EXPORT_SYMBOL(acpi_unregister_ioapic);

1043
/*
 * acpi_suspend_lowlevel() - save kernel state and suspend.
 *
 * Placeholder that does nothing and returns 0.
 * TBD when IA64 starts to support suspend...
 */
int acpi_suspend_lowlevel(void)
{
	return 0;
}