acpi.c 25.7 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 *  acpi.c - Architecture-Specific Low-Level ACPI Support
 *
 *  Copyright (C) 1999 VA Linux Systems
 *  Copyright (C) 1999,2000 Walt Drummond <drummond@valinux.com>
 *  Copyright (C) 2000, 2002-2003 Hewlett-Packard Co.
 *	David Mosberger-Tang <davidm@hpl.hp.com>
 *  Copyright (C) 2000 Intel Corp.
 *  Copyright (C) 2000,2001 J.I. Lee <jung-ik.lee@intel.com>
 *  Copyright (C) 2001 Paul Diefenbaugh <paul.s.diefenbaugh@intel.com>
 *  Copyright (C) 2001 Jenna Hall <jenna.s.hall@intel.com>
 *  Copyright (C) 2001 Takayoshi Kochi <t-kochi@bq.jp.nec.com>
 *  Copyright (C) 2002 Erich Focht <efocht@ess.nec.de>
14
 *  Copyright (C) 2004 Ashok Raj <ashok.raj@intel.com>
L
Linus Torvalds 已提交
15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46
 *
 * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; either version 2 of the License, or
 *  (at your option) any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, write to the Free Software
 *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 *
 * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 */

#include <linux/module.h>
#include <linux/init.h>
#include <linux/kernel.h>
#include <linux/sched.h>
#include <linux/smp.h>
#include <linux/string.h>
#include <linux/types.h>
#include <linux/irq.h>
#include <linux/acpi.h>
#include <linux/efi.h>
#include <linux/mmzone.h>
#include <linux/nodemask.h>
47
#include <linux/slab.h>
48
#include <acpi/processor.h>
L
Linus Torvalds 已提交
49 50 51 52 53 54 55
#include <asm/io.h>
#include <asm/iosapic.h>
#include <asm/machvec.h>
#include <asm/page.h>
#include <asm/numa.h>
#include <asm/sal.h>
#include <asm/cyclone.h>
56
#include <asm/xen/hypervisor.h>
L
Linus Torvalds 已提交
57 58 59

/*
 * BAD_MADT_ENTRY - sanity-check one MADT subtable before it is used.
 * @entry: typed pointer to the subtable being parsed
 * @end:   address (as unsigned long) one past the end of the table
 *
 * Evaluates to non-zero when @entry is NULL, when a complete *@entry would
 * extend past @end, or when the length stored in the subtable header is
 * smaller than the structure the caller expects.
 *
 * Both arguments are fully parenthesized so that expressions can be passed
 * safely.  @entry is still evaluated more than once, so it must not have
 * side effects.
 */
#define BAD_MADT_ENTRY(entry, end) (					    \
		(!(entry)) ||						    \
		(unsigned long)(entry) + sizeof(*(entry)) > (end) ||	    \
		((struct acpi_subtable_header *)(entry))->length <	    \
			sizeof(*(entry)))
L
Linus Torvalds 已提交
61 62 63

#define PREFIX			"ACPI: "

64
u32 acpi_rsdt_forced;
65 66 67
unsigned int acpi_cpei_override;
unsigned int acpi_cpei_phys_cpuid;

68 69
unsigned long acpi_wakeup_address = 0;

70 71 72 73 74 75 76 77 78 79 80 81 82
#ifdef CONFIG_IA64_GENERIC
/*
 * Return the physical address of the ACPI 2.0 RSDP as published by EFI,
 * or 0 when none is available.  If only the legacy (v1.0) table pointer is
 * present a warning is logged and 0 is returned.
 */
static unsigned long __init acpi_find_rsdp(void)
{
	if (efi.acpi20 != EFI_INVALID_TABLE_ADDR)
		return efi.acpi20;

	if (efi.acpi != EFI_INVALID_TABLE_ADDR)
		printk(KERN_WARNING PREFIX
		       "v1.0/r0.71 tables no longer supported\n");

	return 0;
}

83 84
/*
 * Pick the machine-vector name for this platform from the ACPI tables.
 *
 * The RSDP and XSDT signatures are validated first; any failure falls back
 * to "dig".  Otherwise the XSDT OEM id selects "hpzx1", "uv"/"sn2" or
 * "xen", and (with CONFIG_INTEL_IOMMU) the presence of a DMAR table selects
 * "dig_vtd".  Everything else is "dig".
 */
const char __init *
acpi_get_sysname(void)
{
	struct acpi_table_header *xsdt_hdr;
	struct acpi_table_xsdt *xsdt;
	struct acpi_table_rsdp *rsdp;
	unsigned long rsdp_pa;
#ifdef CONFIG_INTEL_IOMMU
	struct acpi_table_header *entry;
	u64 idx, count;
#endif

	rsdp_pa = acpi_find_rsdp();
	if (rsdp_pa == 0) {
		printk(KERN_ERR
		       "ACPI 2.0 RSDP not found, default to \"dig\"\n");
		return "dig";
	}

	rsdp = (struct acpi_table_rsdp *)__va(rsdp_pa);
	if (strncmp(rsdp->signature, ACPI_SIG_RSDP,
		    sizeof(ACPI_SIG_RSDP) - 1) != 0) {
		printk(KERN_ERR
		       "ACPI 2.0 RSDP signature incorrect, default to \"dig\"\n");
		return "dig";
	}

	xsdt = (struct acpi_table_xsdt *)__va(rsdp->xsdt_physical_address);
	xsdt_hdr = &xsdt->header;
	if (strncmp(xsdt_hdr->signature, ACPI_SIG_XSDT,
		    sizeof(ACPI_SIG_XSDT) - 1) != 0) {
		printk(KERN_ERR
		       "ACPI 2.0 XSDT signature incorrect, default to \"dig\"\n");
		return "dig";
	}

	/* Vendor-specific machine vectors, keyed on the XSDT OEM id. */
	if (strcmp(xsdt_hdr->oem_id, "HP") == 0)
		return "hpzx1";

	if (strcmp(xsdt_hdr->oem_id, "SGI") == 0) {
		if (strcmp(xsdt_hdr->oem_table_id + 4, "UV") == 0)
			return "uv";
		return "sn2";
	}

	if (xen_pv_domain() && strcmp(xsdt_hdr->oem_id, "XEN") == 0)
		return "xen";

#ifdef CONFIG_INTEL_IOMMU
	/* Look for Intel IOMMU: scan every table the XSDT points at. */
	count = (xsdt_hdr->length - sizeof(*xsdt_hdr)) /
			sizeof(xsdt->table_offset_entry[0]);
	for (idx = 0; idx < count; idx++) {
		entry = __va(xsdt->table_offset_entry[idx]);
		if (strncmp(entry->signature, ACPI_SIG_DMAR,
			    sizeof(ACPI_SIG_DMAR) - 1) == 0)
			return "dig_vtd";
	}
#endif

	return "dig";
}
141
#endif /* CONFIG_IA64_GENERIC */
L
Linus Torvalds 已提交
142 143 144 145 146 147 148 149 150 151 152 153 154 155

#define ACPI_MAX_PLATFORM_INTERRUPTS	256

/* Array to record platform interrupt vectors for generic interrupt routing. */
int platform_intr_list[ACPI_MAX_PLATFORM_INTERRUPTS] = {
	[0 ... ACPI_MAX_PLATFORM_INTERRUPTS - 1] = -1
};

enum acpi_irq_model_id acpi_irq_model = ACPI_IRQ_MODEL_IOSAPIC;

/*
 * Interrupt routing API for device drivers.  Provides interrupt vector for
 * a generic platform event.  Currently only CPEI is implemented.
 */
L
Len Brown 已提交
156
/*
 * Look up the vector recorded for platform interrupt type @int_type.
 * Returns the entry from platform_intr_list[], or -1 (after logging an
 * error) when @int_type is outside the table.
 */
int acpi_request_vector(u32 int_type)
{
	if (int_type >= ACPI_MAX_PLATFORM_INTERRUPTS) {
		printk(KERN_ERR
		       "acpi_request_vector(): invalid interrupt type\n");
		return -1;
	}

	/* corrected platform error interrupt */
	return platform_intr_list[int_type];
}

169
/*
 * Map an ACPI table for early access.  The physical address is translated
 * with __va(); @size is not used.
 */
char *__init __acpi_map_table(unsigned long phys_addr, unsigned long size)
{
	char *virt = __va(phys_addr);

	return virt;
}

Y
Yinghai Lu 已提交
174
/* Counterpart of __acpi_map_table(); intentionally does nothing here. */
void __init __acpi_unmap_table(char *map, unsigned long size)
{
	/* nothing to undo */
}

L
Linus Torvalds 已提交
178 179 180 181
/* --------------------------------------------------------------------------
                            Boot-time Table Parsing
   -------------------------------------------------------------------------- */

L
Len Brown 已提交
182 183 184
static int available_cpus __initdata;
struct acpi_table_madt *acpi_madt __initdata;
static u8 has_8259;
L
Linus Torvalds 已提交
185 186

static int __init
187
acpi_parse_lapic_addr_ovr(struct acpi_subtable_header * header,
L
Len Brown 已提交
188
			  const unsigned long end)
L
Linus Torvalds 已提交
189
{
190
	struct acpi_madt_local_apic_override *lapic;
L
Linus Torvalds 已提交
191

192
	lapic = (struct acpi_madt_local_apic_override *)header;
L
Linus Torvalds 已提交
193 194 195 196 197 198 199 200 201 202 203 204

	if (BAD_MADT_ENTRY(lapic, end))
		return -EINVAL;

	if (lapic->address) {
		iounmap(ipi_base_addr);
		ipi_base_addr = ioremap(lapic->address, 0);
	}
	return 0;
}

static int __init
205
acpi_parse_lsapic(struct acpi_subtable_header * header, const unsigned long end)
L
Linus Torvalds 已提交
206
{
207
	struct acpi_madt_local_sapic *lsapic;
L
Linus Torvalds 已提交
208

209
	lsapic = (struct acpi_madt_local_sapic *)header;
L
Linus Torvalds 已提交
210

211
	/*Skip BAD_MADT_ENTRY check, as lsapic size could vary */
L
Linus Torvalds 已提交
212

213
	if (lsapic->lapic_flags & ACPI_MADT_ENABLED) {
L
Linus Torvalds 已提交
214
#ifdef CONFIG_SMP
L
Len Brown 已提交
215 216
		smp_boot_data.cpu_phys_id[available_cpus] =
		    (lsapic->id << 8) | lsapic->eid;
L
Linus Torvalds 已提交
217 218 219 220 221 222 223 224 225
#endif
		++available_cpus;
	}

	total_cpus++;
	return 0;
}

static int __init
226
acpi_parse_lapic_nmi(struct acpi_subtable_header * header, const unsigned long end)
L
Linus Torvalds 已提交
227
{
228
	struct acpi_madt_local_apic_nmi *lacpi_nmi;
L
Linus Torvalds 已提交
229

230
	lacpi_nmi = (struct acpi_madt_local_apic_nmi *)header;
L
Linus Torvalds 已提交
231 232 233 234 235 236 237 238 239

	if (BAD_MADT_ENTRY(lacpi_nmi, end))
		return -EINVAL;

	/* TBD: Support lapic_nmi entries */
	return 0;
}

static int __init
240
acpi_parse_iosapic(struct acpi_subtable_header * header, const unsigned long end)
L
Linus Torvalds 已提交
241
{
242
	struct acpi_madt_io_sapic *iosapic;
L
Linus Torvalds 已提交
243

244
	iosapic = (struct acpi_madt_io_sapic *)header;
L
Linus Torvalds 已提交
245 246 247 248

	if (BAD_MADT_ENTRY(iosapic, end))
		return -EINVAL;

249
	return iosapic_init(iosapic->address, iosapic->global_irq_base);
L
Linus Torvalds 已提交
250 251
}

L
Len Brown 已提交
252 253
static unsigned int __initdata acpi_madt_rev;

L
Linus Torvalds 已提交
254
static int __init
255
acpi_parse_plat_int_src(struct acpi_subtable_header * header,
L
Len Brown 已提交
256
			const unsigned long end)
L
Linus Torvalds 已提交
257
{
258
	struct acpi_madt_interrupt_source *plintsrc;
L
Linus Torvalds 已提交
259 260
	int vector;

261
	plintsrc = (struct acpi_madt_interrupt_source *)header;
L
Linus Torvalds 已提交
262 263 264 265 266 267 268 269 270 271

	if (BAD_MADT_ENTRY(plintsrc, end))
		return -EINVAL;

	/*
	 * Get vector assignment for this interrupt, set attributes,
	 * and program the IOSAPIC routing table.
	 */
	vector = iosapic_register_platform_intr(plintsrc->type,
						plintsrc->global_irq,
272
						plintsrc->io_sapic_vector,
L
Linus Torvalds 已提交
273 274
						plintsrc->eid,
						plintsrc->id,
275 276 277 278 279 280
						((plintsrc->inti_flags & ACPI_MADT_POLARITY_MASK) ==
						 ACPI_MADT_POLARITY_ACTIVE_HIGH) ?
						IOSAPIC_POL_HIGH : IOSAPIC_POL_LOW,
						((plintsrc->inti_flags & ACPI_MADT_TRIGGER_MASK) ==
						 ACPI_MADT_TRIGGER_EDGE) ?
						IOSAPIC_EDGE : IOSAPIC_LEVEL);
L
Linus Torvalds 已提交
281 282

	platform_intr_list[plintsrc->type] = vector;
283
	if (acpi_madt_rev > 1) {
284
		acpi_cpei_override = plintsrc->flags & ACPI_MADT_CPEI_OVERRIDE;
285 286 287 288 289 290 291
	}

	/*
	 * Save the physical id, so we can check when its being removed
	 */
	acpi_cpei_phys_cpuid = ((plintsrc->id << 8) | (plintsrc->eid)) & 0xffff;

L
Linus Torvalds 已提交
292 293 294
	return 0;
}

295
#ifdef CONFIG_HOTPLUG_CPU
296 297 298
unsigned int can_cpei_retarget(void)
{
	extern int cpe_vector;
A
Ashok Raj 已提交
299
	extern unsigned int force_cpei_retarget;
300 301 302 303 304 305

	/*
	 * Only if CPEI is supported and the override flag
	 * is present, otherwise return that its re-targettable
	 * if we are in polling mode.
	 */
A
Ashok Raj 已提交
306 307 308 309 310 311 312
	if (cpe_vector > 0) {
		if (acpi_cpei_override || force_cpei_retarget)
			return 1;
		else
			return 0;
	}
	return 1;
313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330
}

/*
 * Return 1 if logical CPU @cpu is the one whose physical id is stored in
 * acpi_cpei_phys_cpuid, 0 otherwise.
 */
unsigned int is_cpu_cpei_target(unsigned int cpu)
{
	unsigned int target = cpu_logical_id(acpi_cpei_phys_cpuid);

	return (target == cpu) ? 1 : 0;
}

/* Record the physical id of logical CPU @cpu as the CPEI target. */
void set_cpei_target_cpu(unsigned int cpu)
{
	unsigned int phys_id = cpu_physical_id(cpu);

	acpi_cpei_phys_cpuid = phys_id;
}
331
#endif
332 333 334 335 336 337

/* Return the physical CPU id currently recorded as the CPEI target. */
unsigned int get_cpei_target_cpu(void)
{
	unsigned int phys_id = acpi_cpei_phys_cpuid;

	return phys_id;
}

L
Linus Torvalds 已提交
338
static int __init
339
acpi_parse_int_src_ovr(struct acpi_subtable_header * header,
L
Len Brown 已提交
340
		       const unsigned long end)
L
Linus Torvalds 已提交
341
{
342
	struct acpi_madt_interrupt_override *p;
L
Linus Torvalds 已提交
343

344
	p = (struct acpi_madt_interrupt_override *)header;
L
Linus Torvalds 已提交
345 346 347 348

	if (BAD_MADT_ENTRY(p, end))
		return -EINVAL;

349 350
	iosapic_override_isa_irq(p->source_irq, p->global_irq,
				 ((p->inti_flags & ACPI_MADT_POLARITY_MASK) ==
351 352
				  ACPI_MADT_POLARITY_ACTIVE_LOW) ?
				 IOSAPIC_POL_LOW : IOSAPIC_POL_HIGH,
353
				 ((p->inti_flags & ACPI_MADT_TRIGGER_MASK) ==
354 355
				 ACPI_MADT_TRIGGER_LEVEL) ?
				 IOSAPIC_LEVEL : IOSAPIC_EDGE);
L
Linus Torvalds 已提交
356 357 358 359
	return 0;
}

static int __init
360
acpi_parse_nmi_src(struct acpi_subtable_header * header, const unsigned long end)
L
Linus Torvalds 已提交
361
{
362
	struct acpi_madt_nmi_source *nmi_src;
L
Linus Torvalds 已提交
363

364
	nmi_src = (struct acpi_madt_nmi_source *)header;
L
Linus Torvalds 已提交
365 366 367 368 369 370 371 372

	if (BAD_MADT_ENTRY(nmi_src, end))
		return -EINVAL;

	/* TBD: Support nimsrc entries */
	return 0;
}

L
Len Brown 已提交
373
/*
 * Apply OEM-specific quirks based on the MADT OEM id / OEM table id.
 * Currently only the IBM "SERMOW" platform is handled.
 */
static void __init acpi_madt_oem_check(char *oem_id, char *oem_table_id)
{
	if (strncmp(oem_id, "IBM", 3) != 0 ||
	    strncmp(oem_table_id, "SERMOW", 6) != 0)
		return;

	/*
	 * Unfortunately ITC_DRIFT is not yet part of the
	 * official SAL spec, so the ITC_DRIFT bit is not
	 * set by the BIOS on this hardware.
	 */
	sal_platform_features |= IA64_SAL_PLATFORM_FEATURE_ITC_DRIFT;

	cyclone_setup();
}

388
/*
 * Table handler for the MADT itself.  Caches the table pointer and its
 * revision, determines has_8259, initializes the IOSAPIC layer, maps the
 * IPI message block if the table supplies an address, and runs the OEM
 * quirk check.
 *
 * Returns 0 on success, -EINVAL if @table is NULL.
 */
static int __init acpi_parse_madt(struct acpi_table_header *table)
{
	if (table == NULL)
		return -EINVAL;

	acpi_madt = (struct acpi_table_madt *)table;
	acpi_madt_rev = acpi_madt->header.revision;

	/* remember the value for reference after free_initmem() */
#ifndef CONFIG_ITANIUM
	has_8259 = acpi_madt->flags & ACPI_MADT_PCAT_COMPAT;
#else
	has_8259 = 1;		/* Firmware on old Itanium systems is broken */
#endif
	iosapic_system_init(has_8259);

	/* Get base address of IPI Message Block */
	if (acpi_madt->address)
		ipi_base_addr = ioremap(acpi_madt->address, 0);

	printk(KERN_INFO PREFIX "Local APIC address %p\n", ipi_base_addr);

	acpi_madt_oem_check(acpi_madt->header.oem_id,
			    acpi_madt->header.oem_table_id);

	return 0;
}

#ifdef CONFIG_ACPI_NUMA

#undef SLIT_DEBUG

#define PXM_FLAG_LEN ((MAX_PXM_DOMAINS + 1)/32)

L
Len Brown 已提交
424
static int __initdata srat_num_cpus;	/* number of cpus */
425
static u32 pxm_flag[PXM_FLAG_LEN];
L
Linus Torvalds 已提交
426 427 428
#define pxm_bit_set(bit)	(set_bit(bit,(void *)pxm_flag))
#define pxm_bit_test(bit)	(test_bit(bit,(void *)pxm_flag))
static struct acpi_table_slit __initdata *slit_table;
429
cpumask_t early_cpu_possible_map = CPU_MASK_NONE;
L
Linus Torvalds 已提交
430

431 432
/*
 * Extract the proximity domain of an SRAT CPU affinity entry.  The low
 * byte is always used; the first high byte is added on "sn2" platforms or
 * when the SRAT revision is 2 or later.
 */
static int __init
get_processor_proximity_domain(struct acpi_srat_cpu_affinity *pa)
{
	int domain = pa->proximity_domain_lo;

	if (ia64_platform_is("sn2") || acpi_srat_revision >= 2)
		domain += pa->proximity_domain_hi[0] << 8;

	return domain;
}

442 443
/*
 * Extract the proximity domain of an SRAT memory affinity entry.  The full
 * value is used on "sn2" platforms or when the SRAT revision is above 1;
 * otherwise only the low 8 bits are kept.
 */
static int __init
get_memory_proximity_domain(struct acpi_srat_mem_affinity *ma)
{
	int domain = ma->proximity_domain;

	if (ia64_platform_is("sn2") || acpi_srat_revision > 1)
		return domain;

	return domain & 0xff;
}

L
Linus Torvalds 已提交
454 455 456 457
/*
 * ACPI 2.0 SLIT (System Locality Information Table)
 * http://devresource.hp.com/devresource/Docs/TechPapers/IA64/slit.pdf
 */
L
Len Brown 已提交
458
/*
 * Validate a SLIT and remember it in slit_table for acpi_numa_arch_fixup().
 *
 * The table is accepted only when its header length equals the table
 * header, the 8-byte locality count and a locality_count x locality_count
 * byte matrix.  On mismatch an error is logged and slit_table is left
 * untouched.
 *
 * The expected size is computed in 64 bits: doing it in 32 bits would let
 * a bogus locality count whose square wraps pass the length check.
 */
void __init acpi_numa_slit_init(struct acpi_table_slit *slit)
{
	u64 localities = slit->locality_count;
	u64 expected = sizeof(struct acpi_table_header) + 8
		       + localities * localities;

	/*
	 * header.length is only 32 bits wide, so a count of 2^16 or more can
	 * never describe a consistent table; rejecting it up front also means
	 * the product above is never trusted after wrapping 64 bits.
	 */
	if (localities > 0xffff || slit->header.length != expected) {
		printk(KERN_ERR
		       "ACPI 2.0 SLIT: size mismatch: %llu expected, %u actual\n",
		       (unsigned long long)expected, slit->header.length);
		return;
	}
	slit_table = slit;
}

void __init
474
acpi_numa_processor_affinity_init(struct acpi_srat_cpu_affinity *pa)
L
Linus Torvalds 已提交
475
{
476 477
	int pxm;

478
	if (!(pa->flags & ACPI_SRAT_CPU_ENABLED))
479 480
		return;

481 482
	if (srat_num_cpus >= ARRAY_SIZE(node_cpuid)) {
		printk_once(KERN_WARNING
483
			    "node_cpuid[%ld] is too small, may not be able to use all cpus\n",
484 485 486
			    ARRAY_SIZE(node_cpuid));
		return;
	}
487 488
	pxm = get_processor_proximity_domain(pa);

L
Linus Torvalds 已提交
489
	/* record this node in proximity bitmap */
490
	pxm_bit_set(pxm);
L
Linus Torvalds 已提交
491

L
Len Brown 已提交
492
	node_cpuid[srat_num_cpus].phys_id =
493
	    (pa->apic_id << 8) | (pa->local_sapic_eid);
L
Linus Torvalds 已提交
494
	/* nid should be overridden as logical node id later */
495
	node_cpuid[srat_num_cpus].nid = pxm;
496
	cpu_set(srat_num_cpus, early_cpu_possible_map);
L
Linus Torvalds 已提交
497 498 499
	srat_num_cpus++;
}

500
int __init
501
acpi_numa_memory_affinity_init(struct acpi_srat_mem_affinity *ma)
L
Linus Torvalds 已提交
502 503
{
	unsigned long paddr, size;
504
	int pxm;
L
Linus Torvalds 已提交
505 506
	struct node_memblk_s *p, *q, *pend;

507
	pxm = get_memory_proximity_domain(ma);
L
Linus Torvalds 已提交
508 509

	/* fill node memory chunk structure */
510 511
	paddr = ma->base_address;
	size = ma->length;
L
Linus Torvalds 已提交
512 513

	/* Ignore disabled entries */
514
	if (!(ma->flags & ACPI_SRAT_MEM_ENABLED))
515
		return -1;
L
Linus Torvalds 已提交
516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533

	/* record this node in proximity bitmap */
	pxm_bit_set(pxm);

	/* Insertion sort based on base address */
	pend = &node_memblk[num_node_memblks];
	for (p = &node_memblk[0]; p < pend; p++) {
		if (paddr < p->start_paddr)
			break;
	}
	if (p < pend) {
		for (q = pend - 1; q >= p; q--)
			*(q + 1) = *q;
	}
	p->start_paddr = paddr;
	p->size = size;
	p->nid = pxm;
	num_node_memblks++;
534
	return 0;
L
Linus Torvalds 已提交
535 536
}

L
Len Brown 已提交
537
/*
 * Finish NUMA setup once the SRAT/SLIT have been parsed.
 *
 * Without any SRAT CPU entries, node 0 is brought online and the boot
 * CPU's physical id is stored in node_cpuid[0].  Otherwise every proximity
 * domain seen is mapped to a logical node and onlined, the proximity
 * domains stored in node_memblk[] and node_cpuid[] are replaced by node
 * ids, memory banks are numbered per node, and the node distance table is
 * filled from the SLIT (or with LOCAL/REMOTE defaults when no SLIT was
 * accepted).
 */
void __init acpi_numa_arch_fixup(void)
{
	int i, j, node_from, node_to;

	/* If there's no SRAT, fix the phys_id and mark node 0 online */
	if (srat_num_cpus == 0) {
		node_set_online(0);
		node_cpuid[0].phys_id = hard_smp_processor_id();
		return;
	}

	/*
	 * MCD - This can probably be dropped now.  No need for pxm ID to node ID
	 * mapping with sparse node numbering iff MAX_PXM_DOMAINS <= MAX_NUMNODES.
	 */
	nodes_clear(node_online_map);
	for (i = 0; i < MAX_PXM_DOMAINS; i++) {
		int nid;

		if (!pxm_bit_test(i))
			continue;

		nid = acpi_map_pxm_to_node(i);
		node_set_online(nid);
	}

	/* set logical node id in memory chunk structure */
	for (i = 0; i < num_node_memblks; i++)
		node_memblk[i].nid = pxm_to_node(node_memblk[i].nid);

	/* assign memory bank numbers for each chunk on each node */
	for_each_online_node(i) {
		int bank = 0;

		for (j = 0; j < num_node_memblks; j++) {
			if (node_memblk[j].nid != i)
				continue;
			node_memblk[j].bank = bank++;
		}
	}

	/* set logical node id in cpu structure */
	for_each_possible_early_cpu(i)
		node_cpuid[i].nid = pxm_to_node(node_cpuid[i].nid);

	printk(KERN_INFO "Number of logical nodes in system = %d\n",
	       num_online_nodes());
	printk(KERN_INFO "Number of memory chunks in system = %d\n",
	       num_node_memblks);

	/* No usable SLIT: fall back to a uniform local/remote distance table */
	if (!slit_table) {
		for (i = 0; i < MAX_NUMNODES; i++) {
			for (j = 0; j < MAX_NUMNODES; j++) {
				if (i == j)
					node_distance(i, j) = LOCAL_DISTANCE;
				else
					node_distance(i, j) = REMOTE_DISTANCE;
			}
		}
		return;
	}

	/* Copy SLIT distances for every pair of proximity domains in use */
	memset(numa_slit, -1, sizeof(numa_slit));
	for (i = 0; i < slit_table->locality_count; i++) {
		if (!pxm_bit_test(i))
			continue;
		node_from = pxm_to_node(i);

		for (j = 0; j < slit_table->locality_count; j++) {
			if (!pxm_bit_test(j))
				continue;
			node_to = pxm_to_node(j);

			node_distance(node_from, node_to) =
			    slit_table->entry[i * slit_table->locality_count + j];
		}
	}

#ifdef SLIT_DEBUG
	printk("ACPI 2.0 SLIT locality table:\n");
	for_each_online_node(i) {
		for_each_online_node(j)
		    printk("%03d ", node_distance(i, j));
		printk("\n");
	}
#endif
}
L
Len Brown 已提交
614
#endif				/* CONFIG_ACPI_NUMA */
L
Linus Torvalds 已提交
615

616 617 618 619
/*
 * success: return IRQ number (>=0)
 * failure: return < 0
 */
620
/*
 * Register a GSI and return the IRQ to use for it.
 *
 * In the PLATFORM irq model the GSI is returned unchanged.  Legacy GSIs
 * (below 16) on systems with an 8259 are translated with
 * isa_irq_to_vector().  Everything else is registered with the IOSAPIC
 * layer using the requested polarity and trigger mode.  @dev is not used.
 */
int acpi_register_gsi(struct device *dev, u32 gsi, int triggering, int polarity)
{
	int iosapic_pol, iosapic_trig;

	if (acpi_irq_model == ACPI_IRQ_MODEL_PLATFORM)
		return gsi;

	if (has_8259 && gsi < 16)
		return isa_irq_to_vector(gsi);

	if (polarity == ACPI_ACTIVE_HIGH)
		iosapic_pol = IOSAPIC_POL_HIGH;
	else
		iosapic_pol = IOSAPIC_POL_LOW;

	if (triggering == ACPI_EDGE_SENSITIVE)
		iosapic_trig = IOSAPIC_EDGE;
	else
		iosapic_trig = IOSAPIC_LEVEL;

	return iosapic_register_intr(gsi, iosapic_pol, iosapic_trig);
}
636
EXPORT_SYMBOL_GPL(acpi_register_gsi);
L
Len Brown 已提交
637 638

/*
 * Undo acpi_register_gsi().  Nothing is done in the PLATFORM irq model or
 * for legacy GSIs (below 16) on systems with an 8259; all other GSIs are
 * unregistered from the IOSAPIC layer.
 */
void acpi_unregister_gsi(u32 gsi)
{
	if (acpi_irq_model == ACPI_IRQ_MODEL_PLATFORM ||
	    (has_8259 && gsi < 16))
		return;

	iosapic_unregister_intr(gsi);
}
648
EXPORT_SYMBOL_GPL(acpi_unregister_gsi);
L
Len Brown 已提交
649

650
/*
 * Table handler for the FADT: registers the SCI interrupt as a
 * level-sensitive, active-low GSI.
 *
 * Returns 0 on success, -EINVAL if @table is NULL and -ENODEV when the
 * table revision is not 3.
 */
static int __init acpi_parse_fadt(struct acpi_table_header *table)
{
	struct acpi_table_fadt *fadt;

	if (table == NULL)
		return -EINVAL;

	if (table->revision != 3)
		return -ENODEV;	/* Only deal with ACPI 2.0 FADT */

	fadt = (struct acpi_table_fadt *)table;

	acpi_register_gsi(NULL, fadt->sci_interrupt, ACPI_LEVEL_SENSITIVE,
			  ACPI_ACTIVE_LOW);
	return 0;
}

669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687
/*
 * Early boot pass over the MADT: parse the table header and count the
 * Local SAPIC entries so that available_cpus / total_cpus are known.
 * On SMP builds a system that reports no usable CPU is treated as having
 * exactly one (the boot CPU).  Always returns 0.
 */
int __init early_acpi_boot_init(void)
{
	int nr_lsapic;

	/*
	 * do a partial walk of MADT to determine how many CPUs
	 * we have including offline CPUs
	 */
	if (acpi_table_parse(ACPI_SIG_MADT, acpi_parse_madt)) {
		printk(KERN_ERR PREFIX "Can't find MADT\n");
		return 0;
	}

	nr_lsapic = acpi_table_parse_madt(ACPI_MADT_TYPE_LOCAL_SAPIC,
					  acpi_parse_lsapic, NR_CPUS);
	if (nr_lsapic < 1)
		printk(KERN_ERR PREFIX
		       "Error parsing MADT - no LAPIC entries\n");

#ifdef CONFIG_SMP
	if (available_cpus == 0) {
		printk(KERN_INFO "ACPI: Found 0 CPUS; assuming 1\n");
		printk(KERN_INFO "CPU 0 (0x%04x)", hard_smp_processor_id());
		smp_boot_data.cpu_phys_id[available_cpus] =
		    hard_smp_processor_id();
		available_cpus = 1;	/* We've got at least one of these, no? */
	}
	smp_boot_data.cpu_count = available_cpus;
#endif
	/* Make boot-up look pretty */
	printk(KERN_INFO "%d CPUs available, %d CPUs total\n", available_cpus,
	       total_cpus);

	return 0;
}

L
Len Brown 已提交
705
/*
 * Main boot-time ACPI table walk: parse the MADT and each of its subtable
 * types, then the FADT, and finally (with CONFIG_ACPI_NUMA) build the
 * cpu-to-node map.  Parse failures are logged but are not fatal; the
 * function always returns 0.
 */
int __init acpi_boot_init(void)
{
	int rc;

	/*
	 * MADT
	 * ----
	 * Parse the Multiple APIC Description Table (MADT), if exists.
	 * Note that this table provides platform SMP configuration
	 * information -- the successor to MPS tables.
	 */
	if (acpi_table_parse(ACPI_SIG_MADT, acpi_parse_madt)) {
		printk(KERN_ERR PREFIX "Can't find MADT\n");
		goto skip_madt;
	}

	/* Local APIC */
	rc = acpi_table_parse_madt(ACPI_MADT_TYPE_LOCAL_APIC_OVERRIDE,
				   acpi_parse_lapic_addr_ovr, 0);
	if (rc < 0)
		printk(KERN_ERR PREFIX
		       "Error parsing LAPIC address override entry\n");

	rc = acpi_table_parse_madt(ACPI_MADT_TYPE_LOCAL_APIC_NMI,
				   acpi_parse_lapic_nmi, 0);
	if (rc < 0)
		printk(KERN_ERR PREFIX "Error parsing LAPIC NMI entry\n");

	/* I/O APIC: at least one entry is expected, except on "sn2" */
	rc = acpi_table_parse_madt(ACPI_MADT_TYPE_IO_SAPIC,
				   acpi_parse_iosapic, NR_IOSAPICS);
	if (rc < 1 && !ia64_platform_is("sn2"))
		printk(KERN_ERR PREFIX
		       "Error parsing MADT - no IOSAPIC entries\n");

	/* System-Level Interrupt Routing */
	rc = acpi_table_parse_madt(ACPI_MADT_TYPE_INTERRUPT_SOURCE,
				   acpi_parse_plat_int_src,
				   ACPI_MAX_PLATFORM_INTERRUPTS);
	if (rc < 0)
		printk(KERN_ERR PREFIX
		       "Error parsing platform interrupt source entry\n");

	rc = acpi_table_parse_madt(ACPI_MADT_TYPE_INTERRUPT_OVERRIDE,
				   acpi_parse_int_src_ovr, 0);
	if (rc < 0)
		printk(KERN_ERR PREFIX
		       "Error parsing interrupt source overrides entry\n");

	rc = acpi_table_parse_madt(ACPI_MADT_TYPE_NMI_SOURCE,
				   acpi_parse_nmi_src, 0);
	if (rc < 0)
		printk(KERN_ERR PREFIX "Error parsing NMI SRC entry\n");

skip_madt:
	/*
	 * FADT says whether a legacy keyboard controller is present.
	 * The FADT also contains an SCI_INT line, by which the system
	 * gets interrupts such as power and sleep buttons.  If it's not
	 * on a Legacy interrupt, it needs to be setup.
	 */
	if (acpi_table_parse(ACPI_SIG_FADT, acpi_parse_fadt))
		printk(KERN_ERR PREFIX "Can't find FADT\n");

#ifdef CONFIG_ACPI_NUMA
#ifdef CONFIG_SMP
	/*
	 * No SRAT CPU entries: fill node_cpuid[] from the MADT-derived boot
	 * data, starting at slot 1 and skipping the boot CPU.
	 */
	if (srat_num_cpus == 0) {
		int cpu, slot = 1;

		for (cpu = 0; cpu < smp_boot_data.cpu_count; cpu++) {
			if (smp_boot_data.cpu_phys_id[cpu] ==
			    hard_smp_processor_id())
				continue;
			node_cpuid[slot++].phys_id =
			    smp_boot_data.cpu_phys_id[cpu];
		}
	}
#endif
	build_cpu_to_node_map();
#endif
	return 0;
}

L
Len Brown 已提交
783
/*
 * Translate @gsi to an IRQ number stored in *@irq.
 *
 * Legacy GSIs (below 16) on systems with an 8259 go through
 * isa_irq_to_vector(); all others through gsi_to_irq().
 * Returns 0 on success, -1 if gsi_to_irq() reports no mapping.
 */
int acpi_gsi_to_irq(u32 gsi, unsigned int *irq)
{
	int mapped;

	if (has_8259 && gsi < 16) {
		*irq = isa_irq_to_vector(gsi);
		return 0;
	}

	mapped = gsi_to_irq(gsi);
	if (mapped == -1)
		return -1;

	*irq = mapped;
	return 0;
}

798 799 800 801 802 803 804 805
/*
 * Translate an ISA IRQ to a GSI.  ISA IRQs 0-15 map one-to-one; anything
 * larger is rejected with -1 and *@gsi is left untouched.
 */
int acpi_isa_irq_to_gsi(unsigned isa_irq, u32 *gsi)
{
	if (isa_irq < 16) {
		*gsi = isa_irq;
		return 0;
	}

	return -1;
}

L
Linus Torvalds 已提交
806 807 808 809
/*
 *  ACPI based hotplug CPU support
 */
#ifdef CONFIG_ACPI_HOTPLUG_CPU
810
static __cpuinit
811
int acpi_map_cpu2node(acpi_handle handle, int cpu, int physid)
L
Linus Torvalds 已提交
812 813
{
#ifdef CONFIG_ACPI_NUMA
L
Len Brown 已提交
814
	int pxm_id;
815
	int nid;
L
Linus Torvalds 已提交
816 817 818

	pxm_id = acpi_get_pxm(handle);
	/*
819 820 821 822 823
	 * We don't have cpu-only-node hotadd. But if the system equips
	 * SRAT table, pxm is already found and node is ready.
  	 * So, just pxm_to_nid(pxm) is OK.
	 * This code here is for the system which doesn't have full SRAT
  	 * table for possible cpus.
L
Linus Torvalds 已提交
824
	 */
825
	nid = acpi_map_pxm_to_node(pxm_id);
L
Len Brown 已提交
826
	node_cpuid[cpu].phys_id = physid;
827
	node_cpuid[cpu].nid = nid;
L
Linus Torvalds 已提交
828
#endif
L
Len Brown 已提交
829
	return (0);
L
Linus Torvalds 已提交
830 831
}

832 833 834 835 836 837 838 839 840 841 842 843 844
int additional_cpus __initdata = -1;

/*
 * Early-parameter handler for "additional_cpus=": stores the parsed number
 * in additional_cpus.  A missing value leaves the default untouched.
 * Always returns 0.
 */
static __init int setup_additional_cpus(char *s)
{
	if (!s)
		return 0;

	additional_cpus = simple_strtol(s, NULL, 0);
	return 0;
}

early_param("additional_cpus", setup_additional_cpus);

/*
 * cpu_possible_mask should be static, it cannot change as CPUs
 * are onlined, or offlined. The reason is per-cpu data-structures
 * are allocated by some modules at init time, and don't expect to
 * do this dynamically on cpu arrival/departure.
 * cpu_present_mask on the other hand can change dynamically.
 * In case when cpu_hotplug is not compiled, then we resort to current
 * behaviour, which is cpu_possible == cpu_present.
 * - Ashok Raj
 *
 * Three ways to find out the number of additional hotplug CPUs:
 * - If the BIOS specified disabled CPUs in ACPI/mptables use that.
 * - The user can overwrite it with additional_cpus=NUM
 * - Otherwise don't reserve additional CPUs.
 */
__init void prefill_possible_map(void)
{
	int i;
	int possible, disabled_cpus;

	disabled_cpus = total_cpus - available_cpus;
865

866
 	if (additional_cpus == -1) {
867
 		if (disabled_cpus > 0)
868
			additional_cpus = disabled_cpus;
869
 		else
870
			additional_cpus = 0;
871 872 873 874
 	}

	possible = available_cpus + additional_cpus;

875 876
	if (possible > nr_cpu_ids)
		possible = nr_cpu_ids;
877 878

	printk(KERN_INFO "SMP: Allowing %d CPUs, %d hotplug CPUs\n",
879
		possible, max((possible - available_cpus), 0));
880 881

	for (i = 0; i < possible; i++)
882
		set_cpu_possible(i, true);
883 884
}

885
/*
 * Map a hot-added processor object to a logical CPU.
 *
 * Evaluates _MAT on @handle, checks that it returns an enabled Local SAPIC
 * entry, picks the first logical CPU that is not yet present, binds it to
 * a node, marks it present and records its SAPIC id.  The chosen CPU is
 * returned through *@pcpu.
 *
 * Returns 0 on success, -EINVAL when _MAT fails, does not describe an
 * enabled Local SAPIC, or no free logical CPU is left.
 */
static int __cpuinit _acpi_map_lsapic(acpi_handle handle, int *pcpu)
{
	struct acpi_buffer buffer = { ACPI_ALLOCATE_BUFFER, NULL };
	union acpi_object *obj;
	struct acpi_madt_local_sapic *lsapic;
	cpumask_t tmp_map;
	int cpu, physid;

	if (ACPI_FAILURE(acpi_evaluate_object(handle, "_MAT", NULL, &buffer)))
		return -EINVAL;

	if (!buffer.length || !buffer.pointer) {
		/* kfree(NULL) is a no-op, so this is safe either way */
		kfree(buffer.pointer);
		return -EINVAL;
	}

	obj = buffer.pointer;

	/*
	 * The returned buffer must at least reach the end of lapic_flags,
	 * the last field read below.  sizeof(*lsapic) is deliberately not
	 * used because the size of a Local SAPIC entry can vary.
	 */
	if (obj->type != ACPI_TYPE_BUFFER ||
	    obj->buffer.length <
	    offsetof(struct acpi_madt_local_sapic, lapic_flags) +
	    sizeof(lsapic->lapic_flags)) {
		kfree(buffer.pointer);
		return -EINVAL;
	}

	lsapic = (struct acpi_madt_local_sapic *)obj->buffer.pointer;

	if ((lsapic->header.type != ACPI_MADT_TYPE_LOCAL_SAPIC) ||
	    (!(lsapic->lapic_flags & ACPI_MADT_ENABLED))) {
		kfree(buffer.pointer);
		return -EINVAL;
	}

	physid = ((lsapic->id << 8) | (lsapic->eid));

	/* everything needed has been copied out of the _MAT result */
	kfree(buffer.pointer);

	/* first logical CPU that is not present yet */
	cpumask_complement(&tmp_map, cpu_present_mask);
	cpu = cpumask_first(&tmp_map);
	if (cpu >= nr_cpu_ids)
		return -EINVAL;

	acpi_map_cpu2node(handle, cpu, physid);

	set_cpu_present(cpu, true);
	ia64_cpu_to_sapicid[cpu] = physid;

	acpi_processor_set_pdc(handle);

	*pcpu = cpu;
	return 0;
}

936 937 938 939 940
/*
 * Exported entry point for mapping a hot-added processor.  This is only a
 * __ref wrapper around _acpi_map_lsapic() to silence the section mismatch
 * warning; arguments and return value are passed straight through.
 */
int __ref acpi_map_lsapic(acpi_handle handle, int *pcpu)
{
	int rc = _acpi_map_lsapic(handle, pcpu);

	return rc;
}
L
Len Brown 已提交
941
EXPORT_SYMBOL(acpi_map_lsapic);
L
Linus Torvalds 已提交
942

L
Len Brown 已提交
943
int acpi_unmap_lsapic(int cpu)
L
Linus Torvalds 已提交
944 945
{
	ia64_cpu_to_sapicid[cpu] = -1;
946
	set_cpu_present(cpu, false);
L
Linus Torvalds 已提交
947 948 949 950 951

#ifdef CONFIG_ACPI_NUMA
	/* NUMA specific cleanup's */
#endif

L
Len Brown 已提交
952
	return (0);
L
Linus Torvalds 已提交
953
}
L
Len Brown 已提交
954

L
Linus Torvalds 已提交
955
EXPORT_SYMBOL(acpi_unmap_lsapic);
L
Len Brown 已提交
956
#endif				/* CONFIG_ACPI_HOTPLUG_CPU */
L
Linus Torvalds 已提交
957 958

#ifdef CONFIG_ACPI_NUMA
959 960
/*
 * Namespace-walk callback: if @handle has a _MAT method that returns an
 * I/O SAPIC entry and a usable _PXM, associate the IOSAPIC's GSI base with
 * the corresponding NUMA node.
 *
 * @depth, @context and @ret are unused.  AE_OK is returned in every case
 * so that the walk continues.
 */
static acpi_status acpi_map_iosapic(acpi_handle handle, u32 depth,
				    void *context, void **ret)
{
	struct acpi_buffer buffer = { ACPI_ALLOCATE_BUFFER, NULL };
	struct acpi_madt_io_sapic *iosapic;
	union acpi_object *obj;
	unsigned int gsi_base = 0;
	int is_iosapic = 0;
	int pxm, node;

	/* Only care about objects w/ a method that returns the MADT */
	if (ACPI_FAILURE(acpi_evaluate_object(handle, "_MAT", NULL, &buffer)))
		return AE_OK;

	if (!buffer.length || !buffer.pointer)
		return AE_OK;

	/* Pull out the GSI base, then release the _MAT result in one place. */
	obj = buffer.pointer;
	if (obj->type == ACPI_TYPE_BUFFER &&
	    obj->buffer.length >= sizeof(*iosapic)) {
		iosapic = (struct acpi_madt_io_sapic *)obj->buffer.pointer;
		if (iosapic->header.type == ACPI_MADT_TYPE_IO_SAPIC) {
			gsi_base = iosapic->global_irq_base;
			is_iosapic = 1;
		}
	}
	kfree(buffer.pointer);

	if (!is_iosapic)
		return AE_OK;

	/*
	 * OK, it's an IOSAPIC MADT entry, look for a _PXM value to tell
	 * us which node to associate this with.
	 */
	pxm = acpi_get_pxm(handle);
	if (pxm < 0)
		return AE_OK;

	node = pxm_to_node(pxm);

	/* We know a gsi to node mapping, provided the node is usable */
	if (node < MAX_NUMNODES && node_online(node) &&
	    !cpumask_empty(cpumask_of_node(node)))
		map_iosapic_to_node(gsi_base, node);

	return AE_OK;
}
1011 1012 1013 1014 1015 1016 1017 1018 1019 1020

/*
 * Initcall: walk all ACPI devices and let acpi_map_iosapic() record the
 * node of every IOSAPIC it finds.  The walk's status is ignored; always
 * returns 0.
 */
static int __init
acpi_map_iosapics (void)
{
	(void)acpi_get_devices(NULL, acpi_map_iosapic, NULL, NULL);

	return 0;
}

fs_initcall(acpi_map_iosapics);
#endif				/* CONFIG_ACPI_NUMA */
1021

1022
/*
 * Register a hot-added IOSAPIC at @phys_addr with GSI base @gsi_base and,
 * with CONFIG_ACPI_NUMA, try to associate it with a NUMA node.
 *
 * Returns 0 on success or the error returned by iosapic_init().
 */
int __ref acpi_register_ioapic(acpi_handle handle, u64 phys_addr, u32 gsi_base)
{
	int err = iosapic_init(phys_addr, gsi_base);

	if (err)
		return err;

#ifdef CONFIG_ACPI_NUMA
	acpi_map_iosapic(handle, 0, NULL, NULL);
#endif				/* CONFIG_ACPI_NUMA */

	return 0;
}
L
Len Brown 已提交
1035

1036 1037
EXPORT_SYMBOL(acpi_register_ioapic);

L
Len Brown 已提交
1038
/*
 * Remove the IOSAPIC identified by @gsi_base.  @handle is unused.
 * Returns whatever iosapic_remove() returns.
 */
int acpi_unregister_ioapic(acpi_handle handle, u32 gsi_base)
{
	int rc = iosapic_remove(gsi_base);

	return rc;
}
L
Len Brown 已提交
1042

1043 1044
EXPORT_SYMBOL(acpi_unregister_ioapic);

1045
/*
 * acpi_suspend_lowlevel() - save kernel state and suspend.
 *
 * TBD when IA64 starts to support suspend...
 */
1050
int acpi_suspend_lowlevel(void)
{
	/* Placeholder: nothing is saved or suspended; report success. */
	return 0;
}