irq.c 27.4 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5
/*
 *  Derived from arch/i386/kernel/irq.c
 *    Copyright (C) 1992 Linus Torvalds
 *  Adapted from arch/i386 by Gary Thomas
 *    Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
S
Stephen Rothwell 已提交
6 7
 *  Updated and modified by Cort Dougan <cort@fsmlabs.com>
 *    Copyright (C) 1996-2001 Cort Dougan
L
Linus Torvalds 已提交
8 9
 *  Adapted for Power Macintosh by Paul Mackerras
 *    Copyright (C) 1996 Paul Mackerras (paulus@cs.anu.edu.au)
S
Stephen Rothwell 已提交
10
 *
L
Linus Torvalds 已提交
11 12 13 14 15 16 17 18 19 20
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 *
 * This file contains the code used by various IRQ handling routines:
 * asking for different IRQ's should be done through these routines
 * instead of just grabbing them. Thus setups with different IRQ numbers
 * shouldn't result in any weird surprises, and installing new handlers
 * should be easier.
S
Stephen Rothwell 已提交
21 22 23 24 25 26 27 28
 *
 * The MPC8xx has an interrupt mask in the SIU.  If a bit is set, the
 * interrupt is _enabled_.  As expected, IRQ0 is bit 0 in the 32-bit
 * mask register (of which only 16 are defined), hence the weird shifting
 * and complement of the cached_irq_mask.  I want to be able to stuff
 * this right into the SIU SMASK register.
 * Many of the prep/chrp functions are conditionally compiled on CONFIG_8xx
 * to reduce code space and avoid undefined function references.
L
Linus Torvalds 已提交
29 30
 */

31 32
#undef DEBUG

L
Linus Torvalds 已提交
33 34 35 36 37
#include <linux/module.h>
#include <linux/threads.h>
#include <linux/kernel_stat.h>
#include <linux/signal.h>
#include <linux/sched.h>
S
Stephen Rothwell 已提交
38
#include <linux/ptrace.h>
L
Linus Torvalds 已提交
39 40 41 42 43 44 45
#include <linux/ioport.h>
#include <linux/interrupt.h>
#include <linux/timex.h>
#include <linux/init.h>
#include <linux/slab.h>
#include <linux/delay.h>
#include <linux/irq.h>
S
Stephen Rothwell 已提交
46 47
#include <linux/seq_file.h>
#include <linux/cpumask.h>
L
Linus Torvalds 已提交
48 49
#include <linux/profile.h>
#include <linux/bitops.h>
50 51 52 53
#include <linux/list.h>
#include <linux/radix-tree.h>
#include <linux/mutex.h>
#include <linux/bootmem.h>
J
Jake Moilanen 已提交
54
#include <linux/pci.h>
55
#include <linux/debugfs.h>
56 57
#include <linux/of.h>
#include <linux/of_irq.h>
L
Linus Torvalds 已提交
58 59 60 61 62 63 64 65 66 67

#include <asm/uaccess.h>
#include <asm/system.h>
#include <asm/io.h>
#include <asm/pgtable.h>
#include <asm/irq.h>
#include <asm/cache.h>
#include <asm/prom.h>
#include <asm/ptrace.h>
#include <asm/machdep.h>
68
#include <asm/udbg.h>
69
#include <asm/smp.h>
70

71
#ifdef CONFIG_PPC64
L
Linus Torvalds 已提交
72
#include <asm/paca.h>
73
#include <asm/firmware.h>
74
#include <asm/lv1call.h>
S
Stephen Rothwell 已提交
75
#endif
76 77
#define CREATE_TRACE_POINTS
#include <asm/trace.h>
L
Linus Torvalds 已提交
78

79 80 81
DEFINE_PER_CPU_SHARED_ALIGNED(irq_cpustat_t, irq_stat);
EXPORT_PER_CPU_SYMBOL(irq_stat);

82
int __irq_offset_value;
S
Stephen Rothwell 已提交
83 84

#ifdef CONFIG_PPC32
85 86
EXPORT_SYMBOL(__irq_offset_value);
atomic_t ppc_n_lost_interrupts;
S
Stephen Rothwell 已提交
87 88 89 90 91

#ifdef CONFIG_TAU_INT
extern int tau_initialized;
extern int tau_interrupts(int);
#endif
92
#endif /* CONFIG_PPC32 */
S
Stephen Rothwell 已提交
93 94

#ifdef CONFIG_PPC64
95 96

#ifndef CONFIG_SPARSE_IRQ
L
Linus Torvalds 已提交
97
EXPORT_SYMBOL(irq_desc);
98
#endif
L
Linus Torvalds 已提交
99 100

int distribute_irqs = 1;
101

S
Steven Rostedt 已提交
102
static inline notrace unsigned long get_hard_enabled(void)
103 104 105 106 107 108 109 110 111
{
	unsigned long enabled;

	__asm__ __volatile__("lbz %0,%1(13)"
	: "=r" (enabled) : "i" (offsetof(struct paca_struct, hard_enabled)));

	return enabled;
}

S
Steven Rostedt 已提交
112
static inline notrace void set_soft_enabled(unsigned long enable)
113 114 115 116 117
{
	__asm__ __volatile__("stb %0,%1(13)"
	: : "r" (enable), "i" (offsetof(struct paca_struct, soft_enabled)));
}

D
David Howells 已提交
118
notrace void arch_local_irq_restore(unsigned long en)
119
{
120 121 122 123 124 125 126 127
	/*
	 * get_paca()->soft_enabled = en;
	 * Is it ever valid to use local_irq_restore(0) when soft_enabled is 1?
	 * That was allowed before, and in such a case we do need to take care
	 * that gcc will set soft_enabled directly via r13, not choose to use
	 * an intermediate register, lest we're preempted to a different cpu.
	 */
	set_soft_enabled(en);
128 129 130
	if (!en)
		return;

131
#ifdef CONFIG_PPC_STD_MMU_64
132
	if (firmware_has_feature(FW_FEATURE_ISERIES)) {
133 134 135 136 137 138 139 140 141 142 143 144 145 146
		/*
		 * Do we need to disable preemption here?  Not really: in the
		 * unlikely event that we're preempted to a different cpu in
		 * between getting r13, loading its lppaca_ptr, and loading
		 * its any_int, we might call iseries_handle_interrupts without
		 * an interrupt pending on the new cpu, but that's no disaster,
		 * is it?  And the business of preempting us off the old cpu
		 * would itself involve a local_irq_restore which handles the
		 * interrupt to that cpu.
		 *
		 * But use "local_paca->lppaca_ptr" instead of "get_lppaca()"
		 * to avoid any preemption checking added into get_paca().
		 */
		if (local_paca->lppaca_ptr->int_dword.any_int)
147 148
			iseries_handle_interrupts();
	}
149
#endif /* CONFIG_PPC_STD_MMU_64 */
150

151 152 153 154 155 156 157
	/*
	 * if (get_paca()->hard_enabled) return;
	 * But again we need to take care that gcc gets hard_enabled directly
	 * via r13, not choose to use an intermediate register, lest we're
	 * preempted to a different cpu in between the two instructions.
	 */
	if (get_hard_enabled())
158
		return;
159 160 161 162 163 164 165

	/*
	 * Need to hard-enable interrupts here.  Since currently disabled,
	 * no need to take further asm precautions against preemption; but
	 * use local_paca instead of get_paca() to avoid preemption checking.
	 */
	local_paca->hard_enabled = en;
166 167 168 169 170 171 172 173

#ifndef CONFIG_BOOKE
	/* On server, re-trigger the decrementer if it went negative since
	 * some processors only trigger on edge transitions of the sign bit.
	 *
	 * BookE has a level sensitive decrementer (latches in TSR) so we
	 * don't need that
	 */
174 175
	if ((int)mfspr(SPRN_DEC) < 0)
		mtspr(SPRN_DEC, 1);
176
#endif /* CONFIG_BOOKE */
177 178 179 180 181 182 183 184 185 186

	/*
	 * Force the delivery of pending soft-disabled interrupts on PS3.
	 * Any HV call will have this side effect.
	 */
	if (firmware_has_feature(FW_FEATURE_PS3_LV1)) {
		u64 tmp;
		lv1_get_version_info(&tmp);
	}

187
	__hard_irq_enable();
188
}
D
David Howells 已提交
189
EXPORT_SYMBOL(arch_local_irq_restore);
S
Stephen Rothwell 已提交
190
#endif /* CONFIG_PPC64 */
L
Linus Torvalds 已提交
191

192
int arch_show_interrupts(struct seq_file *p, int prec)
193 194 195 196 197 198 199 200 201 202 203 204
{
	int j;

#if defined(CONFIG_PPC32) && defined(CONFIG_TAU_INT)
	if (tau_initialized) {
		seq_printf(p, "%*s: ", prec, "TAU");
		for_each_online_cpu(j)
			seq_printf(p, "%10u ", tau_interrupts(j));
		seq_puts(p, "  PowerPC             Thermal Assist (cpu temp)\n");
	}
#endif /* CONFIG_PPC32 && CONFIG_TAU_INT */

205 206 207 208 209
	seq_printf(p, "%*s: ", prec, "LOC");
	for_each_online_cpu(j)
		seq_printf(p, "%10u ", per_cpu(irq_stat, j).timer_irqs);
        seq_printf(p, "  Local timer interrupts\n");

210 211 212 213 214
	seq_printf(p, "%*s: ", prec, "SPU");
	for_each_online_cpu(j)
		seq_printf(p, "%10u ", per_cpu(irq_stat, j).spurious_irqs);
	seq_printf(p, "  Spurious interrupts\n");

215 216 217 218 219 220 221 222 223 224
	seq_printf(p, "%*s: ", prec, "CNT");
	for_each_online_cpu(j)
		seq_printf(p, "%10u ", per_cpu(irq_stat, j).pmu_irqs);
	seq_printf(p, "  Performance monitoring interrupts\n");

	seq_printf(p, "%*s: ", prec, "MCE");
	for_each_online_cpu(j)
		seq_printf(p, "%10u ", per_cpu(irq_stat, j).mce_exceptions);
	seq_printf(p, "  Machine check exceptions\n");

225 226 227
	return 0;
}

228 229 230 231 232 233 234 235 236
/*
 * /proc/stat helpers
 */
u64 arch_irq_stat_cpu(unsigned int cpu)
{
	u64 sum = per_cpu(irq_stat, cpu).timer_irqs;

	sum += per_cpu(irq_stat, cpu).pmu_irqs;
	sum += per_cpu(irq_stat, cpu).mce_exceptions;
237
	sum += per_cpu(irq_stat, cpu).spurious_irqs;
238 239 240 241

	return sum;
}

L
Linus Torvalds 已提交
242
#ifdef CONFIG_HOTPLUG_CPU
243
void migrate_irqs(void)
L
Linus Torvalds 已提交
244
{
M
Michael Ellerman 已提交
245
	struct irq_desc *desc;
L
Linus Torvalds 已提交
246 247
	unsigned int irq;
	static int warned;
248
	cpumask_var_t mask;
249
	const struct cpumask *map = cpu_online_mask;
L
Linus Torvalds 已提交
250

251
	alloc_cpumask_var(&mask, GFP_KERNEL);
L
Linus Torvalds 已提交
252

253
	for_each_irq(irq) {
254
		struct irq_data *data;
255 256
		struct irq_chip *chip;

M
Michael Ellerman 已提交
257
		desc = irq_to_desc(irq);
258 259 260
		if (!desc)
			continue;

261 262
		data = irq_desc_get_irq_data(desc);
		if (irqd_is_per_cpu(data))
L
Linus Torvalds 已提交
263 264
			continue;

265
		chip = irq_data_get_irq_chip(data);
266

267
		cpumask_and(mask, data->affinity, map);
268
		if (cpumask_any(mask) >= nr_cpu_ids) {
L
Linus Torvalds 已提交
269
			printk("Breaking affinity for irq %i\n", irq);
270
			cpumask_copy(mask, map);
L
Linus Torvalds 已提交
271
		}
272
		if (chip->irq_set_affinity)
273
			chip->irq_set_affinity(data, mask, true);
M
Michael Ellerman 已提交
274
		else if (desc->action && !(warned++))
L
Linus Torvalds 已提交
275 276 277
			printk("Cannot set affinity for irq %i\n", irq);
	}

278 279
	free_cpumask_var(mask);

L
Linus Torvalds 已提交
280 281 282 283 284 285
	local_irq_enable();
	mdelay(1);
	local_irq_disable();
}
#endif

286 287 288 289 290 291
static inline void handle_one_irq(unsigned int irq)
{
	struct thread_info *curtp, *irqtp;
	unsigned long saved_sp_limit;
	struct irq_desc *desc;

292 293 294 295
	desc = irq_to_desc(irq);
	if (!desc)
		return;

296 297 298 299 300 301
	/* Switch to the irq stack to handle this */
	curtp = current_thread_info();
	irqtp = hardirq_ctx[smp_processor_id()];

	if (curtp == irqtp) {
		/* We're already on the irq stack, just handle it */
302
		desc->handle_irq(irq, desc);
303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318
		return;
	}

	saved_sp_limit = current->thread.ksp_limit;

	irqtp->task = curtp->task;
	irqtp->flags = 0;

	/* Copy the softirq bits in preempt_count so that the
	 * softirq checks work in the hardirq context. */
	irqtp->preempt_count = (irqtp->preempt_count & ~SOFTIRQ_MASK) |
			       (curtp->preempt_count & SOFTIRQ_MASK);

	current->thread.ksp_limit = (unsigned long)irqtp +
		_ALIGN_UP(sizeof(struct thread_info), 16);

319
	call_handle_irq(irq, desc, irqtp, desc->handle_irq);
320 321 322 323 324 325 326 327 328 329
	current->thread.ksp_limit = saved_sp_limit;
	irqtp->task = NULL;

	/* Set any flag that may have been set on the
	 * alternate stack
	 */
	if (irqtp->flags)
		set_bits(irqtp->flags, &curtp->flags);
}

330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345
/*
 * With CONFIG_DEBUG_STACKOVERFLOW, complain and dump the stack when fewer
 * than 2KB remain above the thread_info.  Compiles to nothing otherwise.
 */
static inline void check_stack_overflow(void)
{
#ifdef CONFIG_DEBUG_STACKOVERFLOW
	/* Offset of the stack pointer within the THREAD_SIZE stack area. */
	long sp = __get_SP() & (THREAD_SIZE-1);

	if (likely(sp >= (sizeof(struct thread_info) + 2048)))
		return;

	printk("do_IRQ: stack overflow: %ld\n",
		sp - sizeof(struct thread_info));
	dump_stack();
#endif
}

L
Linus Torvalds 已提交
346 347
void do_IRQ(struct pt_regs *regs)
{
348
	struct pt_regs *old_regs = set_irq_regs(regs);
349
	unsigned int irq;
L
Linus Torvalds 已提交
350

351 352
	trace_irq_entry(regs);

353
	irq_enter();
L
Linus Torvalds 已提交
354

355
	check_stack_overflow();
L
Linus Torvalds 已提交
356

O
Olaf Hering 已提交
357
	irq = ppc_md.get_irq();
L
Linus Torvalds 已提交
358

359 360 361
	if (irq != NO_IRQ && irq != NO_IRQ_IGNORE)
		handle_one_irq(irq);
	else if (irq != NO_IRQ_IGNORE)
362
		__get_cpu_var(irq_stat).spurious_irqs++;
363

364
	irq_exit();
365
	set_irq_regs(old_regs);
S
Stephen Rothwell 已提交
366

367
#ifdef CONFIG_PPC_ISERIES
368 369
	if (firmware_has_feature(FW_FEATURE_ISERIES) &&
			get_lppaca()->int_dword.fields.decr_int) {
370 371 372
		get_lppaca()->int_dword.fields.decr_int = 0;
		/* Signal a fake decrementer interrupt */
		timer_interrupt(regs);
373 374
	}
#endif
375 376

	trace_irq_exit(regs);
377
}
L
Linus Torvalds 已提交
378 379 380

/*
 * Boot time interrupt setup: run the platform init_IRQ hook when one is
 * provided, then initialise the exception-level and irq stack contexts.
 */
void __init init_IRQ(void)
{
	if (ppc_md.init_IRQ != NULL) {
		ppc_md.init_IRQ();
	}

	exc_lvl_ctx_init();
	irq_ctx_init();
}

389 390 391 392 393 394 395 396
#if defined(CONFIG_BOOKE) || defined(CONFIG_40x)
struct thread_info   *critirq_ctx[NR_CPUS] __read_mostly;
struct thread_info    *dbgirq_ctx[NR_CPUS] __read_mostly;
struct thread_info *mcheckirq_ctx[NR_CPUS] __read_mostly;

void exc_lvl_ctx_init(void)
{
	struct thread_info *tp;
397
	int i, cpu_nr;
398 399

	for_each_possible_cpu(i) {
400 401 402 403 404 405 406 407
#ifdef CONFIG_PPC64
		cpu_nr = i;
#else
		cpu_nr = get_hard_smp_processor_id(i);
#endif
		memset((void *)critirq_ctx[cpu_nr], 0, THREAD_SIZE);
		tp = critirq_ctx[cpu_nr];
		tp->cpu = cpu_nr;
408 409 410
		tp->preempt_count = 0;

#ifdef CONFIG_BOOKE
411 412 413
		memset((void *)dbgirq_ctx[cpu_nr], 0, THREAD_SIZE);
		tp = dbgirq_ctx[cpu_nr];
		tp->cpu = cpu_nr;
414 415
		tp->preempt_count = 0;

416 417 418
		memset((void *)mcheckirq_ctx[cpu_nr], 0, THREAD_SIZE);
		tp = mcheckirq_ctx[cpu_nr];
		tp->cpu = cpu_nr;
419 420 421 422 423
		tp->preempt_count = HARDIRQ_OFFSET;
#endif
	}
}
#endif
L
Linus Torvalds 已提交
424

425 426
struct thread_info *softirq_ctx[NR_CPUS] __read_mostly;
struct thread_info *hardirq_ctx[NR_CPUS] __read_mostly;
L
Linus Torvalds 已提交
427 428 429 430 431 432

void irq_ctx_init(void)
{
	struct thread_info *tp;
	int i;

433
	for_each_possible_cpu(i) {
L
Linus Torvalds 已提交
434 435 436
		memset((void *)softirq_ctx[i], 0, THREAD_SIZE);
		tp = softirq_ctx[i];
		tp->cpu = i;
437
		tp->preempt_count = 0;
L
Linus Torvalds 已提交
438 439 440 441 442 443 444 445

		memset((void *)hardirq_ctx[i], 0, THREAD_SIZE);
		tp = hardirq_ctx[i];
		tp->cpu = i;
		tp->preempt_count = HARDIRQ_OFFSET;
	}
}

446 447 448
static inline void do_softirq_onstack(void)
{
	struct thread_info *curtp, *irqtp;
449
	unsigned long saved_sp_limit = current->thread.ksp_limit;
450 451 452 453

	curtp = current_thread_info();
	irqtp = softirq_ctx[smp_processor_id()];
	irqtp->task = curtp->task;
454
	irqtp->flags = 0;
455 456
	current->thread.ksp_limit = (unsigned long)irqtp +
				    _ALIGN_UP(sizeof(struct thread_info), 16);
457
	call_do_softirq(irqtp);
458
	current->thread.ksp_limit = saved_sp_limit;
459
	irqtp->task = NULL;
460 461 462 463 464 465

	/* Set any flag that may have been set on the
	 * alternate stack
	 */
	if (irqtp->flags)
		set_bits(irqtp->flags, &curtp->flags);
466
}
L
Linus Torvalds 已提交
467 468 469 470 471 472 473 474 475 476

/*
 * Process pending softirqs, unless called from interrupt context.
 * Interrupts are disabled around the pending check and the processing.
 */
void do_softirq(void)
{
	unsigned long flags;

	if (!in_interrupt()) {
		local_irq_save(flags);

		if (local_softirq_pending()) {
			do_softirq_onstack();
		}

		local_irq_restore(flags);
	}
}


/*
485
 * IRQ controller and virtual interrupts
L
Linus Torvalds 已提交
486 487
 */

488 489 490 491 492 493 494 495 496 497
/* The main irq map itself is an array of NR_IRQS entries containing the
 * associated host and hw irq number. An entry with a host of NULL is free.
 * An entry can be allocated if it's free; the allocator always sets
 * hwirq to the host's invalid irq number first and then fills in host.
 */
/* One slot of the irq_map table, which is indexed by virtual irq number. */
struct irq_map_entry {
	/* hw irq number behind this virq; the owning host's inval_irq while
	 * the slot is allocated but not (or no longer) mapped */
	irq_hw_number_t	hwirq;
	/* host owning this virq, NULL when the slot is free */
	struct irq_host	*host;
};

498
static LIST_HEAD(irq_hosts);
499
static DEFINE_RAW_SPINLOCK(irq_big_lock);
500
static DEFINE_MUTEX(revmap_trees_mutex);
501
static struct irq_map_entry irq_map[NR_IRQS];
502 503
static unsigned int irq_virq_count = NR_IRQS;
static struct irq_host *irq_default_host;
L
Linus Torvalds 已提交
504

505 506 507 508 509 510
irq_hw_number_t irqd_to_hwirq(struct irq_data *d)
{
	return irq_map[d->irq].hwirq;
}
EXPORT_SYMBOL_GPL(irqd_to_hwirq);

511 512 513 514 515 516
irq_hw_number_t virq_to_hw(unsigned int virq)
{
	return irq_map[virq].hwirq;
}
EXPORT_SYMBOL_GPL(virq_to_hw);

517 518 519 520 521 522
/* Tell whether @virq is currently owned by @host according to irq_map. */
bool virq_is_host(unsigned int virq, struct irq_host *host)
{
	struct irq_host *owner = irq_map[virq].host;

	return owner == host;
}
EXPORT_SYMBOL_GPL(virq_is_host);

523 524 525 526 527
/*
 * Default ->match implementation: a host matches @np only if it has a
 * device node and that node is @np.  Returns 1 on match, 0 otherwise.
 */
static int default_irq_host_match(struct irq_host *h, struct device_node *np)
{
	if (h->of_node == NULL)
		return 0;

	return h->of_node == np;
}

528
/*
 * Allocate and register a new irq host.
 *
 * @of_node:     device node of the controller; a reference is taken
 * @revmap_type: one of the IRQ_HOST_MAP_* reverse map types
 * @revmap_arg:  number of entries of the linear reverse map (only used
 *               for IRQ_HOST_MAP_LINEAR)
 * @ops:         host callbacks; a missing ->match is replaced with
 *               default_irq_host_match
 * @inval_irq:   hw irq number that denotes "no interrupt" for this host
 *
 * Returns the new host, or NULL if the allocation failed or if a legacy
 * host is requested while one is already registered.
 */
struct irq_host *irq_alloc_host(struct device_node *of_node,
				unsigned int revmap_type,
				unsigned int revmap_arg,
				struct irq_host_ops *ops,
				irq_hw_number_t inval_irq)
{
	unsigned int alloc_size = sizeof(struct irq_host);
	struct irq_host *host;
	unsigned long flags;
	unsigned int *rmap;
	unsigned int i;

	/* A linear reverse map lives right behind the host structure. */
	if (revmap_type == IRQ_HOST_MAP_LINEAR)
		alloc_size += revmap_arg * sizeof(unsigned int);

	host = kzalloc(alloc_size, GFP_KERNEL);
	if (!host)
		return NULL;

	host->revmap_type = revmap_type;
	host->inval_irq = inval_irq;
	host->ops = ops;
	host->of_node = of_node_get(of_node);

	if (!host->ops->match)
		host->ops->match = default_irq_host_match;

	raw_spin_lock_irqsave(&irq_big_lock, flags);

	/*
	 * Only one legacy controller may exist; the host pointer of irq 0
	 * serves as the "legacy host already allocated" marker.
	 */
	if (revmap_type == IRQ_HOST_MAP_LEGACY && irq_map[0].host != NULL) {
		raw_spin_unlock_irqrestore(&irq_big_lock, flags);
		of_node_put(host->of_node);
		kfree(host);
		return NULL;
	}
	if (revmap_type == IRQ_HOST_MAP_LEGACY)
		irq_map[0].host = host;

	list_add(&host->link, &irq_hosts);
	raw_spin_unlock_irqrestore(&irq_big_lock, flags);

	/* Reverse map specific setup */
	switch (revmap_type) {
	case IRQ_HOST_MAP_LEGACY:
		/* 0 is always the invalid number for legacy */
		host->inval_irq = 0;

		/* Become the host of every legacy interrupt, 1:1 mapped */
		for (i = 1; i < NUM_ISA_INTERRUPTS; i++) {
			irq_map[i].hwirq = i;
			smp_wmb();
			irq_map[i].host = host;
			smp_wmb();

			/*
			 * Legacy flags stay at their defaults here;
			 * irq_create_mapping() can be used later to change
			 * them explicitly.
			 */
			ops->map(host, i, i);

			/* Clear norequest flags */
			irq_clear_status_flags(i, IRQ_NOREQUEST);
		}
		break;

	case IRQ_HOST_MAP_LINEAR:
		rmap = (unsigned int *)(host + 1);
		for (i = 0; i < revmap_arg; i++)
			rmap[i] = NO_IRQ;
		host->revmap_data.linear.size = revmap_arg;
		/* Publish the table pointer only after size and contents. */
		smp_wmb();
		host->revmap_data.linear.revmap = rmap;
		break;

	case IRQ_HOST_MAP_TREE:
		INIT_RADIX_TREE(&host->revmap_data.tree, GFP_KERNEL);
		break;

	default:
		break;
	}

	pr_debug("irq: Allocated host of type %d @0x%p\n", revmap_type, host);

	return host;
}

616
struct irq_host *irq_find_host(struct device_node *node)
L
Linus Torvalds 已提交
617
{
618 619 620 621 622 623 624 625
	struct irq_host *h, *found = NULL;
	unsigned long flags;

	/* We might want to match the legacy controller last since
	 * it might potentially be set to match all interrupts in
	 * the absence of a device node. This isn't a problem so far
	 * yet though...
	 */
626
	raw_spin_lock_irqsave(&irq_big_lock, flags);
627
	list_for_each_entry(h, &irq_hosts, link)
628
		if (h->ops->match(h, node)) {
629 630 631
			found = h;
			break;
		}
632
	raw_spin_unlock_irqrestore(&irq_big_lock, flags);
633 634 635 636 637 638 639
	return found;
}
EXPORT_SYMBOL_GPL(irq_find_host);

void irq_set_default_host(struct irq_host *host)
{
	pr_debug("irq: Default host set to @0x%p\n", host);
L
Linus Torvalds 已提交
640

641 642
	irq_default_host = host;
}
L
Linus Torvalds 已提交
643

644 645 646
void irq_set_virq_count(unsigned int count)
{
	pr_debug("irq: Trying to set virq count to %d\n", count);
647

648 649 650 651 652
	BUG_ON(count < NUM_ISA_INTERRUPTS);
	if (count < NR_IRQS)
		irq_virq_count = count;
}

653 654 655
/*
 * Finish the setup of an already reserved @virq: allocate its descriptor,
 * record @hwirq in irq_map and let the host map it.
 *
 * Returns 0 on success.  On failure everything acquired so far, including
 * the virq reservation itself, is released and -1 is returned.
 */
static int irq_setup_virq(struct irq_host *host, unsigned int virq,
			    irq_hw_number_t hwirq)
{
	int res;

	res = irq_alloc_desc_at(virq, 0);
	if (res != virq) {
		pr_debug("irq: -> allocating desc failed\n");
		irq_free_virt(virq, 1);
		return -1;
	}

	/* Record the hw number before the host gets to see the mapping. */
	smp_wmb();
	irq_map[virq].hwirq = hwirq;
	smp_mb();

	if (host->ops->map(host, virq, hwirq)) {
		pr_debug("irq: -> mapping failed, freeing\n");
		irq_free_descs(virq, 1);
		irq_free_virt(virq, 1);
		return -1;
	}

	irq_clear_status_flags(virq, IRQ_NOREQUEST);

	return 0;
}
684

685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708
/*
 * Allocate a virq for @host (the default host when NULL) and set it up
 * with a hw irq number equal to the virq number.
 *
 * BUGs when no host is available and warns when the host is not of type
 * IRQ_HOST_MAP_NOMAP.  Returns the virq, or NO_IRQ on failure.
 */
unsigned int irq_create_direct_mapping(struct irq_host *host)
{
	unsigned int virq;

	if (!host)
		host = irq_default_host;

	BUG_ON(host == NULL);
	WARN_ON(host->revmap_type != IRQ_HOST_MAP_NOMAP);

	virq = irq_alloc_virt(host, 1, 0);
	if (virq == NO_IRQ) {
		pr_debug("irq: create_direct virq allocation failed\n");
		return NO_IRQ;
	}

	pr_debug("irq: create_direct obtained virq %d\n", virq);

	/* hw number == virq number for direct mappings */
	return irq_setup_virq(host, virq, virq) ? NO_IRQ : virq;
}

709
unsigned int irq_create_mapping(struct irq_host *host,
710
				irq_hw_number_t hwirq)
711 712 713
{
	unsigned int virq, hint;

714
	pr_debug("irq: irq_create_mapping(0x%p, 0x%lx)\n", host, hwirq);
715 716 717 718 719 720 721 722 723

	/* Look for default host if nececssary */
	if (host == NULL)
		host = irq_default_host;
	if (host == NULL) {
		printk(KERN_WARNING "irq_create_mapping called for"
		       " NULL host, hwirq=%lx\n", hwirq);
		WARN_ON(1);
		return NO_IRQ;
L
Linus Torvalds 已提交
724
	}
725
	pr_debug("irq: -> using host @%p\n", host);
L
Linus Torvalds 已提交
726

727
	/* Check if mapping already exists */
728
	virq = irq_find_mapping(host, hwirq);
729
	if (virq != NO_IRQ) {
730 731
		pr_debug("irq: -> existing mapping on virq %d\n", virq);
		return virq;
L
Linus Torvalds 已提交
732 733
	}

734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750
	/* Get a virtual interrupt number */
	if (host->revmap_type == IRQ_HOST_MAP_LEGACY) {
		/* Handle legacy */
		virq = (unsigned int)hwirq;
		if (virq == 0 || virq >= NUM_ISA_INTERRUPTS)
			return NO_IRQ;
		return virq;
	} else {
		/* Allocate a virtual interrupt number */
		hint = hwirq % irq_virq_count;
		virq = irq_alloc_virt(host, 1, hint);
		if (virq == NO_IRQ) {
			pr_debug("irq: -> virq allocation failed\n");
			return NO_IRQ;
		}
	}

751
	if (irq_setup_virq(host, virq, hwirq))
752
		return NO_IRQ;
753

754
	pr_debug("irq: irq %lu on host %s mapped to virtual irq %u\n",
755 756
		hwirq, host->of_node ? host->of_node->full_name : "null", virq);

L
Linus Torvalds 已提交
757
	return virq;
758 759 760
}
EXPORT_SYMBOL_GPL(irq_create_mapping);

761
unsigned int irq_create_of_mapping(struct device_node *controller,
762
				   const u32 *intspec, unsigned int intsize)
763 764 765
{
	struct irq_host *host;
	irq_hw_number_t hwirq;
766 767
	unsigned int type = IRQ_TYPE_NONE;
	unsigned int virq;
L
Linus Torvalds 已提交
768

769 770 771 772
	if (controller == NULL)
		host = irq_default_host;
	else
		host = irq_find_host(controller);
773 774 775
	if (host == NULL) {
		printk(KERN_WARNING "irq: no irq host found for %s !\n",
		       controller->full_name);
776
		return NO_IRQ;
777
	}
778 779 780 781 782 783

	/* If host has no translation, then we assume interrupt line */
	if (host->ops->xlate == NULL)
		hwirq = intspec[0];
	else {
		if (host->ops->xlate(host, controller, intspec, intsize,
784
				     &hwirq, &type))
785
			return NO_IRQ;
L
Linus Torvalds 已提交
786
	}
787

788 789 790 791 792 793 794
	/* Create mapping */
	virq = irq_create_mapping(host, hwirq);
	if (virq == NO_IRQ)
		return virq;

	/* Set type if specified and different than the current one */
	if (type != IRQ_TYPE_NONE &&
795
	    type != (irqd_get_trigger_type(irq_get_irq_data(virq))))
796
		irq_set_irq_type(virq, type);
797
	return virq;
L
Linus Torvalds 已提交
798
}
799
EXPORT_SYMBOL_GPL(irq_create_of_mapping);
L
Linus Torvalds 已提交
800

801 802
void irq_dispose_mapping(unsigned int virq)
{
803
	struct irq_host *host;
804
	irq_hw_number_t hwirq;
L
Linus Torvalds 已提交
805

806 807 808 809
	if (virq == NO_IRQ)
		return;

	host = irq_map[virq].host;
810
	if (WARN_ON(host == NULL))
811
		return;
L
Linus Torvalds 已提交
812

813 814 815
	/* Never unmap legacy interrupts */
	if (host->revmap_type == IRQ_HOST_MAP_LEGACY)
		return;
L
Linus Torvalds 已提交
816

817 818
	irq_set_status_flags(virq, IRQ_NOREQUEST);

819
	/* remove chip and handler */
820
	irq_set_chip_and_handler(virq, NULL, NULL);
821 822 823 824 825 826 827 828 829 830 831 832 833 834

	/* Make sure it's completed */
	synchronize_irq(virq);

	/* Tell the PIC about it */
	if (host->ops->unmap)
		host->ops->unmap(host, virq);
	smp_mb();

	/* Clear reverse map */
	hwirq = irq_map[virq].hwirq;
	switch(host->revmap_type) {
	case IRQ_HOST_MAP_LINEAR:
		if (hwirq < host->revmap_data.linear.size)
835
			host->revmap_data.linear.revmap[hwirq] = NO_IRQ;
836 837
		break;
	case IRQ_HOST_MAP_TREE:
838
		mutex_lock(&revmap_trees_mutex);
839
		radix_tree_delete(&host->revmap_data.tree, hwirq);
840
		mutex_unlock(&revmap_trees_mutex);
841 842
		break;
	}
L
Linus Torvalds 已提交
843

844 845 846
	/* Destroy map */
	smp_mb();
	irq_map[virq].hwirq = host->inval_irq;
L
Linus Torvalds 已提交
847

T
Thomas Gleixner 已提交
848
	irq_free_descs(virq, 1);
849 850
	/* Free it */
	irq_free_virt(virq, 1);
L
Linus Torvalds 已提交
851
}
852
EXPORT_SYMBOL_GPL(irq_dispose_mapping);
L
Linus Torvalds 已提交
853

854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884
/*
 * Slow path lookup of the virq mapped to @hwirq on @host (the default
 * host when NULL).
 *
 * Legacy hosts return @hwirq as is.  Otherwise the non-legacy part of
 * irq_map is scanned circularly, starting at hwirq modulo the virq count.
 * Returns NO_IRQ if there is no host or no mapping.
 */
unsigned int irq_find_mapping(struct irq_host *host,
			      irq_hw_number_t hwirq)
{
	unsigned int start, pos;

	/* Fall back to the default host if none was given */
	if (!host)
		host = irq_default_host;
	if (!host)
		return NO_IRQ;

	/* Legacy is 1:1, nothing to search */
	if (host->revmap_type == IRQ_HOST_MAP_LEGACY)
		return hwirq;

	/* The scan never enters the legacy range */
	start = hwirq % irq_virq_count;
	if (start < NUM_ISA_INTERRUPTS)
		start = NUM_ISA_INTERRUPTS;

	pos = start;
	do {
		const struct irq_map_entry *entry = &irq_map[pos];

		if (entry->host == host && entry->hwirq == hwirq)
			return pos;

		/* Wrap around to the first non-legacy slot */
		if (++pos >= irq_virq_count)
			pos = NUM_ISA_INTERRUPTS;
	} while (pos != start);

	return NO_IRQ;
}
EXPORT_SYMBOL_GPL(irq_find_mapping);
L
Linus Torvalds 已提交
885

886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920
#ifdef CONFIG_SMP
/*
 * Pick a cpu to route an interrupt to and return its hard cpu id.
 *
 * The first online cpu of @mask is used, unless @mask equals cpu_all_mask
 * or contains no online cpu: then online cpus are handed out round-robin.
 */
int irq_choose_cpu(const struct cpumask *mask)
{
	static DEFINE_RAW_SPINLOCK(irq_rover_lock);
	static int irq_rover;
	unsigned long flags;
	int cpuid;

	if (!cpumask_equal(mask, cpu_all_mask)) {
		cpuid = cpumask_first_and(mask, cpu_online_mask);
		if (cpuid < nr_cpu_ids)
			return get_hard_smp_processor_id(cpuid);
		/* no online cpu in the mask: fall through to round-robin */
	}

	/* Round-robin distribution, the rover is protected by its lock */
	raw_spin_lock_irqsave(&irq_rover_lock, flags);

	irq_rover = cpumask_next(irq_rover, cpu_online_mask);
	if (irq_rover >= nr_cpu_ids)
		irq_rover = cpumask_first(cpu_online_mask);
	cpuid = irq_rover;

	raw_spin_unlock_irqrestore(&irq_rover_lock, flags);

	return get_hard_smp_processor_id(cpuid);
}
#else
/* Uniprocessor: always the hard id of the cpu we are running on. */
int irq_choose_cpu(const struct cpumask *mask)
{
	return hard_smp_processor_id();
}
#endif
921

922 923
/*
 * Reverse map lookup for hosts using a radix tree: return the virq mapped
 * to @hwirq on @host.
 *
 * Falls back to irq_find_mapping() when the host is not of type
 * IRQ_HOST_MAP_TREE (with a one-time warning) or the tree has no entry.
 */
unsigned int irq_radix_revmap_lookup(struct irq_host *host,
				     irq_hw_number_t hwirq)
{
	struct irq_map_entry *entry;

	if (WARN_ON_ONCE(host->revmap_type != IRQ_HOST_MAP_TREE))
		return irq_find_mapping(host, hwirq);

	/*
	 * The returned pointer refers to the static global irq_map, but
	 * freeing an irq can delete nodes on the lookup path via call_rcu,
	 * hence the RCU read section around the tree walk.
	 */
	rcu_read_lock();
	entry = radix_tree_lookup(&host->revmap_data.tree, hwirq);
	rcu_read_unlock();

	/*
	 * A miss should not happen in practice: it means the node was never
	 * inserted into the tree.  Use the linear search in that case.
	 */
	if (!entry)
		return irq_find_mapping(host, hwirq);

	/* The virq is the index of the entry within irq_map. */
	return entry - irq_map;
}

/*
 * Add the @hwirq -> @virq association to the radix tree of @host.
 *
 * Warns and does nothing when the host is not of type IRQ_HOST_MAP_TREE;
 * NO_IRQ is silently ignored.  The result of the insertion is not checked.
 */
void irq_radix_revmap_insert(struct irq_host *host, unsigned int virq,
			     irq_hw_number_t hwirq)
{
	if (WARN_ON(host->revmap_type != IRQ_HOST_MAP_TREE))
		return;

	if (virq == NO_IRQ)
		return;

	/* Tree updates are serialised by revmap_trees_mutex */
	mutex_lock(&revmap_trees_mutex);
	radix_tree_insert(&host->revmap_data.tree, hwirq, &irq_map[virq]);
	mutex_unlock(&revmap_trees_mutex);
}

967 968
/*
 * Reverse map lookup for hosts using a linear table: return the virq
 * mapped to @hwirq on @host.
 *
 * Falls back to irq_find_mapping() when the host is not of type
 * IRQ_HOST_MAP_LINEAR (with a one-time warning), when @hwirq is outside
 * the table or when the table is not set up yet.  An empty table slot is
 * filled from the slow path on first use.
 */
unsigned int irq_linear_revmap(struct irq_host *host,
			       irq_hw_number_t hwirq)
{
	unsigned int *table, *slot;

	if (WARN_ON_ONCE(host->revmap_type != IRQ_HOST_MAP_LINEAR))
		return irq_find_mapping(host, hwirq);

	/* Out of the table's range */
	if (unlikely(hwirq >= host->revmap_data.linear.size))
		return irq_find_mapping(host, hwirq);

	/* Table not allocated */
	table = host->revmap_data.linear.revmap;
	if (unlikely(table == NULL))
		return irq_find_mapping(host, hwirq);

	/* Cache the slow path result if the slot is still empty */
	slot = &table[hwirq];
	if (unlikely(*slot == NO_IRQ))
		*slot = irq_find_mapping(host, hwirq);

	return *slot;
}

991 992 993 994 995 996
unsigned int irq_alloc_virt(struct irq_host *host,
			    unsigned int count,
			    unsigned int hint)
{
	unsigned long flags;
	unsigned int i, j, found = NO_IRQ;
997

998 999 1000
	if (count == 0 || count > (irq_virq_count - NUM_ISA_INTERRUPTS))
		return NO_IRQ;

1001
	raw_spin_lock_irqsave(&irq_big_lock, flags);
1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012

	/* Use hint for 1 interrupt if any */
	if (count == 1 && hint >= NUM_ISA_INTERRUPTS &&
	    hint < irq_virq_count && irq_map[hint].host == NULL) {
		found = hint;
		goto hint_found;
	}

	/* Look for count consecutive numbers in the allocatable
	 * (non-legacy) space
	 */
1013 1014 1015 1016 1017 1018 1019 1020 1021 1022
	for (i = NUM_ISA_INTERRUPTS, j = 0; i < irq_virq_count; i++) {
		if (irq_map[i].host != NULL)
			j = 0;
		else
			j++;

		if (j == count) {
			found = i - count + 1;
			break;
		}
1023 1024
	}
	if (found == NO_IRQ) {
1025
		raw_spin_unlock_irqrestore(&irq_big_lock, flags);
1026 1027 1028 1029 1030 1031 1032 1033
		return NO_IRQ;
	}
 hint_found:
	for (i = found; i < (found + count); i++) {
		irq_map[i].hwirq = host->inval_irq;
		smp_wmb();
		irq_map[i].host = host;
	}
1034
	raw_spin_unlock_irqrestore(&irq_big_lock, flags);
1035 1036 1037 1038
	return found;
}

void irq_free_virt(unsigned int virq, unsigned int count)
L
Linus Torvalds 已提交
1039 1040
{
	unsigned long flags;
1041
	unsigned int i;
L
Linus Torvalds 已提交
1042

1043 1044
	WARN_ON (virq < NUM_ISA_INTERRUPTS);
	WARN_ON (count == 0 || (virq + count) > irq_virq_count);
L
Linus Torvalds 已提交
1045

1046 1047 1048 1049 1050 1051 1052 1053 1054 1055 1056 1057 1058
	if (virq < NUM_ISA_INTERRUPTS) {
		if (virq + count < NUM_ISA_INTERRUPTS)
			return;
		count  =- NUM_ISA_INTERRUPTS - virq;
		virq = NUM_ISA_INTERRUPTS;
	}

	if (count > irq_virq_count || virq > irq_virq_count - count) {
		if (virq > irq_virq_count)
			return;
		count = irq_virq_count - virq;
	}

1059
	raw_spin_lock_irqsave(&irq_big_lock, flags);
1060 1061
	for (i = virq; i < (virq + count); i++) {
		struct irq_host *host;
L
Linus Torvalds 已提交
1062

1063 1064 1065 1066 1067
		host = irq_map[i].host;
		irq_map[i].hwirq = host->inval_irq;
		smp_wmb();
		irq_map[i].host = NULL;
	}
1068
	raw_spin_unlock_irqrestore(&irq_big_lock, flags);
L
Linus Torvalds 已提交
1069
}
1070

1071
/* Nothing to set up early on this architecture: always returns 0. */
int arch_early_irq_init(void)
{
	const int status = 0;

	return status;
}

1076 1077 1078 1079
#ifdef CONFIG_VIRQ_DEBUG
static int virq_debug_show(struct seq_file *m, void *private)
{
	unsigned long flags;
1080
	struct irq_desc *desc;
1081
	const char *p;
1082
	static const char none[] = "none";
1083
	void *data;
1084 1085
	int i;

1086 1087
	seq_printf(m, "%-5s  %-7s  %-15s  %-18s  %s\n", "virq", "hwirq",
		      "chip name", "chip data", "host name");
1088

1089
	for (i = 1; i < nr_irqs; i++) {
M
Michael Ellerman 已提交
1090
		desc = irq_to_desc(i);
1091 1092 1093
		if (!desc)
			continue;

1094
		raw_spin_lock_irqsave(&desc->lock, flags);
1095 1096

		if (desc->action && desc->action->handler) {
1097 1098
			struct irq_chip *chip;

1099
			seq_printf(m, "%5d  ", i);
1100
			seq_printf(m, "0x%05lx  ", irq_map[i].hwirq);
1101

1102
			chip = irq_desc_get_chip(desc);
1103 1104
			if (chip && chip->name)
				p = chip->name;
1105 1106 1107 1108
			else
				p = none;
			seq_printf(m, "%-15s  ", p);

1109 1110 1111
			data = irq_desc_get_chip_data(desc);
			seq_printf(m, "0x%16p  ", data);

1112 1113 1114 1115 1116 1117 1118
			if (irq_map[i].host && irq_map[i].host->of_node)
				p = irq_map[i].host->of_node->full_name;
			else
				p = none;
			seq_printf(m, "%s\n", p);
		}

1119
		raw_spin_unlock_irqrestore(&desc->lock, flags);
1120 1121 1122 1123 1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139
	}

	return 0;
}

/* open() of the debugfs file: bind it to virq_debug_show via single_open(). */
static int virq_debug_open(struct inode *inode, struct file *file)
{
	void *priv = inode->i_private;

	return single_open(file, virq_debug_show, priv);
}

/*
 * File operations of the "virq_mapping" debugfs file: a single_open()
 * based seq_file whose content is produced by virq_debug_show().
 */
static const struct file_operations virq_debug_fops = {
	.open = virq_debug_open,
	.read = seq_read,
	.llseek = seq_lseek,
	.release = single_release,
};

/*
 * Create the read-only "virq_mapping" file under powerpc_debugfs_root.
 * Returns 0 on success and -ENOMEM if the file could not be created.
 */
static int __init irq_debugfs_init(void)
{
	struct dentry *entry;

	entry = debugfs_create_file("virq_mapping", S_IRUGO,
				    powerpc_debugfs_root, NULL,
				    &virq_debug_fops);

	return entry ? 0 : -ENOMEM;
}
__initcall(irq_debugfs_init);
#endif /* CONFIG_VIRQ_DEBUG */

1148
#ifdef CONFIG_PPC64
L
Linus Torvalds 已提交
1149 1150 1151 1152 1153 1154 1155
/*
 * Handler of the "noirqdistrib" kernel command line option: clears
 * distribute_irqs.  @str is not used.  Returns 1.
 */
static int __init setup_noirqdistrib(char *str)
{
	distribute_irqs = 0;

	return 1;
}

__setup("noirqdistrib", setup_noirqdistrib);
S
Stephen Rothwell 已提交
1156
#endif /* CONFIG_PPC64 */