irq.c 27.5 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5
/*
 *  Derived from arch/i386/kernel/irq.c
 *    Copyright (C) 1992 Linus Torvalds
 *  Adapted from arch/i386 by Gary Thomas
 *    Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
S
Stephen Rothwell 已提交
6 7
 *  Updated and modified by Cort Dougan <cort@fsmlabs.com>
 *    Copyright (C) 1996-2001 Cort Dougan
L
Linus Torvalds 已提交
8 9
 *  Adapted for Power Macintosh by Paul Mackerras
 *    Copyright (C) 1996 Paul Mackerras (paulus@cs.anu.edu.au)
S
Stephen Rothwell 已提交
10
 *
L
Linus Torvalds 已提交
11 12 13 14 15 16 17 18 19 20
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 *
 * This file contains the code used by various IRQ handling routines:
 * asking for different IRQ's should be done through these routines
 * instead of just grabbing them. Thus setups with different IRQ numbers
 * shouldn't result in any weird surprises, and installing new handlers
 * should be easier.
S
Stephen Rothwell 已提交
21 22 23 24 25 26 27 28
 *
 * The MPC8xx has an interrupt mask in the SIU.  If a bit is set, the
 * interrupt is _enabled_.  As expected, IRQ0 is bit 0 in the 32-bit
 * mask register (of which only 16 are defined), hence the weird shifting
 * and complement of the cached_irq_mask.  I want to be able to stuff
 * this right into the SIU SMASK register.
 * Many of the prep/chrp functions are conditional compiled on CONFIG_8xx
 * to reduce code space and undefined function references.
L
Linus Torvalds 已提交
29 30
 */

31 32
#undef DEBUG

33
#include <linux/export.h>
L
Linus Torvalds 已提交
34 35 36 37
#include <linux/threads.h>
#include <linux/kernel_stat.h>
#include <linux/signal.h>
#include <linux/sched.h>
S
Stephen Rothwell 已提交
38
#include <linux/ptrace.h>
L
Linus Torvalds 已提交
39 40 41 42 43 44 45
#include <linux/ioport.h>
#include <linux/interrupt.h>
#include <linux/timex.h>
#include <linux/init.h>
#include <linux/slab.h>
#include <linux/delay.h>
#include <linux/irq.h>
S
Stephen Rothwell 已提交
46 47
#include <linux/seq_file.h>
#include <linux/cpumask.h>
L
Linus Torvalds 已提交
48 49
#include <linux/profile.h>
#include <linux/bitops.h>
50 51 52 53
#include <linux/list.h>
#include <linux/radix-tree.h>
#include <linux/mutex.h>
#include <linux/bootmem.h>
J
Jake Moilanen 已提交
54
#include <linux/pci.h>
55
#include <linux/debugfs.h>
56 57
#include <linux/of.h>
#include <linux/of_irq.h>
L
Linus Torvalds 已提交
58 59 60 61 62 63 64 65 66 67

#include <asm/uaccess.h>
#include <asm/system.h>
#include <asm/io.h>
#include <asm/pgtable.h>
#include <asm/irq.h>
#include <asm/cache.h>
#include <asm/prom.h>
#include <asm/ptrace.h>
#include <asm/machdep.h>
68
#include <asm/udbg.h>
69
#include <asm/smp.h>
70

71
#ifdef CONFIG_PPC64
L
Linus Torvalds 已提交
72
#include <asm/paca.h>
73
#include <asm/firmware.h>
74
#include <asm/lv1call.h>
S
Stephen Rothwell 已提交
75
#endif
76 77
#define CREATE_TRACE_POINTS
#include <asm/trace.h>
L
Linus Torvalds 已提交
78

79 80 81
DEFINE_PER_CPU_SHARED_ALIGNED(irq_cpustat_t, irq_stat);
EXPORT_PER_CPU_SYMBOL(irq_stat);

82
int __irq_offset_value;
S
Stephen Rothwell 已提交
83 84

#ifdef CONFIG_PPC32
85 86
EXPORT_SYMBOL(__irq_offset_value);
atomic_t ppc_n_lost_interrupts;
S
Stephen Rothwell 已提交
87 88 89 90 91

#ifdef CONFIG_TAU_INT
extern int tau_initialized;
extern int tau_interrupts(int);
#endif
92
#endif /* CONFIG_PPC32 */
S
Stephen Rothwell 已提交
93 94

#ifdef CONFIG_PPC64
95

L
Linus Torvalds 已提交
96
int distribute_irqs = 1;
97

S
Steven Rostedt 已提交
98
static inline notrace unsigned long get_hard_enabled(void)
99 100 101 102 103 104 105 106 107
{
	unsigned long enabled;

	__asm__ __volatile__("lbz %0,%1(13)"
	: "=r" (enabled) : "i" (offsetof(struct paca_struct, hard_enabled)));

	return enabled;
}

S
Steven Rostedt 已提交
108
static inline notrace void set_soft_enabled(unsigned long enable)
109 110 111 112 113
{
	__asm__ __volatile__("stb %0,%1(13)"
	: : "r" (enable), "i" (offsetof(struct paca_struct, soft_enabled)));
}

114 115 116
/*
 * Re-arm the decrementer if its next event is already due.
 *
 * Compares the value returned by get_tb_or_rtc() with this cpu's
 * decrementers_next_tb and, when that deadline has been reached, loads
 * the decrementer with 1.  Preemption is disabled around the per-cpu
 * access.
 */
static inline notrace void decrementer_check_overflow(void)
{
	u64 now = get_tb_or_rtc();
	u64 *next_tb;

	preempt_disable();
	next_tb = &__get_cpu_var(decrementers_next_tb);

	if (now >= *next_tb)
		set_dec(1);
	preempt_enable();
}

D
David Howells 已提交
127
notrace void arch_local_irq_restore(unsigned long en)
128
{
129 130 131 132 133 134 135 136
	/*
	 * get_paca()->soft_enabled = en;
	 * Is it ever valid to use local_irq_restore(0) when soft_enabled is 1?
	 * That was allowed before, and in such a case we do need to take care
	 * that gcc will set soft_enabled directly via r13, not choose to use
	 * an intermediate register, lest we're preempted to a different cpu.
	 */
	set_soft_enabled(en);
137 138 139
	if (!en)
		return;

140
#ifdef CONFIG_PPC_STD_MMU_64
141
	if (firmware_has_feature(FW_FEATURE_ISERIES)) {
142 143 144 145 146 147 148 149 150 151 152 153 154 155
		/*
		 * Do we need to disable preemption here?  Not really: in the
		 * unlikely event that we're preempted to a different cpu in
		 * between getting r13, loading its lppaca_ptr, and loading
		 * its any_int, we might call iseries_handle_interrupts without
		 * an interrupt pending on the new cpu, but that's no disaster,
		 * is it?  And the business of preempting us off the old cpu
		 * would itself involve a local_irq_restore which handles the
		 * interrupt to that cpu.
		 *
		 * But use "local_paca->lppaca_ptr" instead of "get_lppaca()"
		 * to avoid any preemption checking added into get_paca().
		 */
		if (local_paca->lppaca_ptr->int_dword.any_int)
156 157
			iseries_handle_interrupts();
	}
158
#endif /* CONFIG_PPC_STD_MMU_64 */
159

160 161 162 163 164 165 166
	/*
	 * if (get_paca()->hard_enabled) return;
	 * But again we need to take care that gcc gets hard_enabled directly
	 * via r13, not choose to use an intermediate register, lest we're
	 * preempted to a different cpu in between the two instructions.
	 */
	if (get_hard_enabled())
167
		return;
168 169 170 171 172 173 174

	/*
	 * Need to hard-enable interrupts here.  Since currently disabled,
	 * no need to take further asm precautions against preemption; but
	 * use local_paca instead of get_paca() to avoid preemption checking.
	 */
	local_paca->hard_enabled = en;
175

176 177 178 179 180
	/*
	 * Trigger the decrementer if we have a pending event. Some processors
	 * only trigger on edge transitions of the sign bit. We might also
	 * have disabled interrupts long enough that the decrementer wrapped
	 * to positive.
181
	 */
182
	decrementer_check_overflow();
183 184 185 186 187 188

	/*
	 * Force the delivery of pending soft-disabled interrupts on PS3.
	 * Any HV call will have this side effect.
	 */
	if (firmware_has_feature(FW_FEATURE_PS3_LV1)) {
189 190
		u64 tmp, tmp2;
		lv1_get_version_info(&tmp, &tmp2);
191 192
	}

193
	__hard_irq_enable();
194
}
D
David Howells 已提交
195
EXPORT_SYMBOL(arch_local_irq_restore);
S
Stephen Rothwell 已提交
196
#endif /* CONFIG_PPC64 */
L
Linus Torvalds 已提交
197

198
int arch_show_interrupts(struct seq_file *p, int prec)
199 200 201 202 203 204 205 206 207 208 209 210
{
	int j;

#if defined(CONFIG_PPC32) && defined(CONFIG_TAU_INT)
	if (tau_initialized) {
		seq_printf(p, "%*s: ", prec, "TAU");
		for_each_online_cpu(j)
			seq_printf(p, "%10u ", tau_interrupts(j));
		seq_puts(p, "  PowerPC             Thermal Assist (cpu temp)\n");
	}
#endif /* CONFIG_PPC32 && CONFIG_TAU_INT */

211 212 213 214 215
	seq_printf(p, "%*s: ", prec, "LOC");
	for_each_online_cpu(j)
		seq_printf(p, "%10u ", per_cpu(irq_stat, j).timer_irqs);
        seq_printf(p, "  Local timer interrupts\n");

216 217 218 219 220
	seq_printf(p, "%*s: ", prec, "SPU");
	for_each_online_cpu(j)
		seq_printf(p, "%10u ", per_cpu(irq_stat, j).spurious_irqs);
	seq_printf(p, "  Spurious interrupts\n");

221 222 223 224 225 226 227 228 229 230
	seq_printf(p, "%*s: ", prec, "CNT");
	for_each_online_cpu(j)
		seq_printf(p, "%10u ", per_cpu(irq_stat, j).pmu_irqs);
	seq_printf(p, "  Performance monitoring interrupts\n");

	seq_printf(p, "%*s: ", prec, "MCE");
	for_each_online_cpu(j)
		seq_printf(p, "%10u ", per_cpu(irq_stat, j).mce_exceptions);
	seq_printf(p, "  Machine check exceptions\n");

231 232 233
	return 0;
}

234 235 236 237 238 239 240 241 242
/*
 * /proc/stat helpers
 */
/*
 * Return the sum of the architecture-specific interrupt counters of
 * @cpu: timer, performance-monitor, machine-check and spurious.
 */
u64 arch_irq_stat_cpu(unsigned int cpu)
{
	u64 sum = per_cpu(irq_stat, cpu).timer_irqs;

	sum += per_cpu(irq_stat, cpu).pmu_irqs;
	sum += per_cpu(irq_stat, cpu).mce_exceptions;
	sum += per_cpu(irq_stat, cpu).spurious_irqs;

	return sum;
}

L
Linus Torvalds 已提交
248
#ifdef CONFIG_HOTPLUG_CPU
249
void migrate_irqs(void)
L
Linus Torvalds 已提交
250
{
M
Michael Ellerman 已提交
251
	struct irq_desc *desc;
L
Linus Torvalds 已提交
252 253
	unsigned int irq;
	static int warned;
254
	cpumask_var_t mask;
255
	const struct cpumask *map = cpu_online_mask;
L
Linus Torvalds 已提交
256

257
	alloc_cpumask_var(&mask, GFP_KERNEL);
L
Linus Torvalds 已提交
258

259
	for_each_irq(irq) {
260
		struct irq_data *data;
261 262
		struct irq_chip *chip;

M
Michael Ellerman 已提交
263
		desc = irq_to_desc(irq);
264 265 266
		if (!desc)
			continue;

267 268
		data = irq_desc_get_irq_data(desc);
		if (irqd_is_per_cpu(data))
L
Linus Torvalds 已提交
269 270
			continue;

271
		chip = irq_data_get_irq_chip(data);
272

273
		cpumask_and(mask, data->affinity, map);
274
		if (cpumask_any(mask) >= nr_cpu_ids) {
L
Linus Torvalds 已提交
275
			printk("Breaking affinity for irq %i\n", irq);
276
			cpumask_copy(mask, map);
L
Linus Torvalds 已提交
277
		}
278
		if (chip->irq_set_affinity)
279
			chip->irq_set_affinity(data, mask, true);
M
Michael Ellerman 已提交
280
		else if (desc->action && !(warned++))
L
Linus Torvalds 已提交
281 282 283
			printk("Cannot set affinity for irq %i\n", irq);
	}

284 285
	free_cpumask_var(mask);

L
Linus Torvalds 已提交
286 287 288 289 290 291
	local_irq_enable();
	mdelay(1);
	local_irq_disable();
}
#endif

292 293 294 295 296 297
static inline void handle_one_irq(unsigned int irq)
{
	struct thread_info *curtp, *irqtp;
	unsigned long saved_sp_limit;
	struct irq_desc *desc;

298 299 300 301
	desc = irq_to_desc(irq);
	if (!desc)
		return;

302 303 304 305 306 307
	/* Switch to the irq stack to handle this */
	curtp = current_thread_info();
	irqtp = hardirq_ctx[smp_processor_id()];

	if (curtp == irqtp) {
		/* We're already on the irq stack, just handle it */
308
		desc->handle_irq(irq, desc);
309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324
		return;
	}

	saved_sp_limit = current->thread.ksp_limit;

	irqtp->task = curtp->task;
	irqtp->flags = 0;

	/* Copy the softirq bits in preempt_count so that the
	 * softirq checks work in the hardirq context. */
	irqtp->preempt_count = (irqtp->preempt_count & ~SOFTIRQ_MASK) |
			       (curtp->preempt_count & SOFTIRQ_MASK);

	current->thread.ksp_limit = (unsigned long)irqtp +
		_ALIGN_UP(sizeof(struct thread_info), 16);

325
	call_handle_irq(irq, desc, irqtp, desc->handle_irq);
326 327 328 329 330 331 332 333 334 335
	current->thread.ksp_limit = saved_sp_limit;
	irqtp->task = NULL;

	/* Set any flag that may have been set on the
	 * alternate stack
	 */
	if (irqtp->flags)
		set_bits(irqtp->flags, &curtp->flags);
}

336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351
/*
 * Debug aid: complain when the current stack is nearly exhausted.
 *
 * Only active with CONFIG_DEBUG_STACKOVERFLOW; otherwise a no-op.  The
 * offset of the stack pointer inside its THREAD_SIZE area is compared
 * with sizeof(struct thread_info) + 2KB; below that, the remaining
 * byte count is printed and a stack dump is produced.
 */
static inline void check_stack_overflow(void)
{
#ifdef CONFIG_DEBUG_STACKOVERFLOW
	long sp;

	sp = __get_SP() & (THREAD_SIZE-1);

	/* check for stack overflow: is there less than 2KB free? */
	if (unlikely(sp < (sizeof(struct thread_info) + 2048))) {
		/* keep the arithmetic signed so it matches the %ld format */
		printk("do_IRQ: stack overflow: %ld\n",
			sp - (long)sizeof(struct thread_info));
		dump_stack();
	}
#endif
}

L
Linus Torvalds 已提交
352 353
void do_IRQ(struct pt_regs *regs)
{
354
	struct pt_regs *old_regs = set_irq_regs(regs);
355
	unsigned int irq;
L
Linus Torvalds 已提交
356

357 358
	trace_irq_entry(regs);

359
	irq_enter();
L
Linus Torvalds 已提交
360

361
	check_stack_overflow();
L
Linus Torvalds 已提交
362

O
Olaf Hering 已提交
363
	irq = ppc_md.get_irq();
L
Linus Torvalds 已提交
364

365 366 367
	if (irq != NO_IRQ && irq != NO_IRQ_IGNORE)
		handle_one_irq(irq);
	else if (irq != NO_IRQ_IGNORE)
368
		__get_cpu_var(irq_stat).spurious_irqs++;
369

370
	irq_exit();
371
	set_irq_regs(old_regs);
S
Stephen Rothwell 已提交
372

373
#ifdef CONFIG_PPC_ISERIES
374 375
	if (firmware_has_feature(FW_FEATURE_ISERIES) &&
			get_lppaca()->int_dword.fields.decr_int) {
376 377 378
		get_lppaca()->int_dword.fields.decr_int = 0;
		/* Signal a fake decrementer interrupt */
		timer_interrupt(regs);
379 380
	}
#endif
381 382

	trace_irq_exit(regs);
383
}
L
Linus Torvalds 已提交
384 385 386

/*
 * Boot-time interrupt setup: run the platform's init_IRQ hook when one
 * is provided, then initialise the exception-level and irq stack
 * contexts.
 */
void __init init_IRQ(void)
{
	if (ppc_md.init_IRQ)
		ppc_md.init_IRQ();

	exc_lvl_ctx_init();

	irq_ctx_init();
}

395 396 397 398 399 400 401 402
#if defined(CONFIG_BOOKE) || defined(CONFIG_40x)
struct thread_info   *critirq_ctx[NR_CPUS] __read_mostly;
struct thread_info    *dbgirq_ctx[NR_CPUS] __read_mostly;
struct thread_info *mcheckirq_ctx[NR_CPUS] __read_mostly;

void exc_lvl_ctx_init(void)
{
	struct thread_info *tp;
403
	int i, cpu_nr;
404 405

	for_each_possible_cpu(i) {
406 407 408 409 410 411 412 413
#ifdef CONFIG_PPC64
		cpu_nr = i;
#else
		cpu_nr = get_hard_smp_processor_id(i);
#endif
		memset((void *)critirq_ctx[cpu_nr], 0, THREAD_SIZE);
		tp = critirq_ctx[cpu_nr];
		tp->cpu = cpu_nr;
414 415 416
		tp->preempt_count = 0;

#ifdef CONFIG_BOOKE
417 418 419
		memset((void *)dbgirq_ctx[cpu_nr], 0, THREAD_SIZE);
		tp = dbgirq_ctx[cpu_nr];
		tp->cpu = cpu_nr;
420 421
		tp->preempt_count = 0;

422 423 424
		memset((void *)mcheckirq_ctx[cpu_nr], 0, THREAD_SIZE);
		tp = mcheckirq_ctx[cpu_nr];
		tp->cpu = cpu_nr;
425 426 427 428 429
		tp->preempt_count = HARDIRQ_OFFSET;
#endif
	}
}
#endif
L
Linus Torvalds 已提交
430

431 432
struct thread_info *softirq_ctx[NR_CPUS] __read_mostly;
struct thread_info *hardirq_ctx[NR_CPUS] __read_mostly;
L
Linus Torvalds 已提交
433 434 435 436 437 438

void irq_ctx_init(void)
{
	struct thread_info *tp;
	int i;

439
	for_each_possible_cpu(i) {
L
Linus Torvalds 已提交
440 441 442
		memset((void *)softirq_ctx[i], 0, THREAD_SIZE);
		tp = softirq_ctx[i];
		tp->cpu = i;
443
		tp->preempt_count = 0;
L
Linus Torvalds 已提交
444 445 446 447 448 449 450 451

		memset((void *)hardirq_ctx[i], 0, THREAD_SIZE);
		tp = hardirq_ctx[i];
		tp->cpu = i;
		tp->preempt_count = HARDIRQ_OFFSET;
	}
}

452 453 454
static inline void do_softirq_onstack(void)
{
	struct thread_info *curtp, *irqtp;
455
	unsigned long saved_sp_limit = current->thread.ksp_limit;
456 457 458 459

	curtp = current_thread_info();
	irqtp = softirq_ctx[smp_processor_id()];
	irqtp->task = curtp->task;
460
	irqtp->flags = 0;
461 462
	current->thread.ksp_limit = (unsigned long)irqtp +
				    _ALIGN_UP(sizeof(struct thread_info), 16);
463
	call_do_softirq(irqtp);
464
	current->thread.ksp_limit = saved_sp_limit;
465
	irqtp->task = NULL;
466 467 468 469 470 471

	/* Set any flag that may have been set on the
	 * alternate stack
	 */
	if (irqtp->flags)
		set_bits(irqtp->flags, &curtp->flags);
472
}
L
Linus Torvalds 已提交
473 474 475 476 477 478 479 480 481 482

/*
 * Process pending softirqs unless called from interrupt context.
 *
 * Interrupts are disabled around the pending check and the run on the
 * softirq stack; the previous interrupt state is restored on exit.
 */
void do_softirq(void)
{
	unsigned long flags;

	if (in_interrupt())
		return;

	local_irq_save(flags);

	if (local_softirq_pending())
		do_softirq_onstack();

	local_irq_restore(flags);
}


/*
491
 * IRQ controller and virtual interrupts
L
Linus Torvalds 已提交
492 493
 */

494 495 496 497 498 499 500 501 502 503
/* The main irq map itself is an array of NR_IRQS entries containing the
 * associated host and hardware irq number, indexed by virtual irq number.
 * An entry with a host of NULL is free.  An entry can be allocated if
 * it's free; the allocator always sets hwirq first to the host's invalid
 * irq number and only then fills in the host.
 */
struct irq_map_entry {
	irq_hw_number_t	hwirq;	/* hardware irq number for this virq */
	struct irq_host	*host;	/* owning host, NULL when the entry is free */
};

504
static LIST_HEAD(irq_hosts);
505
static DEFINE_RAW_SPINLOCK(irq_big_lock);
506
static DEFINE_MUTEX(revmap_trees_mutex);
507
static struct irq_map_entry irq_map[NR_IRQS];
508 509
static unsigned int irq_virq_count = NR_IRQS;
static struct irq_host *irq_default_host;
L
Linus Torvalds 已提交
510

511 512 513 514 515 516
irq_hw_number_t irqd_to_hwirq(struct irq_data *d)
{
	return irq_map[d->irq].hwirq;
}
EXPORT_SYMBOL_GPL(irqd_to_hwirq);

517 518 519 520 521 522
irq_hw_number_t virq_to_hw(unsigned int virq)
{
	return irq_map[virq].hwirq;
}
EXPORT_SYMBOL_GPL(virq_to_hw);

523 524 525 526 527 528
bool virq_is_host(unsigned int virq, struct irq_host *host)
{
	return irq_map[virq].host == host;
}
EXPORT_SYMBOL_GPL(virq_is_host);

529 530 531 532 533
/*
 * Default host match callback: a host matches @np only when it has a
 * device node of its own and that node is @np.  Returns 1 on a match,
 * 0 otherwise.
 */
static int default_irq_host_match(struct irq_host *h, struct device_node *np)
{
	if (h->of_node == NULL)
		return 0;

	return h->of_node == np;
}

534
/*
 * Allocate and register a new interrupt host (controller domain).
 *
 * @of_node:     device node of the controller; a reference is taken.
 * @revmap_type: one of the IRQ_HOST_MAP_* reverse-map types.
 * @revmap_arg:  for IRQ_HOST_MAP_LINEAR, number of reverse-map entries.
 * @ops:         host callbacks; a NULL ->match is replaced by
 *               default_irq_host_match (this writes to the caller's ops).
 * @inval_irq:   hwirq value meaning "invalid" for this host (forced to 0
 *               for legacy hosts).
 *
 * Returns the new host, or NULL if allocation fails or a legacy host is
 * already registered.  For a legacy host, virqs 1..NUM_ISA_INTERRUPTS-1
 * are mapped 1:1 straight away.
 */
struct irq_host *irq_alloc_host(struct device_node *of_node,
				unsigned int revmap_type,
				unsigned int revmap_arg,
				struct irq_host_ops *ops,
				irq_hw_number_t inval_irq)
{
	struct irq_host *host;
	unsigned int size = sizeof(struct irq_host);
	unsigned int i;
	unsigned int *rmap;
	unsigned long flags;

	/* Allocate structure and revmap table if using linear mapping */
	if (revmap_type == IRQ_HOST_MAP_LINEAR)
		size += revmap_arg * sizeof(unsigned int);
	host = kzalloc(size, GFP_KERNEL);
	if (host == NULL)
		return NULL;

	/* Fill structure */
	host->revmap_type = revmap_type;
	host->inval_irq = inval_irq;
	host->ops = ops;
	host->of_node = of_node_get(of_node);

	if (host->ops->match == NULL)
		host->ops->match = default_irq_host_match;

	raw_spin_lock_irqsave(&irq_big_lock, flags);

	/* If it's a legacy controller, check for duplicates and
	 * mark it as allocated (we use irq 0 host pointer for that)
	 */
	if (revmap_type == IRQ_HOST_MAP_LEGACY) {
		if (irq_map[0].host != NULL) {
			raw_spin_unlock_irqrestore(&irq_big_lock, flags);
			of_node_put(host->of_node);
			kfree(host);
			return NULL;
		}
		irq_map[0].host = host;
	}

	list_add(&host->link, &irq_hosts);
	raw_spin_unlock_irqrestore(&irq_big_lock, flags);

	/* Additional setups per revmap type */
	switch(revmap_type) {
	case IRQ_HOST_MAP_LEGACY:
		/* 0 is always the invalid number for legacy */
		host->inval_irq = 0;
		/* setup us as the host for all legacy interrupts */
		for (i = 1; i < NUM_ISA_INTERRUPTS; i++) {
			irq_map[i].hwirq = i;
			smp_wmb();
			irq_map[i].host = host;
			smp_wmb();

			/* Legacy flags are left to default at this point,
			 * one can then use irq_create_mapping() to
			 * explicitly change them
			 */
			ops->map(host, i, i);

			/* Clear norequest flags */
			irq_clear_status_flags(i, IRQ_NOREQUEST);
		}
		break;
	case IRQ_HOST_MAP_LINEAR:
		/* the revmap table lives directly behind the host struct */
		rmap = (unsigned int *)(host + 1);
		for (i = 0; i < revmap_arg; i++)
			rmap[i] = NO_IRQ;
		host->revmap_data.linear.size = revmap_arg;
		smp_wmb();
		host->revmap_data.linear.revmap = rmap;
		break;
	case IRQ_HOST_MAP_TREE:
		INIT_RADIX_TREE(&host->revmap_data.tree, GFP_KERNEL);
		break;
	default:
		break;
	}

	pr_debug("irq: Allocated host of type %d @0x%p\n", revmap_type, host);

	return host;
}

622
struct irq_host *irq_find_host(struct device_node *node)
L
Linus Torvalds 已提交
623
{
624 625 626 627 628 629 630 631
	struct irq_host *h, *found = NULL;
	unsigned long flags;

	/* We might want to match the legacy controller last since
	 * it might potentially be set to match all interrupts in
	 * the absence of a device node. This isn't a problem so far
	 * yet though...
	 */
632
	raw_spin_lock_irqsave(&irq_big_lock, flags);
633
	list_for_each_entry(h, &irq_hosts, link)
634
		if (h->ops->match(h, node)) {
635 636 637
			found = h;
			break;
		}
638
	raw_spin_unlock_irqrestore(&irq_big_lock, flags);
639 640 641 642 643 644 645
	return found;
}
EXPORT_SYMBOL_GPL(irq_find_host);

void irq_set_default_host(struct irq_host *host)
{
	pr_debug("irq: Default host set to @0x%p\n", host);
L
Linus Torvalds 已提交
646

647 648
	irq_default_host = host;
}
L
Linus Torvalds 已提交
649

650 651 652
void irq_set_virq_count(unsigned int count)
{
	pr_debug("irq: Trying to set virq count to %d\n", count);
653

654 655 656 657 658
	BUG_ON(count < NUM_ISA_INTERRUPTS);
	if (count < NR_IRQS)
		irq_virq_count = count;
}

659 660 661
/*
 * Finish setting up an already reserved @virq for @hwirq on @host.
 *
 * Allocates the irq descriptor, records @hwirq in irq_map, calls the
 * host's ->map() and clears IRQ_NOREQUEST.
 *
 * Returns 0 on success and -1 on failure.  On failure the virq is
 * released again with irq_free_virt() (and the descriptor freed if it
 * had been allocated), so the caller must not free it a second time.
 */
static int irq_setup_virq(struct irq_host *host, unsigned int virq,
			    irq_hw_number_t hwirq)
{
	int res;

	res = irq_alloc_desc_at(virq, 0);
	if (res != virq) {
		pr_debug("irq: -> allocating desc failed\n");
		goto error;
	}

	/* map it */
	smp_wmb();
	irq_map[virq].hwirq = hwirq;
	smp_mb();

	if (host->ops->map(host, virq, hwirq)) {
		pr_debug("irq: -> mapping failed, freeing\n");
		goto errdesc;
	}

	irq_clear_status_flags(virq, IRQ_NOREQUEST);

	return 0;

errdesc:
	irq_free_descs(virq, 1);
error:
	irq_free_virt(virq, 1);
	return -1;
}
690

691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714
/*
 * Allocate a virq on a no-map host and use that same number as hwirq.
 *
 * @host: target host, or NULL for the default host (there must be one).
 *
 * Returns the new virq, or NO_IRQ if no virq could be reserved or its
 * setup failed.
 */
unsigned int irq_create_direct_mapping(struct irq_host *host)
{
	unsigned int virq;

	if (host == NULL)
		host = irq_default_host;

	BUG_ON(host == NULL);
	WARN_ON(host->revmap_type != IRQ_HOST_MAP_NOMAP);

	virq = irq_alloc_virt(host, 1, 0);
	if (virq != NO_IRQ) {
		pr_debug("irq: create_direct obtained virq %d\n", virq);

		/* hwirq and virq are the same number on a direct mapping */
		return irq_setup_virq(host, virq, virq) ? NO_IRQ : virq;
	}

	pr_debug("irq: create_direct virq allocation failed\n");
	return NO_IRQ;
}

715
unsigned int irq_create_mapping(struct irq_host *host,
716
				irq_hw_number_t hwirq)
717 718 719
{
	unsigned int virq, hint;

720
	pr_debug("irq: irq_create_mapping(0x%p, 0x%lx)\n", host, hwirq);
721 722 723 724 725 726 727 728 729

	/* Look for default host if nececssary */
	if (host == NULL)
		host = irq_default_host;
	if (host == NULL) {
		printk(KERN_WARNING "irq_create_mapping called for"
		       " NULL host, hwirq=%lx\n", hwirq);
		WARN_ON(1);
		return NO_IRQ;
L
Linus Torvalds 已提交
730
	}
731
	pr_debug("irq: -> using host @%p\n", host);
L
Linus Torvalds 已提交
732

733
	/* Check if mapping already exists */
734
	virq = irq_find_mapping(host, hwirq);
735
	if (virq != NO_IRQ) {
736 737
		pr_debug("irq: -> existing mapping on virq %d\n", virq);
		return virq;
L
Linus Torvalds 已提交
738 739
	}

740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756
	/* Get a virtual interrupt number */
	if (host->revmap_type == IRQ_HOST_MAP_LEGACY) {
		/* Handle legacy */
		virq = (unsigned int)hwirq;
		if (virq == 0 || virq >= NUM_ISA_INTERRUPTS)
			return NO_IRQ;
		return virq;
	} else {
		/* Allocate a virtual interrupt number */
		hint = hwirq % irq_virq_count;
		virq = irq_alloc_virt(host, 1, hint);
		if (virq == NO_IRQ) {
			pr_debug("irq: -> virq allocation failed\n");
			return NO_IRQ;
		}
	}

757
	if (irq_setup_virq(host, virq, hwirq))
758
		return NO_IRQ;
759

760
	pr_debug("irq: irq %lu on host %s mapped to virtual irq %u\n",
761 762
		hwirq, host->of_node ? host->of_node->full_name : "null", virq);

L
Linus Torvalds 已提交
763
	return virq;
764 765 766
}
EXPORT_SYMBOL_GPL(irq_create_mapping);

767
unsigned int irq_create_of_mapping(struct device_node *controller,
768
				   const u32 *intspec, unsigned int intsize)
769 770 771
{
	struct irq_host *host;
	irq_hw_number_t hwirq;
772 773
	unsigned int type = IRQ_TYPE_NONE;
	unsigned int virq;
L
Linus Torvalds 已提交
774

775 776 777 778
	if (controller == NULL)
		host = irq_default_host;
	else
		host = irq_find_host(controller);
779 780 781
	if (host == NULL) {
		printk(KERN_WARNING "irq: no irq host found for %s !\n",
		       controller->full_name);
782
		return NO_IRQ;
783
	}
784 785 786 787 788 789

	/* If host has no translation, then we assume interrupt line */
	if (host->ops->xlate == NULL)
		hwirq = intspec[0];
	else {
		if (host->ops->xlate(host, controller, intspec, intsize,
790
				     &hwirq, &type))
791
			return NO_IRQ;
L
Linus Torvalds 已提交
792
	}
793

794 795 796 797 798 799 800
	/* Create mapping */
	virq = irq_create_mapping(host, hwirq);
	if (virq == NO_IRQ)
		return virq;

	/* Set type if specified and different than the current one */
	if (type != IRQ_TYPE_NONE &&
801
	    type != (irqd_get_trigger_type(irq_get_irq_data(virq))))
802
		irq_set_irq_type(virq, type);
803
	return virq;
L
Linus Torvalds 已提交
804
}
805
EXPORT_SYMBOL_GPL(irq_create_of_mapping);
L
Linus Torvalds 已提交
806

807 808
void irq_dispose_mapping(unsigned int virq)
{
809
	struct irq_host *host;
810
	irq_hw_number_t hwirq;
L
Linus Torvalds 已提交
811

812 813 814 815
	if (virq == NO_IRQ)
		return;

	host = irq_map[virq].host;
816
	if (WARN_ON(host == NULL))
817
		return;
L
Linus Torvalds 已提交
818

819 820 821
	/* Never unmap legacy interrupts */
	if (host->revmap_type == IRQ_HOST_MAP_LEGACY)
		return;
L
Linus Torvalds 已提交
822

823 824
	irq_set_status_flags(virq, IRQ_NOREQUEST);

825
	/* remove chip and handler */
826
	irq_set_chip_and_handler(virq, NULL, NULL);
827 828 829 830 831 832 833 834 835 836 837 838 839 840

	/* Make sure it's completed */
	synchronize_irq(virq);

	/* Tell the PIC about it */
	if (host->ops->unmap)
		host->ops->unmap(host, virq);
	smp_mb();

	/* Clear reverse map */
	hwirq = irq_map[virq].hwirq;
	switch(host->revmap_type) {
	case IRQ_HOST_MAP_LINEAR:
		if (hwirq < host->revmap_data.linear.size)
841
			host->revmap_data.linear.revmap[hwirq] = NO_IRQ;
842 843
		break;
	case IRQ_HOST_MAP_TREE:
844
		mutex_lock(&revmap_trees_mutex);
845
		radix_tree_delete(&host->revmap_data.tree, hwirq);
846
		mutex_unlock(&revmap_trees_mutex);
847 848
		break;
	}
L
Linus Torvalds 已提交
849

850 851 852
	/* Destroy map */
	smp_mb();
	irq_map[virq].hwirq = host->inval_irq;
L
Linus Torvalds 已提交
853

T
Thomas Gleixner 已提交
854
	irq_free_descs(virq, 1);
855 856
	/* Free it */
	irq_free_virt(virq, 1);
L
Linus Torvalds 已提交
857
}
858
EXPORT_SYMBOL_GPL(irq_dispose_mapping);
L
Linus Torvalds 已提交
859

860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890
/*
 * Look up the virq that @hwirq of @host is mapped to (slow path).
 *
 * @host: host to search, or NULL for the default host.
 *
 * Legacy hosts return @hwirq itself.  Other hosts are searched linearly
 * through the non-legacy part of irq_map, starting at
 * hwirq % irq_virq_count and wrapping around once.
 *
 * Returns the virq, or NO_IRQ when there is no host or no mapping.
 */
unsigned int irq_find_mapping(struct irq_host *host,
			      irq_hw_number_t hwirq)
{
	unsigned int start = hwirq % irq_virq_count;
	unsigned int virq;

	/* Fall back to the default host when none was given */
	if (host == NULL) {
		host = irq_default_host;
		if (host == NULL)
			return NO_IRQ;
	}

	/* Legacy hosts are mapped 1:1, nothing to search */
	if (host->revmap_type == IRQ_HOST_MAP_LEGACY)
		return hwirq;

	/* Never start inside the legacy range */
	if (start < NUM_ISA_INTERRUPTS)
		start = NUM_ISA_INTERRUPTS;

	/* One full lap over the allocatable entries, wrapping at the end */
	virq = start;
	do {
		const struct irq_map_entry *entry = &irq_map[virq];

		if (entry->host == host && entry->hwirq == hwirq)
			return virq;

		virq++;
		if (virq >= irq_virq_count)
			virq = NUM_ISA_INTERRUPTS;
	} while (virq != start);

	return NO_IRQ;
}
EXPORT_SYMBOL_GPL(irq_find_mapping);
L
Linus Torvalds 已提交
891

892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926
#ifdef CONFIG_SMP
/*
 * Pick the cpu an interrupt with affinity @mask should be routed to.
 *
 * A mask other than "all cpus" selects its first online cpu.  When the
 * mask is "all cpus", or contains no online cpu, the target is chosen
 * round-robin over the online cpus using a rover protected by its own
 * spinlock.
 *
 * Returns the hard (physical) id of the chosen cpu.
 */
int irq_choose_cpu(const struct cpumask *mask)
{
	static int irq_rover;
	static DEFINE_RAW_SPINLOCK(irq_rover_lock);
	unsigned long flags;
	int cpuid;

	if (!cpumask_equal(mask, cpu_all_mask)) {
		cpuid = cpumask_first_and(mask, cpu_online_mask);
		if (cpuid < nr_cpu_ids)
			return get_hard_smp_processor_id(cpuid);
		/* no online cpu in the mask: fall back to round-robin */
	}

	/* Round-robin distribution... */
	raw_spin_lock_irqsave(&irq_rover_lock, flags);

	irq_rover = cpumask_next(irq_rover, cpu_online_mask);
	if (irq_rover >= nr_cpu_ids)
		irq_rover = cpumask_first(cpu_online_mask);

	cpuid = irq_rover;

	raw_spin_unlock_irqrestore(&irq_rover_lock, flags);

	return get_hard_smp_processor_id(cpuid);
}
#else
/* Uniprocessor build: the only candidate is the cpu we are running on. */
int irq_choose_cpu(const struct cpumask *mask)
{
	return hard_smp_processor_id();
}
#endif
927

928 929
/*
 * Reverse-map @hwirq to a virq through the host's radix tree.
 *
 * Hosts that are not of type IRQ_HOST_MAP_TREE trigger a one-time
 * warning and use the slow linear search instead, as does a miss in
 * the tree.
 *
 * Returns the virq, or whatever irq_find_mapping() returns on fallback.
 */
unsigned int irq_radix_revmap_lookup(struct irq_host *host,
				     irq_hw_number_t hwirq)
{
	struct irq_map_entry *ptr;
	unsigned int virq;

	if (WARN_ON_ONCE(host->revmap_type != IRQ_HOST_MAP_TREE))
		return irq_find_mapping(host, hwirq);

	/*
	 * The ptr returned references the static global irq_map.
	 * but freeing an irq can delete nodes along the path to
	 * do the lookup via call_rcu.
	 */
	rcu_read_lock();
	ptr = radix_tree_lookup(&host->revmap_data.tree, hwirq);
	rcu_read_unlock();

	/*
	 * If found in radix tree, then fine.
	 * Else fallback to linear lookup - this should not happen in practice
	 * as it means that we failed to insert the node in the radix tree.
	 */
	if (ptr)
		virq = ptr - irq_map;	/* index of the entry is the virq */
	else
		virq = irq_find_mapping(host, hwirq);

	return virq;
}

/*
 * Record the @hwirq -> @virq association in the host's radix tree.
 *
 * Warns and does nothing for hosts that are not IRQ_HOST_MAP_TREE; a
 * @virq of NO_IRQ is silently ignored.  The tree stores a pointer to
 * the irq_map entry of @virq and is modified under revmap_trees_mutex.
 */
void irq_radix_revmap_insert(struct irq_host *host, unsigned int virq,
			     irq_hw_number_t hwirq)
{
	if (WARN_ON(host->revmap_type != IRQ_HOST_MAP_TREE))
		return;

	if (virq != NO_IRQ) {
		mutex_lock(&revmap_trees_mutex);
		radix_tree_insert(&host->revmap_data.tree, hwirq,
				  &irq_map[virq]);
		mutex_unlock(&revmap_trees_mutex);
	}
}

973 974
/*
 * Reverse-map @hwirq to a virq through the host's linear table.
 *
 * Falls back to the slow irq_find_mapping() search when the host is not
 * of type IRQ_HOST_MAP_LINEAR (with a one-time warning), when @hwirq is
 * outside the table, or when the table is not set up yet.  A table slot
 * still holding NO_IRQ is filled from the slow path before returning.
 */
unsigned int irq_linear_revmap(struct irq_host *host,
			       irq_hw_number_t hwirq)
{
	unsigned int *revmap;

	if (WARN_ON_ONCE(host->revmap_type != IRQ_HOST_MAP_LINEAR))
		return irq_find_mapping(host, hwirq);

	/* Check revmap bounds */
	if (unlikely(hwirq >= host->revmap_data.linear.size))
		return irq_find_mapping(host, hwirq);

	/* Check if revmap was allocated */
	revmap = host->revmap_data.linear.revmap;
	if (unlikely(revmap == NULL))
		return irq_find_mapping(host, hwirq);

	/* Fill up revmap with slow path if no mapping found */
	if (unlikely(revmap[hwirq] == NO_IRQ))
		revmap[hwirq] = irq_find_mapping(host, hwirq);

	return revmap[hwirq];
}

997 998 999 1000 1001 1002
unsigned int irq_alloc_virt(struct irq_host *host,
			    unsigned int count,
			    unsigned int hint)
{
	unsigned long flags;
	unsigned int i, j, found = NO_IRQ;
1003

1004 1005 1006
	if (count == 0 || count > (irq_virq_count - NUM_ISA_INTERRUPTS))
		return NO_IRQ;

1007
	raw_spin_lock_irqsave(&irq_big_lock, flags);
1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018

	/* Use hint for 1 interrupt if any */
	if (count == 1 && hint >= NUM_ISA_INTERRUPTS &&
	    hint < irq_virq_count && irq_map[hint].host == NULL) {
		found = hint;
		goto hint_found;
	}

	/* Look for count consecutive numbers in the allocatable
	 * (non-legacy) space
	 */
1019 1020 1021 1022 1023 1024 1025 1026 1027 1028
	for (i = NUM_ISA_INTERRUPTS, j = 0; i < irq_virq_count; i++) {
		if (irq_map[i].host != NULL)
			j = 0;
		else
			j++;

		if (j == count) {
			found = i - count + 1;
			break;
		}
1029 1030
	}
	if (found == NO_IRQ) {
1031
		raw_spin_unlock_irqrestore(&irq_big_lock, flags);
1032 1033 1034 1035 1036 1037 1038 1039
		return NO_IRQ;
	}
 hint_found:
	for (i = found; i < (found + count); i++) {
		irq_map[i].hwirq = host->inval_irq;
		smp_wmb();
		irq_map[i].host = host;
	}
1040
	raw_spin_unlock_irqrestore(&irq_big_lock, flags);
1041 1042 1043 1044
	return found;
}

void irq_free_virt(unsigned int virq, unsigned int count)
L
Linus Torvalds 已提交
1045 1046
{
	unsigned long flags;
1047
	unsigned int i;
L
Linus Torvalds 已提交
1048

1049 1050
	WARN_ON (virq < NUM_ISA_INTERRUPTS);
	WARN_ON (count == 0 || (virq + count) > irq_virq_count);
L
Linus Torvalds 已提交
1051

1052 1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064
	if (virq < NUM_ISA_INTERRUPTS) {
		if (virq + count < NUM_ISA_INTERRUPTS)
			return;
		count  =- NUM_ISA_INTERRUPTS - virq;
		virq = NUM_ISA_INTERRUPTS;
	}

	if (count > irq_virq_count || virq > irq_virq_count - count) {
		if (virq > irq_virq_count)
			return;
		count = irq_virq_count - virq;
	}

1065
	raw_spin_lock_irqsave(&irq_big_lock, flags);
1066 1067
	for (i = virq; i < (virq + count); i++) {
		struct irq_host *host;
L
Linus Torvalds 已提交
1068

1069 1070 1071 1072 1073
		host = irq_map[i].host;
		irq_map[i].hwirq = host->inval_irq;
		smp_wmb();
		irq_map[i].host = NULL;
	}
1074
	raw_spin_unlock_irqrestore(&irq_big_lock, flags);
L
Linus Torvalds 已提交
1075
}
1076

1077
/* Early irq init hook: nothing to do here, always returns 0. */
int arch_early_irq_init(void)
{
	return 0;
}

1082 1083 1084 1085
#ifdef CONFIG_VIRQ_DEBUG
static int virq_debug_show(struct seq_file *m, void *private)
{
	unsigned long flags;
1086
	struct irq_desc *desc;
1087
	const char *p;
1088
	static const char none[] = "none";
1089
	void *data;
1090 1091
	int i;

1092 1093
	seq_printf(m, "%-5s  %-7s  %-15s  %-18s  %s\n", "virq", "hwirq",
		      "chip name", "chip data", "host name");
1094

1095
	for (i = 1; i < nr_irqs; i++) {
M
Michael Ellerman 已提交
1096
		desc = irq_to_desc(i);
1097 1098 1099
		if (!desc)
			continue;

1100
		raw_spin_lock_irqsave(&desc->lock, flags);
1101 1102

		if (desc->action && desc->action->handler) {
1103 1104
			struct irq_chip *chip;

1105
			seq_printf(m, "%5d  ", i);
1106
			seq_printf(m, "0x%05lx  ", irq_map[i].hwirq);
1107

1108
			chip = irq_desc_get_chip(desc);
1109 1110
			if (chip && chip->name)
				p = chip->name;
1111 1112 1113 1114
			else
				p = none;
			seq_printf(m, "%-15s  ", p);

1115 1116 1117
			data = irq_desc_get_chip_data(desc);
			seq_printf(m, "0x%16p  ", data);

1118 1119 1120 1121 1122 1123 1124
			if (irq_map[i].host && irq_map[i].host->of_node)
				p = irq_map[i].host->of_node->full_name;
			else
				p = none;
			seq_printf(m, "%s\n", p);
		}

1125
		raw_spin_unlock_irqrestore(&desc->lock, flags);
1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145
	}

	return 0;
}

/* open() for the virq debug file: bind virq_debug_show via single_open(). */
static int virq_debug_open(struct inode *inode, struct file *file)
{
	void *priv = inode->i_private;

	return single_open(file, virq_debug_show, priv);
}

/*
 * File operations of the virq debug file: opened through
 * virq_debug_open(), everything else is delegated to the seq_file
 * single_open helpers.
 */
static const struct file_operations virq_debug_fops = {
	.open = virq_debug_open,
	.read = seq_read,
	.llseek = seq_lseek,
	.release = single_release,
};

/*
 * Create the read-only "virq_mapping" file under powerpc_debugfs_root.
 *
 * Returns 0 on success, -ENOMEM if the file could not be created.
 */
static int __init irq_debugfs_init(void)
{
	if (debugfs_create_file("virq_mapping", S_IRUGO, powerpc_debugfs_root,
				 NULL, &virq_debug_fops) == NULL)
		return -ENOMEM;

	return 0;
}
__initcall(irq_debugfs_init);
#endif /* CONFIG_VIRQ_DEBUG */

1154
#ifdef CONFIG_PPC64
L
Linus Torvalds 已提交
1155 1156 1157 1158 1159 1160 1161
/*
 * Handler for the "noirqdistrib" boot option: clears distribute_irqs.
 * @str is not used.  Returns 1.
 */
static int __init setup_noirqdistrib(char *str)
{
	distribute_irqs = 0;
	return 1;
}

__setup("noirqdistrib", setup_noirqdistrib);
S
Stephen Rothwell 已提交
1162
#endif /* CONFIG_PPC64 */