handle.c 13.3 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3
/*
 * linux/kernel/irq/handle.c
 *
 * Copyright (C) 1992, 1998-2006 Linus Torvalds, Ingo Molnar
 * Copyright (C) 2005-2006, Thomas Gleixner, Russell King
 *
 * This file contains the core interrupt handling code.
 *
 * Detailed information is available in Documentation/DocBook/genericirq
 *
 */

#include <linux/irq.h>
14
#include <linux/sched.h>
15
#include <linux/slab.h>
L
Linus Torvalds 已提交
16 17 18 19
#include <linux/module.h>
#include <linux/random.h>
#include <linux/interrupt.h>
#include <linux/kernel_stat.h>
20 21
#include <linux/rculist.h>
#include <linux/hash.h>
22
#include <linux/radix-tree.h>
23
#include <trace/events/irq.h>
L
Linus Torvalds 已提交
24 25 26

#include "internals.h"

27 28 29
/*
 * lockdep: we want to handle all irq_desc locks as a single lock-class:
 */
30
struct lock_class_key irq_desc_lock_class;
31

T
Thomas Gleixner 已提交
32 33
/**
 * handle_bad_irq - handle spurious and unhandled irqs
 * @irq:       the interrupt number
 * @desc:      description of the interrupt
 *
 * Used as the ->handle_irq entry of descriptors that have no real flow
 * handler installed. Prints the descriptor as a debug aid, accounts
 * the event through kstat_incr_irqs_this_cpu() and finally passes the
 * irq to ack_bad_irq().
 */
void handle_bad_irq(unsigned int irq, struct irq_desc *desc)
{
	/* Report first, so the dump precedes anything ack_bad_irq() prints. */
	print_irq_desc(irq, desc);

	kstat_incr_irqs_this_cpu(irq, desc);

	ack_bad_irq(irq);
}

46 47 48
/*
 * Set up irq_default_affinity at boot: allocate the mask and set every
 * bit in it. Only done for SMP kernels built with the generic hardirq
 * layer; in every other configuration this is an empty function.
 *
 * The result of alloc_cpumask_var() is not checked here.
 */
static void __init init_irq_default_affinity(void)
{
#if defined(CONFIG_SMP) && defined(CONFIG_GENERIC_HARDIRQS)
	alloc_cpumask_var(&irq_default_affinity, GFP_NOWAIT);
	cpumask_setall(irq_default_affinity);
#endif
}

L
Linus Torvalds 已提交
58 59 60 61
/*
 * Linux has a controller-independent interrupt architecture.
 * Every controller has a 'controller-template', that is used
 * by the main code to do the right thing. Each driver-visible
 * interrupt source is transparently wired to the appropriate
 * controller. Thus drivers need not be aware of the
 * interrupt-controller.
 *
 * The code is designed to be easily extended with new/different
 * interrupt controllers, without having to do assembly magic or
 * having to touch the generic code.
 *
 * Controller mappings for all interrupt sources:
 */
Y
Yinghai Lu 已提交
72
int nr_irqs = NR_IRQS;
I
Ingo Molnar 已提交
73
EXPORT_SYMBOL_GPL(nr_irqs);
Y
Yinghai Lu 已提交
74

75
#ifdef CONFIG_SPARSE_IRQ
76

77
static struct irq_desc irq_desc_init = {
T
Thomas Gleixner 已提交
78 79 80 81
	.status		= IRQ_DISABLED,
	.handle_irq	= handle_bad_irq,
	.depth		= 1,
	.lock		= __RAW_SPIN_LOCK_UNLOCKED(irq_desc_init.lock),
82 83
};

84
/*
 * init_kstat_irqs - allocate the interrupt counters of a descriptor
 * @desc:	descriptor that receives the new counter array
 * @node:	NUMA node to allocate on
 * @nr:		number of counters to allocate
 *
 * Allocates @nr zeroed counters with GFP_ATOMIC and installs them in
 * @desc->kstat_irqs. On allocation failure @desc->kstat_irqs is left
 * untouched, so callers have to check the pointer themselves.
 */
void __ref init_kstat_irqs(struct irq_desc *desc, int node, int nr)
{
	void *counters = kzalloc_node(nr * sizeof(*desc->kstat_irqs),
				      GFP_ATOMIC, node);

	/*
	 * Don't overwrite the pointer if we could not get a new array;
	 * init_copy_kstat_irqs() could still use the old one.
	 */
	if (!counters)
		return;

	printk(KERN_DEBUG "  alloc kstat_irqs on node %d\n", node);
	desc->kstat_irqs = counters;
}

101
static void init_one_irq_desc(int irq, struct irq_desc *desc, int node)
102 103
{
	memcpy(desc, &irq_desc_init, sizeof(struct irq_desc));
I
Ingo Molnar 已提交
104

105
	raw_spin_lock_init(&desc->lock);
T
Thomas Gleixner 已提交
106
	desc->irq_data.irq = irq;
107
#ifdef CONFIG_SMP
108
	desc->irq_data.node = node;
109 110
#endif
	lockdep_set_class(&desc->lock, &irq_desc_lock_class);
111
	init_kstat_irqs(desc, node, nr_cpu_ids);
112 113 114 115
	if (!desc->kstat_irqs) {
		printk(KERN_ERR "can not alloc kstat_irqs\n");
		BUG_ON(1);
	}
116
	if (!alloc_desc_masks(desc, node, false)) {
117 118 119
		printk(KERN_ERR "can not alloc irq_desc cpumasks\n");
		BUG_ON(1);
	}
120
	init_desc_masks(desc);
121
	arch_init_chip_data(desc, node);
122 123 124 125 126
}

/*
 * Protect the sparse_irqs:
 */
127
DEFINE_RAW_SPINLOCK(sparse_irq_lock);
128

129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148
/*
 * Radix tree indexed by irq number that holds the irq_desc pointers.
 * Filled by set_irq_desc(), queried by irq_to_desc() and patched by
 * replace_irq_desc(). Declared with GFP_ATOMIC as its allocation mask.
 */
static RADIX_TREE(irq_desc_tree, GFP_ATOMIC);

/*
 * set_irq_desc - publish a descriptor in the irq -> irq_desc radix tree
 * @irq:	interrupt number used as the tree index
 * @desc:	descriptor to store
 *
 * radix_tree_insert() reports failure through its return value. A
 * failed insert leaves @irq without a reachable descriptor, so do not
 * drop the error silently: emit a warning that names the irq and the
 * error code.
 */
static void set_irq_desc(unsigned int irq, struct irq_desc *desc)
{
	int err = radix_tree_insert(&irq_desc_tree, irq, desc);

	WARN(err, "irq_desc: radix tree insert for irq %u failed (%d)\n",
	     irq, err);
}

/*
 * irq_to_desc - look up the descriptor of an interrupt (sparse irq variant)
 * @irq:	interrupt number
 *
 * Returns whatever radix_tree_lookup() finds for @irq in irq_desc_tree.
 */
struct irq_desc *irq_to_desc(unsigned int irq)
{
	struct irq_desc *found = radix_tree_lookup(&irq_desc_tree, irq);

	return found;
}

/*
 * replace_irq_desc - swap the descriptor stored for an interrupt
 * @irq:	interrupt number
 * @desc:	descriptor to store in place of the current one
 *
 * Does nothing when the tree has no slot for @irq.
 */
void replace_irq_desc(unsigned int irq, struct irq_desc *desc)
{
	void **slot = radix_tree_lookup_slot(&irq_desc_tree, irq);

	if (!slot)
		return;

	radix_tree_replace_slot(slot, desc);
}
149

Y
Yinghai Lu 已提交
150 151
/*
 * Statically allocated descriptors for the first NR_IRQS_LEGACY
 * interrupts. early_irq_init() completes their setup and enters them
 * into the radix tree. Every entry starts out disabled (depth 1) and
 * routed to handle_bad_irq().
 */
static struct irq_desc irq_desc_legacy[NR_IRQS_LEGACY] __cacheline_aligned_in_smp = {
	[0 ... NR_IRQS_LEGACY-1] = {
		.handle_irq	= handle_bad_irq,
		.status		= IRQ_DISABLED,
		.depth		= 1,
		.lock		= __RAW_SPIN_LOCK_UNLOCKED(irq_desc_init.lock),
	}
};

159
/*
 * Counter storage for the legacy descriptors. early_irq_init() allocates
 * NR_IRQS_LEGACY * nr_cpu_ids entries and hands each descriptor its own
 * nr_cpu_ids-sized slice.
 */
static unsigned int *kstat_irqs_legacy;
160

161
/*
 * early_irq_init - boot-time setup of the legacy descriptors (sparse irq)
 *
 * Initializes the default affinity mask, lets the architecture probe
 * nr_irqs, allocates the counters shared by the legacy descriptors and
 * then finishes every entry of irq_desc_legacy[] and enters it into the
 * radix tree.
 *
 * The counter allocation is checked: every legacy descriptor gets a
 * pointer derived from it, so continuing with a NULL base would hand
 * out bogus kstat_irqs pointers. Failure is treated the same way
 * init_one_irq_desc() treats it (error message + BUG).
 *
 * Returns the result of arch_early_irq_init().
 */
int __init early_irq_init(void)
{
	struct irq_desc *desc;
	int legacy_count;
	int node;
	int i;

	init_irq_default_affinity();

	/* initialize nr_irqs based on nr_cpu_ids */
	arch_probe_nr_irqs();
	printk(KERN_INFO "NR_IRQS:%d nr_irqs:%d\n", NR_IRQS, nr_irqs);

	desc = irq_desc_legacy;
	legacy_count = ARRAY_SIZE(irq_desc_legacy);
	node = first_online_node;

	/* allocate based on nr_cpu_ids */
	kstat_irqs_legacy = kzalloc_node(NR_IRQS_LEGACY * nr_cpu_ids *
					  sizeof(int), GFP_NOWAIT, node);
	if (!kstat_irqs_legacy) {
		printk(KERN_ERR "can not alloc kstat_irqs\n");
		BUG_ON(1);
	}

	/* Descriptors allocated later inherit the chip from the template. */
	irq_desc_init.irq_data.chip = &no_irq_chip;

	for (i = 0; i < legacy_count; i++) {
		desc[i].irq_data.irq = i;
		desc[i].irq_data.chip = &no_irq_chip;
#ifdef CONFIG_SMP
		desc[i].irq_data.node = node;
#endif
		/* Each descriptor owns nr_cpu_ids consecutive counters. */
		desc[i].kstat_irqs = kstat_irqs_legacy + i * nr_cpu_ids;
		lockdep_set_class(&desc[i].lock, &irq_desc_lock_class);
		alloc_desc_masks(&desc[i], node, true);
		init_desc_masks(&desc[i]);
		set_irq_desc(i, &desc[i]);
	}

	return arch_early_irq_init();
}

200
/*
 * irq_to_desc_alloc_node - get the descriptor of an irq, creating it if needed
 * @irq:	interrupt number
 * @node:	NUMA node to allocate a new descriptor on
 *
 * Returns the existing descriptor when there is one. Otherwise a new
 * descriptor is allocated, initialized and entered into the tree while
 * holding sparse_irq_lock. Returns NULL (with a warning) when @irq is
 * not below nr_irqs; an allocation failure is fatal (BUG).
 */
struct irq_desc * __ref irq_to_desc_alloc_node(unsigned int irq, int node)
{
	struct irq_desc *desc;
	unsigned long irqflags;

	if (irq >= nr_irqs) {
		WARN(1, "irq (%d) >= nr_irqs (%d) in irq_to_desc_alloc\n",
			irq, nr_irqs);
		return NULL;
	}

	/* Common case: the descriptor already exists, no lock needed. */
	desc = irq_to_desc(irq);
	if (desc)
		return desc;

	raw_spin_lock_irqsave(&sparse_irq_lock, irqflags);

	/* Look again under the lock: another CPU may have created it meanwhile. */
	desc = irq_to_desc(irq);
	if (!desc) {
		desc = kzalloc_node(sizeof(*desc), GFP_ATOMIC, node);

		printk(KERN_DEBUG "  alloc irq_desc for %d on node %d\n", irq, node);
		if (!desc) {
			printk(KERN_ERR "can not alloc irq_desc\n");
			BUG_ON(1);
		}
		init_one_irq_desc(irq, desc, node);

		set_irq_desc(irq, desc);
	}

	raw_spin_unlock_irqrestore(&sparse_irq_lock, irqflags);

	return desc;
}

239
#else /* !CONFIG_SPARSE_IRQ */
240

241
/*
 * Flat descriptor table used when CONFIG_SPARSE_IRQ is off: one
 * statically allocated irq_desc per interrupt number. Every entry
 * starts out disabled (depth 1) and routed to handle_bad_irq().
 */
struct irq_desc irq_desc[NR_IRQS] __cacheline_aligned_in_smp = {
	[0 ... NR_IRQS-1] = {
		.handle_irq	= handle_bad_irq,
		.status		= IRQ_DISABLED,
		.depth		= 1,
		.lock		= __RAW_SPIN_LOCK_UNLOCKED(irq_desc->lock),
	}
};
249

250
/*
 * Static counter table for the non-sparse case, one row of NR_CPUS
 * counters per interrupt. early_irq_init() points desc[i].kstat_irqs
 * at row i.
 */
static unsigned int kstat_irqs_all[NR_IRQS][NR_CPUS];
Y
Yinghai Lu 已提交
251 252 253 254 255 256
/*
 * early_irq_init - boot-time setup of the static descriptor table
 *
 * Initializes the default affinity mask and then walks irq_desc[],
 * giving every entry its irq number, the no_irq_chip, its cpumasks and
 * its row of kstat_irqs_all[].
 *
 * Returns the result of arch_early_irq_init().
 */
int __init early_irq_init(void)
{
	struct irq_desc *desc = irq_desc;
	int count = ARRAY_SIZE(irq_desc);
	int i;

	init_irq_default_affinity();

	printk(KERN_INFO "NR_IRQS:%d\n", NR_IRQS);

	/* desc advances in step with i, so desc == &irq_desc[i] in the body. */
	for (i = 0; i < count; i++, desc++) {
		desc->irq_data.irq = i;
		desc->irq_data.chip = &no_irq_chip;
		alloc_desc_masks(desc, 0, true);
		init_desc_masks(desc);
		desc->kstat_irqs = kstat_irqs_all[i];
	}

	return arch_early_irq_init();
}

274 275 276 277 278
/*
 * irq_to_desc - look up the descriptor of an interrupt (flat table variant)
 * @irq:	interrupt number
 *
 * Returns the matching entry of irq_desc[], or NULL when @irq is not
 * below NR_IRQS.
 */
struct irq_desc *irq_to_desc(unsigned int irq)
{
	if (irq >= NR_IRQS)
		return NULL;

	return irq_desc + irq;
}

279
/*
 * irq_to_desc_alloc_node - flat table variant, nothing to allocate
 * @irq:	interrupt number
 * @node:	not used in this variant
 *
 * All descriptors are static here, so this is a plain lookup.
 */
struct irq_desc *irq_to_desc_alloc_node(unsigned int irq, int node)
{
	struct irq_desc *desc = irq_to_desc(irq);

	return desc;
}
#endif /* !CONFIG_SPARSE_IRQ */
284

Y
Yinghai Lu 已提交
285 286 287 288 289
void clear_kstat_irqs(struct irq_desc *desc)
{
	memset(desc->kstat_irqs, 0, nr_cpu_ids * sizeof(*(desc->kstat_irqs)));
}

L
Linus Torvalds 已提交
290
/*
291 292
 * What should we do if we get a hw irq event on an illegal vector?
 * Each architecture has to answer this themself.
L
Linus Torvalds 已提交
293
 */
294 295 296 297 298 299 300 301 302
static void ack_bad(struct irq_data *data)
{
	struct irq_desc *desc = irq_data_to_desc(data);

	print_irq_desc(data->irq, desc);
	ack_bad_irq(data->irq);
}

/*
 * Same as ack_bad(), for the irq-number based ->ack() callback:
 * print the descriptor found for @irq, then call ack_bad_irq().
 */
static void compat_ack_bad(unsigned int irq)
{
	print_irq_desc(irq, irq_to_desc(irq));
	ack_bad_irq(irq);
}

310 311 312
/*
 * NOP functions
 *
 * Do-nothing callbacks for the irq_chip definitions in this file. The
 * plain variants take a struct irq_data pointer, the compat_ variants
 * take the irq number. The *_ret variants return 0.
 */
static void noop(struct irq_data *data)
{
}

static unsigned int noop_ret(struct irq_data *data)
{
	return 0U;
}

static void compat_noop(unsigned int irq)
{
}

static unsigned int compat_noop_ret(unsigned int irq)
{
	return 0U;
}

/*
 * Generic no controller implementation
 */
330 331
struct irq_chip no_irq_chip = {
	.name		= "none",
332 333 334 335 336 337 338 339 340 341 342
	.irq_startup	= noop_ret,
	.irq_shutdown	= noop,
	.irq_enable	= noop,
	.irq_disable	= noop,
	.irq_ack	= ack_bad,
	.startup	= compat_noop_ret,
	.shutdown	= compat_noop,
	.enable		= compat_noop,
	.disable	= compat_noop,
	.ack		= compat_ack_bad,
	.end		= compat_noop,
L
Linus Torvalds 已提交
343 344
};

345 346 347 348 349 350
/*
 * Generic dummy implementation which can be used for
 * real dumb interrupt sources
 */
struct irq_chip dummy_irq_chip = {
	.name		= "dummy",
351 352 353 354 355 356 357 358 359 360 361 362 363 364 365
	.irq_startup	= noop_ret,
	.irq_shutdown	= noop,
	.irq_enable	= noop,
	.irq_disable	= noop,
	.irq_ack	= noop,
	.irq_mask	= noop,
	.irq_unmask	= noop,
	.startup	= compat_noop_ret,
	.shutdown	= compat_noop,
	.enable		= compat_noop,
	.disable	= compat_noop,
	.ack		= compat_noop,
	.mask		= compat_noop,
	.unmask		= compat_noop,
	.end		= compat_noop,
366 367
};

L
Linus Torvalds 已提交
368 369 370
/*
 * Special, empty irq handler:
 */
371
irqreturn_t no_action(int cpl, void *dev_id)
L
Linus Torvalds 已提交
372 373 374 375
{
	return IRQ_NONE;
}

376 377 378 379 380 381 382 383 384
/*
 * warn_no_thread - complain once about a handler without thread function
 * @irq:	the interrupt number
 * @action:	the action whose handler returned IRQ_WAKE_THREAD
 *
 * The IRQTF_WARNED bit in @action->thread_flags makes sure the message
 * is printed only once per action.
 */
static void warn_no_thread(unsigned int irq, struct irqaction *action)
{
	if (test_and_set_bit(IRQTF_WARNED, &action->thread_flags))
		return;

	/*
	 * The message is terminated with a newline so the log line is
	 * complete on its own.
	 */
	printk(KERN_WARNING "IRQ %d device %s returned IRQ_WAKE_THREAD "
	       "but no thread function available.\n", irq, action->name);
}

385 386 387 388 389 390
/**
 * handle_IRQ_event - irq action chain handler
 * @irq:	the interrupt number
 * @action:	the interrupt action chain for this irq
 *
 * Handles the action chain of an irq event
L
Linus Torvalds 已提交
391
 */
392
irqreturn_t handle_IRQ_event(unsigned int irq, struct irqaction *action)
L
Linus Torvalds 已提交
393
{
394 395
	irqreturn_t ret, retval = IRQ_NONE;
	unsigned int status = 0;
L
Linus Torvalds 已提交
396 397

	do {
398
		trace_irq_handler_entry(irq, action);
399
		ret = action->handler(irq, action->dev_id);
400
		trace_irq_handler_exit(irq, action, ret);
401 402 403

		switch (ret) {
		case IRQ_WAKE_THREAD:
404 405 406 407 408 409 410 411 412 413 414 415 416 417 418
			/*
			 * Set result to handled so the spurious check
			 * does not trigger.
			 */
			ret = IRQ_HANDLED;

			/*
			 * Catch drivers which return WAKE_THREAD but
			 * did not set up a thread function
			 */
			if (unlikely(!action->thread_fn)) {
				warn_no_thread(irq, action);
				break;
			}

419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434
			/*
			 * Wake up the handler thread for this
			 * action. In case the thread crashed and was
			 * killed we just pretend that we handled the
			 * interrupt. The hardirq handler above has
			 * disabled the device interrupt, so no irq
			 * storm is lurking.
			 */
			if (likely(!test_bit(IRQTF_DIED,
					     &action->thread_flags))) {
				set_bit(IRQTF_RUNTHREAD, &action->thread_flags);
				wake_up_process(action->thread);
			}

			/* Fall through to add to randomness */
		case IRQ_HANDLED:
L
Linus Torvalds 已提交
435
			status |= action->flags;
436 437 438 439 440 441
			break;

		default:
			break;
		}

L
Linus Torvalds 已提交
442 443 444 445
		retval |= ret;
		action = action->next;
	} while (action);

446
	if (status & IRQF_SAMPLE_RANDOM)
L
Linus Torvalds 已提交
447 448 449 450 451 452
		add_interrupt_randomness(irq);
	local_irq_disable();

	return retval;
}

453
#ifndef CONFIG_GENERIC_HARDIRQS_NO__DO_IRQ
T
Thomas Gleixner 已提交
454 455 456 457 458

#ifdef CONFIG_ENABLE_WARN_DEPRECATED
# warning __do_IRQ is deprecated. Please convert to proper flow handlers
#endif

459 460 461 462 463
/**
 * __do_IRQ - original all in one highlevel IRQ handler
 * @irq:	the interrupt number
 *
 * __do_IRQ handles all normal device IRQ's (the special
L
Linus Torvalds 已提交
464 465
 * SMP cross-CPU interrupts have their own specific
 * handlers).
466 467 468
 *
 * This is the original x86 implementation which is used for every
 * interrupt type.
L
Linus Torvalds 已提交
469
 */
470
unsigned int __do_IRQ(unsigned int irq)
L
Linus Torvalds 已提交
471
{
472
	struct irq_desc *desc = irq_to_desc(irq);
473
	struct irqaction *action;
L
Linus Torvalds 已提交
474 475
	unsigned int status;

T
Thomas Gleixner 已提交
476 477
	kstat_incr_irqs_this_cpu(irq, desc);

478
	if (CHECK_IRQ_PER_CPU(desc->status)) {
L
Linus Torvalds 已提交
479 480 481 482 483
		irqreturn_t action_ret;

		/*
		 * No locking required for CPU-local interrupts:
		 */
484 485
		if (desc->irq_data.chip->ack)
			desc->irq_data.chip->ack(irq);
486 487 488 489 490
		if (likely(!(desc->status & IRQ_DISABLED))) {
			action_ret = handle_IRQ_event(irq, desc->action);
			if (!noirqdebug)
				note_interrupt(irq, desc, action_ret);
		}
491
		desc->irq_data.chip->end(irq);
L
Linus Torvalds 已提交
492 493 494
		return 1;
	}

495
	raw_spin_lock(&desc->lock);
496 497
	if (desc->irq_data.chip->ack)
		desc->irq_data.chip->ack(irq);
L
Linus Torvalds 已提交
498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538
	/*
	 * REPLAY is when Linux resends an IRQ that was dropped earlier
	 * WAITING is used by probe to mark irqs that are being tested
	 */
	status = desc->status & ~(IRQ_REPLAY | IRQ_WAITING);
	status |= IRQ_PENDING; /* we _want_ to handle it */

	/*
	 * If the IRQ is disabled for whatever reason, we cannot
	 * use the action we have.
	 */
	action = NULL;
	if (likely(!(status & (IRQ_DISABLED | IRQ_INPROGRESS)))) {
		action = desc->action;
		status &= ~IRQ_PENDING; /* we commit to handling */
		status |= IRQ_INPROGRESS; /* we are handling it */
	}
	desc->status = status;

	/*
	 * If there is no IRQ handler or it was disabled, exit early.
	 * Since we set PENDING, if another processor is handling
	 * a different instance of this same irq, the other processor
	 * will take care of it.
	 */
	if (unlikely(!action))
		goto out;

	/*
	 * Edge triggered interrupts need to remember
	 * pending events.
	 * This applies to any hw interrupts that allow a second
	 * instance of the same irq to arrive while we are in do_IRQ
	 * or in the handler. But the code here only handles the _second_
	 * instance of the irq, not the third or fourth. So it is mostly
	 * useful for irq hardware that does not mask cleanly in an
	 * SMP environment.
	 */
	for (;;) {
		irqreturn_t action_ret;

539
		raw_spin_unlock(&desc->lock);
L
Linus Torvalds 已提交
540

541
		action_ret = handle_IRQ_event(irq, action);
L
Linus Torvalds 已提交
542
		if (!noirqdebug)
543
			note_interrupt(irq, desc, action_ret);
544

545
		raw_spin_lock(&desc->lock);
L
Linus Torvalds 已提交
546 547 548 549 550 551 552 553 554 555 556
		if (likely(!(desc->status & IRQ_PENDING)))
			break;
		desc->status &= ~IRQ_PENDING;
	}
	desc->status &= ~IRQ_INPROGRESS;

out:
	/*
	 * The ->end() handler has to deal with interrupts which got
	 * disabled while the handler was running.
	 */
557
	desc->irq_data.chip->end(irq);
558
	raw_spin_unlock(&desc->lock);
L
Linus Torvalds 已提交
559 560 561

	return 1;
}
562
#endif
L
Linus Torvalds 已提交
563

I
Ingo Molnar 已提交
564 565
void early_init_irq_lock_class(void)
{
566
	struct irq_desc *desc;
I
Ingo Molnar 已提交
567 568
	int i;

569
	for_each_irq_desc(i, desc) {
570
		lockdep_set_class(&desc->lock, &irq_desc_lock_class);
571 572 573 574 575 576
	}
}

unsigned int kstat_irqs_cpu(unsigned int irq, int cpu)
{
	struct irq_desc *desc = irq_to_desc(irq);
577
	return desc ? desc->kstat_irqs[cpu] : 0;
I
Ingo Molnar 已提交
578
}
579 580
EXPORT_SYMBOL(kstat_irqs_cpu);