mce-inject.c 6.0 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 * Machine check injection support.
 * Copyright 2008 Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; version 2
 * of the License.
 *
 * Authors:
 * Andi Kleen
 * Ying Huang
 */
14
#include <linux/uaccess.h>
15 16 17 18 19
#include <linux/module.h>
#include <linux/timer.h>
#include <linux/kernel.h>
#include <linux/string.h>
#include <linux/fs.h>
20
#include <linux/preempt.h>
21
#include <linux/smp.h>
22 23 24 25
#include <linux/notifier.h>
#include <linux/kdebug.h>
#include <linux/cpu.h>
#include <linux/sched.h>
26
#include <linux/gfp.h>
27
#include <asm/mce.h>
28
#include <asm/apic.h>
D
Don Zickus 已提交
29
#include <asm/nmi.h>
30 31 32 33

/* Update fake mce registers on current CPU. */
static void inject_mce(struct mce *m)
{
34
	struct mce *i = &per_cpu(injectm, m->extcpu);
35

L
Lucas De Marchi 已提交
36
	/* Make sure no one reads partially written injectm */
37 38 39 40
	i->finished = 0;
	mb();
	m->finished = 0;
	/* First set the fields after finished */
41
	i->extcpu = m->extcpu;
42 43 44 45 46 47 48 49
	mb();
	/* Now write record in order, finished last (except above) */
	memcpy(i, m, sizeof(struct mce));
	/* Finally activate it */
	mb();
	i->finished = 1;
}

50
static void raise_poll(struct mce *m)
51 52 53 54 55 56 57 58 59 60 61
{
	unsigned long flags;
	mce_banks_t b;

	memset(&b, 0xff, sizeof(mce_banks_t));
	local_irq_save(flags);
	machine_check_poll(0, &b);
	local_irq_restore(flags);
	m->finished = 0;
}

62
static void raise_exception(struct mce *m, struct pt_regs *pregs)
63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79
{
	struct pt_regs regs;
	unsigned long flags;

	if (!pregs) {
		memset(&regs, 0, sizeof(struct pt_regs));
		regs.ip = m->ip;
		regs.cs = m->cs;
		pregs = &regs;
	}
	/* in mcheck exeception handler, irq will be disabled */
	local_irq_save(flags);
	do_machine_check(pregs, 0);
	local_irq_restore(flags);
	m->finished = 0;
}

80
/*
 * CPUs that still have to act on a broadcast injection.  Filled in by
 * raise_mce(); each CPU clears its own bit in mce_raise_notify() or
 * mce_irq_ipi().  Allocated in inject_init().
 */
static cpumask_var_t mce_inject_cpumask;

/* Held by mce_write() around raise_mce(). */
static DEFINE_MUTEX(mce_inject_mutex);
82

83
static int mce_raise_notify(unsigned int cmd, struct pt_regs *regs)
84 85
{
	int cpu = smp_processor_id();
86
	struct mce *m = this_cpu_ptr(&injectm);
87 88
	if (!cpumask_test_cpu(cpu, mce_inject_cpumask))
		return NMI_DONE;
89
	cpumask_clear_cpu(cpu, mce_inject_cpumask);
90
	if (m->inject_flags & MCJ_EXCEPTION)
91
		raise_exception(m, regs);
92
	else if (m->status)
93
		raise_poll(m);
94
	return NMI_HANDLED;
95 96
}

97 98 99
static void mce_irq_ipi(void *info)
{
	int cpu = smp_processor_id();
100
	struct mce *m = this_cpu_ptr(&injectm);
101 102 103 104 105 106 107 108

	if (cpumask_test_cpu(cpu, mce_inject_cpumask) &&
			m->inject_flags & MCJ_EXCEPTION) {
		cpumask_clear_cpu(cpu, mce_inject_cpumask);
		raise_exception(m, NULL);
	}
}

109
/* Inject mce on current CPU */
110
static int raise_local(void)
111
{
112
	struct mce *m = this_cpu_ptr(&injectm);
113 114
	int context = MCJ_CTX(m->inject_flags);
	int ret = 0;
115
	int cpu = m->extcpu;
116

117
	if (m->inject_flags & MCJ_EXCEPTION) {
118
		pr_info("Triggering MCE exception on CPU %d\n", cpu);
119 120 121 122 123 124 125 126 127
		switch (context) {
		case MCJ_CTX_IRQ:
			/*
			 * Could do more to fake interrupts like
			 * calling irq_enter, but the necessary
			 * machinery isn't exported currently.
			 */
			/*FALL THROUGH*/
		case MCJ_CTX_PROCESS:
128
			raise_exception(m, NULL);
129 130
			break;
		default:
131
			pr_info("Invalid MCE context\n");
132 133
			ret = -EINVAL;
		}
134
		pr_info("MCE exception done on CPU %d\n", cpu);
135
	} else if (m->status) {
136
		pr_info("Starting machine check poll CPU %d\n", cpu);
137
		raise_poll(m);
138
		mce_notify_irq();
139
		pr_info("Machine check poll done on CPU %d\n", cpu);
140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155
	} else
		m->finished = 0;

	return ret;
}

/*
 * Store @m in the injectm slot of its target CPU and, unless its context
 * is MCJ_CTX_RANDOM, trigger the injection.
 *
 * With a local APIC and one of the broadcast flags set, every other
 * online CPU whose record is finished and has MCJ_CTX_RANDOM context is
 * kicked by IPI (MCJ_IRQ_BROADCAST) or NMI (MCJ_NMI_BROADCAST).  The
 * caller then waits up to two seconds for those CPUs to clear their bits
 * in mce_inject_cpumask before raising locally.  Without broadcast only
 * raise_local() is run, with preemption disabled.
 */
static void raise_mce(struct mce *m)
{
	int ctx = MCJ_CTX(m->inject_flags);

	inject_mce(m);

	/* Random-context records are only stored, never raised from here. */
	if (ctx == MCJ_CTX_RANDOM)
		return;

#ifdef CONFIG_X86_LOCAL_APIC
	if (m->inject_flags & (MCJ_IRQ_BROADCAST | MCJ_NMI_BROADCAST)) {
		unsigned long deadline;
		int self;
		int cpu;

		get_online_cpus();

		/* Start from all online CPUs except the one we run on. */
		cpumask_copy(mce_inject_cpumask, cpu_online_mask);
		self = get_cpu();
		cpumask_clear_cpu(self, mce_inject_cpumask);

		/* Keep only CPUs holding a finished random-context record. */
		for_each_online_cpu(cpu) {
			struct mce *rec = &per_cpu(injectm, cpu);

			if (rec->finished &&
			    MCJ_CTX(rec->inject_flags) == MCJ_CTX_RANDOM)
				continue;
			cpumask_clear_cpu(cpu, mce_inject_cpumask);
		}

		if (!cpumask_empty(mce_inject_cpumask)) {
			if (m->inject_flags & MCJ_IRQ_BROADCAST) {
				/*
				 * wait == 0: do not wait for mce_irq_ipi to
				 * complete, it has to run in sync with the
				 * raise_local() below.
				 */
				preempt_disable();
				smp_call_function_many(mce_inject_cpumask,
						       mce_irq_ipi, NULL, 0);
				preempt_enable();
			} else if (m->inject_flags & MCJ_NMI_BROADCAST) {
				apic->send_IPI_mask(mce_inject_cpumask,
						    NMI_VECTOR);
			}
		}

		/* Wait (at most 2 seconds) for the targets to pick it up. */
		deadline = jiffies + 2*HZ;
		while (!cpumask_empty(mce_inject_cpumask)) {
			if (!time_before(jiffies, deadline)) {
				pr_err("Timeout waiting for mce inject %lx\n",
					*cpumask_bits(mce_inject_cpumask));
				break;
			}
			cpu_relax();
		}

		raise_local();
		put_cpu();
		put_online_cpus();
		return;
	}
#endif

	preempt_disable();
	raise_local();
	preempt_enable();
}

/* Error injection interface */
/*
 * Error injection interface: write handler taking one struct mce from
 * user space and injecting it.
 *
 * @ubuf/@usize: user buffer holding (a prefix of) a struct mce.  At most
 *               sizeof(struct mce) bytes are consumed; fields not covered
 *               by a shorter write are zero.
 *
 * Returns the number of bytes consumed, or
 *   -EPERM  without CAP_SYS_ADMIN,
 *   -EIO    if the boot CPU lacks the MCE or MCA feature,
 *   -EFAULT if the user buffer cannot be read,
 *   -EINVAL if the target CPU is out of range or not online.
 */
static ssize_t mce_write(struct file *filp, const char __user *ubuf,
			 size_t usize, loff_t *off)
{
	struct mce m;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;
	/*
	 * There are some cases where real MSR reads could slip
	 * through.
	 */
	if (!boot_cpu_has(X86_FEATURE_MCE) || !boot_cpu_has(X86_FEATURE_MCA))
		return -EIO;

	if (usize > sizeof(m))
		usize = sizeof(m);

	/*
	 * Zero the record first: a write shorter than struct mce must not
	 * leave extcpu, inject_flags etc. filled with stack garbage.
	 */
	memset(&m, 0, sizeof(m));
	if (copy_from_user(&m, ubuf, usize))
		return -EFAULT;

	if (m.extcpu >= num_possible_cpus() || !cpu_online(m.extcpu))
		return -EINVAL;

	/*
	 * Need to give user space some time to set everything up,
	 * so do it a jiffie or two later everywhere.
	 *
	 * A bare schedule_timeout() in TASK_RUNNING state does not sleep
	 * at all, so use the variant that sets the task state itself.
	 */
	schedule_timeout_uninterruptible(2);

	mutex_lock(&mce_inject_mutex);
	raise_mce(&m);
	mutex_unlock(&mce_inject_mutex);
	return usize;
}

static int inject_init(void)
{
241 242
	if (!alloc_cpumask_var(&mce_inject_cpumask, GFP_KERNEL))
		return -ENOMEM;
243
	pr_info("Machine check injector initialized\n");
244
	register_mce_write_callback(mce_write);
245 246
	register_nmi_handler(NMI_LOCAL, mce_raise_notify, 0,
				"mce_notify");
247 248 249 250
	return 0;
}

module_init(inject_init);
251 252
/*
 * Cannot tolerate unloading currently because we cannot
 * guarantee all openers of mce_chrdev will get a reference to us.
 */
MODULE_LICENSE("GPL");