1
2
3
4
5
6
7
8
9
10
11
12
13
14#include <linux/uaccess.h>
15#include <linux/module.h>
16#include <linux/timer.h>
17#include <linux/kernel.h>
18#include <linux/string.h>
19#include <linux/fs.h>
20#include <linux/preempt.h>
21#include <linux/smp.h>
22#include <linux/notifier.h>
23#include <linux/kdebug.h>
24#include <linux/cpu.h>
25#include <linux/sched.h>
26#include <linux/gfp.h>
27#include <asm/mce.h>
28#include <asm/apic.h>
29#include <asm/nmi.h>
30
31
32static void inject_mce(struct mce *m)
33{
34 struct mce *i = &per_cpu(injectm, m->extcpu);
35
36
37 i->finished = 0;
38 mb();
39 m->finished = 0;
40
41 i->extcpu = m->extcpu;
42 mb();
43
44 memcpy(i, m, sizeof(struct mce));
45
46 mb();
47 i->finished = 1;
48}
49
50static void raise_poll(struct mce *m)
51{
52 unsigned long flags;
53 mce_banks_t b;
54
55 memset(&b, 0xff, sizeof(mce_banks_t));
56 local_irq_save(flags);
57 machine_check_poll(0, &b);
58 local_irq_restore(flags);
59 m->finished = 0;
60}
61
62static void raise_exception(struct mce *m, struct pt_regs *pregs)
63{
64 struct pt_regs regs;
65 unsigned long flags;
66
67 if (!pregs) {
68 memset(®s, 0, sizeof(struct pt_regs));
69 regs.ip = m->ip;
70 regs.cs = m->cs;
71 pregs = ®s;
72 }
73
74 local_irq_save(flags);
75 do_machine_check(pregs, 0);
76 local_irq_restore(flags);
77 m->finished = 0;
78}
79
80static cpumask_var_t mce_inject_cpumask;
81static DEFINE_MUTEX(mce_inject_mutex);
82
83static int mce_raise_notify(unsigned int cmd, struct pt_regs *regs)
84{
85 int cpu = smp_processor_id();
86 struct mce *m = this_cpu_ptr(&injectm);
87 if (!cpumask_test_cpu(cpu, mce_inject_cpumask))
88 return NMI_DONE;
89 cpumask_clear_cpu(cpu, mce_inject_cpumask);
90 if (m->inject_flags & MCJ_EXCEPTION)
91 raise_exception(m, regs);
92 else if (m->status)
93 raise_poll(m);
94 return NMI_HANDLED;
95}
96
97static void mce_irq_ipi(void *info)
98{
99 int cpu = smp_processor_id();
100 struct mce *m = this_cpu_ptr(&injectm);
101
102 if (cpumask_test_cpu(cpu, mce_inject_cpumask) &&
103 m->inject_flags & MCJ_EXCEPTION) {
104 cpumask_clear_cpu(cpu, mce_inject_cpumask);
105 raise_exception(m, NULL);
106 }
107}
108
109
110static int raise_local(void)
111{
112 struct mce *m = this_cpu_ptr(&injectm);
113 int context = MCJ_CTX(m->inject_flags);
114 int ret = 0;
115 int cpu = m->extcpu;
116
117 if (m->inject_flags & MCJ_EXCEPTION) {
118 pr_info("Triggering MCE exception on CPU %d\n", cpu);
119 switch (context) {
120 case MCJ_CTX_IRQ:
121
122
123
124
125
126
127 case MCJ_CTX_PROCESS:
128 raise_exception(m, NULL);
129 break;
130 default:
131 pr_info("Invalid MCE context\n");
132 ret = -EINVAL;
133 }
134 pr_info("MCE exception done on CPU %d\n", cpu);
135 } else if (m->status) {
136 pr_info("Starting machine check poll CPU %d\n", cpu);
137 raise_poll(m);
138 mce_notify_irq();
139 pr_info("Machine check poll done on CPU %d\n", cpu);
140 } else
141 m->finished = 0;
142
143 return ret;
144}
145
146static void raise_mce(struct mce *m)
147{
148 int context = MCJ_CTX(m->inject_flags);
149
150 inject_mce(m);
151
152 if (context == MCJ_CTX_RANDOM)
153 return;
154
155 if (m->inject_flags & (MCJ_IRQ_BROADCAST | MCJ_NMI_BROADCAST)) {
156 unsigned long start;
157 int cpu;
158
159 get_online_cpus();
160 cpumask_copy(mce_inject_cpumask, cpu_online_mask);
161 cpumask_clear_cpu(get_cpu(), mce_inject_cpumask);
162 for_each_online_cpu(cpu) {
163 struct mce *mcpu = &per_cpu(injectm, cpu);
164 if (!mcpu->finished ||
165 MCJ_CTX(mcpu->inject_flags) != MCJ_CTX_RANDOM)
166 cpumask_clear_cpu(cpu, mce_inject_cpumask);
167 }
168 if (!cpumask_empty(mce_inject_cpumask)) {
169 if (m->inject_flags & MCJ_IRQ_BROADCAST) {
170
171
172
173
174 preempt_disable();
175 smp_call_function_many(mce_inject_cpumask,
176 mce_irq_ipi, NULL, 0);
177 preempt_enable();
178 } else if (m->inject_flags & MCJ_NMI_BROADCAST)
179 apic->send_IPI_mask(mce_inject_cpumask,
180 NMI_VECTOR);
181 }
182 start = jiffies;
183 while (!cpumask_empty(mce_inject_cpumask)) {
184 if (!time_before(jiffies, start + 2*HZ)) {
185 pr_err("Timeout waiting for mce inject %lx\n",
186 *cpumask_bits(mce_inject_cpumask));
187 break;
188 }
189 cpu_relax();
190 }
191 raise_local();
192 put_cpu();
193 put_online_cpus();
194 } else {
195 preempt_disable();
196 raise_local();
197 preempt_enable();
198 }
199}
200
201
202static ssize_t mce_write(struct file *filp, const char __user *ubuf,
203 size_t usize, loff_t *off)
204{
205 struct mce m;
206
207 if (!capable(CAP_SYS_ADMIN))
208 return -EPERM;
209
210
211
212
213 if (!boot_cpu_has(X86_FEATURE_MCE) || !boot_cpu_has(X86_FEATURE_MCA))
214 return -EIO;
215
216 if ((unsigned long)usize > sizeof(struct mce))
217 usize = sizeof(struct mce);
218 if (copy_from_user(&m, ubuf, usize))
219 return -EFAULT;
220
221 if (m.extcpu >= num_possible_cpus() || !cpu_online(m.extcpu))
222 return -EINVAL;
223
224
225
226
227
228 schedule_timeout(2);
229
230 mutex_lock(&mce_inject_mutex);
231 raise_mce(&m);
232 mutex_unlock(&mce_inject_mutex);
233 return usize;
234}
235
236static int inject_init(void)
237{
238 if (!alloc_cpumask_var(&mce_inject_cpumask, GFP_KERNEL))
239 return -ENOMEM;
240 pr_info("Machine check injector initialized\n");
241 register_mce_write_callback(mce_write);
242 register_nmi_handler(NMI_LOCAL, mce_raise_notify, 0,
243 "mce_notify");
244 return 0;
245}
246
247module_init(inject_init);
248
249
250
251
252MODULE_LICENSE("GPL");
253