|  | /* | 
|  | * Machine check injection support. | 
|  | * Copyright 2008 Intel Corporation. | 
|  | * | 
|  | * This program is free software; you can redistribute it and/or | 
|  | * modify it under the terms of the GNU General Public License | 
|  | * as published by the Free Software Foundation; version 2 | 
|  | * of the License. | 
|  | * | 
|  | * Authors: | 
|  | * Andi Kleen | 
|  | * Ying Huang | 
|  | */ | 
|  | #include <linux/uaccess.h> | 
|  | #include <linux/module.h> | 
|  | #include <linux/timer.h> | 
|  | #include <linux/kernel.h> | 
|  | #include <linux/string.h> | 
|  | #include <linux/fs.h> | 
|  | #include <linux/smp.h> | 
|  | #include <linux/notifier.h> | 
|  | #include <linux/kdebug.h> | 
|  | #include <linux/cpu.h> | 
|  | #include <linux/sched.h> | 
|  | #include <linux/gfp.h> | 
|  | #include <asm/mce.h> | 
|  | #include <asm/apic.h> | 
|  |  | 
|  | /* Update fake mce registers on current CPU. */ | 
|  | static void inject_mce(struct mce *m) | 
|  | { | 
|  | struct mce *i = &per_cpu(injectm, m->extcpu); | 
|  |  | 
|  | /* Make sure noone reads partially written injectm */ | 
|  | i->finished = 0; | 
|  | mb(); | 
|  | m->finished = 0; | 
|  | /* First set the fields after finished */ | 
|  | i->extcpu = m->extcpu; | 
|  | mb(); | 
|  | /* Now write record in order, finished last (except above) */ | 
|  | memcpy(i, m, sizeof(struct mce)); | 
|  | /* Finally activate it */ | 
|  | mb(); | 
|  | i->finished = 1; | 
|  | } | 
|  |  | 
|  | static void raise_poll(struct mce *m) | 
|  | { | 
|  | unsigned long flags; | 
|  | mce_banks_t b; | 
|  |  | 
|  | memset(&b, 0xff, sizeof(mce_banks_t)); | 
|  | local_irq_save(flags); | 
|  | machine_check_poll(0, &b); | 
|  | local_irq_restore(flags); | 
|  | m->finished = 0; | 
|  | } | 
|  |  | 
|  | static void raise_exception(struct mce *m, struct pt_regs *pregs) | 
|  | { | 
|  | struct pt_regs regs; | 
|  | unsigned long flags; | 
|  |  | 
|  | if (!pregs) { | 
|  | memset(®s, 0, sizeof(struct pt_regs)); | 
|  | regs.ip = m->ip; | 
|  | regs.cs = m->cs; | 
|  | pregs = ®s; | 
|  | } | 
|  | /* in mcheck exeception handler, irq will be disabled */ | 
|  | local_irq_save(flags); | 
|  | do_machine_check(pregs, 0); | 
|  | local_irq_restore(flags); | 
|  | m->finished = 0; | 
|  | } | 
|  |  | 
|  | static cpumask_var_t mce_inject_cpumask; | 
|  |  | 
|  | static int mce_raise_notify(struct notifier_block *self, | 
|  | unsigned long val, void *data) | 
|  | { | 
|  | struct die_args *args = (struct die_args *)data; | 
|  | int cpu = smp_processor_id(); | 
|  | struct mce *m = &__get_cpu_var(injectm); | 
|  | if (val != DIE_NMI_IPI || !cpumask_test_cpu(cpu, mce_inject_cpumask)) | 
|  | return NOTIFY_DONE; | 
|  | cpumask_clear_cpu(cpu, mce_inject_cpumask); | 
|  | if (m->inject_flags & MCJ_EXCEPTION) | 
|  | raise_exception(m, args->regs); | 
|  | else if (m->status) | 
|  | raise_poll(m); | 
|  | return NOTIFY_STOP; | 
|  | } | 
|  |  | 
|  | static struct notifier_block mce_raise_nb = { | 
|  | .notifier_call = mce_raise_notify, | 
|  | .priority = 1000, | 
|  | }; | 
|  |  | 
|  | /* Inject mce on current CPU */ | 
|  | static int raise_local(void) | 
|  | { | 
|  | struct mce *m = &__get_cpu_var(injectm); | 
|  | int context = MCJ_CTX(m->inject_flags); | 
|  | int ret = 0; | 
|  | int cpu = m->extcpu; | 
|  |  | 
|  | if (m->inject_flags & MCJ_EXCEPTION) { | 
|  | printk(KERN_INFO "Triggering MCE exception on CPU %d\n", cpu); | 
|  | switch (context) { | 
|  | case MCJ_CTX_IRQ: | 
|  | /* | 
|  | * Could do more to fake interrupts like | 
|  | * calling irq_enter, but the necessary | 
|  | * machinery isn't exported currently. | 
|  | */ | 
|  | /*FALL THROUGH*/ | 
|  | case MCJ_CTX_PROCESS: | 
|  | raise_exception(m, NULL); | 
|  | break; | 
|  | default: | 
|  | printk(KERN_INFO "Invalid MCE context\n"); | 
|  | ret = -EINVAL; | 
|  | } | 
|  | printk(KERN_INFO "MCE exception done on CPU %d\n", cpu); | 
|  | } else if (m->status) { | 
|  | printk(KERN_INFO "Starting machine check poll CPU %d\n", cpu); | 
|  | raise_poll(m); | 
|  | mce_notify_irq(); | 
|  | printk(KERN_INFO "Machine check poll done on CPU %d\n", cpu); | 
|  | } else | 
|  | m->finished = 0; | 
|  |  | 
|  | return ret; | 
|  | } | 
|  |  | 
|  | static void raise_mce(struct mce *m) | 
|  | { | 
|  | int context = MCJ_CTX(m->inject_flags); | 
|  |  | 
|  | inject_mce(m); | 
|  |  | 
|  | if (context == MCJ_CTX_RANDOM) | 
|  | return; | 
|  |  | 
|  | #ifdef CONFIG_X86_LOCAL_APIC | 
|  | if (m->inject_flags & MCJ_NMI_BROADCAST) { | 
|  | unsigned long start; | 
|  | int cpu; | 
|  | get_online_cpus(); | 
|  | cpumask_copy(mce_inject_cpumask, cpu_online_mask); | 
|  | cpumask_clear_cpu(get_cpu(), mce_inject_cpumask); | 
|  | for_each_online_cpu(cpu) { | 
|  | struct mce *mcpu = &per_cpu(injectm, cpu); | 
|  | if (!mcpu->finished || | 
|  | MCJ_CTX(mcpu->inject_flags) != MCJ_CTX_RANDOM) | 
|  | cpumask_clear_cpu(cpu, mce_inject_cpumask); | 
|  | } | 
|  | if (!cpumask_empty(mce_inject_cpumask)) | 
|  | apic->send_IPI_mask(mce_inject_cpumask, NMI_VECTOR); | 
|  | start = jiffies; | 
|  | while (!cpumask_empty(mce_inject_cpumask)) { | 
|  | if (!time_before(jiffies, start + 2*HZ)) { | 
|  | printk(KERN_ERR | 
|  | "Timeout waiting for mce inject NMI %lx\n", | 
|  | *cpumask_bits(mce_inject_cpumask)); | 
|  | break; | 
|  | } | 
|  | cpu_relax(); | 
|  | } | 
|  | raise_local(); | 
|  | put_cpu(); | 
|  | put_online_cpus(); | 
|  | } else | 
|  | #endif | 
|  | raise_local(); | 
|  | } | 
|  |  | 
|  | /* Error injection interface */ | 
|  | static ssize_t mce_write(struct file *filp, const char __user *ubuf, | 
|  | size_t usize, loff_t *off) | 
|  | { | 
|  | struct mce m; | 
|  |  | 
|  | if (!capable(CAP_SYS_ADMIN)) | 
|  | return -EPERM; | 
|  | /* | 
|  | * There are some cases where real MSR reads could slip | 
|  | * through. | 
|  | */ | 
|  | if (!boot_cpu_has(X86_FEATURE_MCE) || !boot_cpu_has(X86_FEATURE_MCA)) | 
|  | return -EIO; | 
|  |  | 
|  | if ((unsigned long)usize > sizeof(struct mce)) | 
|  | usize = sizeof(struct mce); | 
|  | if (copy_from_user(&m, ubuf, usize)) | 
|  | return -EFAULT; | 
|  |  | 
|  | if (m.extcpu >= num_possible_cpus() || !cpu_online(m.extcpu)) | 
|  | return -EINVAL; | 
|  |  | 
|  | /* | 
|  | * Need to give user space some time to set everything up, | 
|  | * so do it a jiffie or two later everywhere. | 
|  | */ | 
|  | schedule_timeout(2); | 
|  | raise_mce(&m); | 
|  | return usize; | 
|  | } | 
|  |  | 
|  | static int inject_init(void) | 
|  | { | 
|  | if (!alloc_cpumask_var(&mce_inject_cpumask, GFP_KERNEL)) | 
|  | return -ENOMEM; | 
|  | printk(KERN_INFO "Machine check injector initialized\n"); | 
|  | mce_chrdev_ops.write = mce_write; | 
|  | register_die_notifier(&mce_raise_nb); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | module_init(inject_init); | 
|  | /* | 
|  | * Cannot tolerate unloading currently because we cannot | 
|  | * guarantee all openers of mce_chrdev will get a reference to us. | 
|  | */ | 
|  | MODULE_LICENSE("GPL"); |