2 * Kprobe module for testing crash dumps
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; either version 2 of the License, or
7 * (at your option) any later version.
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write to the Free Software
16 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
18 * Copyright (C) IBM Corporation, 2006
20 * Author: Ankita Garg <ankita@in.ibm.com>
22 * This module induces system failures at predefined crashpoints to
23 * evaluate the reliability of crash dumps obtained using different dumping
26 * It is adapted from the Linux Kernel Dump Test Tool by
27 * Fernando Luis Vazquez Cao <http://lkdtt.sourceforge.net>
29 * Debugfs support added by Simon Kagstrom <simon.kagstrom@netinsight.net>
31 * See Documentation/fault-injection/provoke-crashes.txt for instructions
33 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
35 #include <linux/kernel.h>
37 #include <linux/module.h>
38 #include <linux/buffer_head.h>
39 #include <linux/kprobes.h>
40 #include <linux/list.h>
41 #include <linux/init.h>
42 #include <linux/interrupt.h>
43 #include <linux/hrtimer.h>
44 #include <linux/slab.h>
45 #include <scsi/scsi_cmnd.h>
46 #include <linux/debugfs.h>
47 #include <linux/vmalloc.h>
48 #include <linux/mman.h>
49 #include <asm/cacheflush.h>
52 #include <linux/ide.h>
56 * Make sure our attempts to overrun the kernel stack don't trigger
57 * a compiler warning when CONFIG_FRAME_WARN is set. Then make sure we
58 * recurse past the end of THREAD_SIZE by default.
60 #if defined(CONFIG_FRAME_WARN) && (CONFIG_FRAME_WARN > 0)
61 #define REC_STACK_SIZE (CONFIG_FRAME_WARN / 2)
63 #define REC_STACK_SIZE (THREAD_SIZE / 8)
65 #define REC_NUM_DEFAULT ((THREAD_SIZE / REC_STACK_SIZE) * 2)
67 #define DEFAULT_COUNT 10
72 CN_INT_HARDWARE_ENTRY,
92 CT_UNALIGNED_LOAD_STORE_WRITE,
93 CT_OVERWRITE_ALLOCATION,
96 CT_WRITE_BUDDY_AFTER_FREE,
97 CT_READ_BUDDY_AFTER_FREE,
109 CT_WRITE_RO_AFTER_INIT,
114 static char* cp_name[] = {
115 "INT_HARDWARE_ENTRY",
126 static char* cp_type[] = {
134 "UNALIGNED_LOAD_STORE_WRITE",
135 "OVERWRITE_ALLOCATION",
138 "WRITE_BUDDY_AFTER_FREE",
139 "READ_BUDDY_AFTER_FREE",
151 "WRITE_RO_AFTER_INIT",
156 static struct jprobe lkdtm;
158 static int lkdtm_parse_commandline(void);
159 static void lkdtm_handler(void);
161 static char* cpoint_name;
162 static char* cpoint_type;
163 static int cpoint_count = DEFAULT_COUNT;
164 static int recur_count = REC_NUM_DEFAULT;
166 static enum cname cpoint = CN_INVALID;
167 static enum ctype cptype = CT_NONE;
168 static int count = DEFAULT_COUNT;
169 static DEFINE_SPINLOCK(count_lock);
170 static DEFINE_SPINLOCK(lock_me_up);
172 static u8 data_area[EXEC_SIZE];
174 static const unsigned long rodata = 0xAA55AA55;
175 static unsigned long ro_after_init __ro_after_init = 0x55AA5500;
177 module_param(recur_count, int, 0644);
178 MODULE_PARM_DESC(recur_count, " Recursion level for the stack overflow test");
179 module_param(cpoint_name, charp, 0444);
180 MODULE_PARM_DESC(cpoint_name, " Crash Point, where kernel is to be crashed");
181 module_param(cpoint_type, charp, 0444);
182 MODULE_PARM_DESC(cpoint_type, " Crash Point Type, action to be taken on "\
183 "hitting the crash point");
184 module_param(cpoint_count, int, 0644);
185 MODULE_PARM_DESC(cpoint_count, " Crash Point Count, number of times the "\
186 "crash point is to be hit to trigger action");
188 static unsigned int jp_do_irq(unsigned int irq)
195 static irqreturn_t jp_handle_irq_event(unsigned int irq,
196 struct irqaction *action)
203 static void jp_tasklet_action(struct softirq_action *a)
209 static void jp_ll_rw_block(int rw, int nr, struct buffer_head *bhs[])
217 static unsigned long jp_shrink_inactive_list(unsigned long max_scan,
219 struct scan_control *sc)
226 static int jp_hrtimer_start(struct hrtimer *timer, ktime_t tim,
227 const enum hrtimer_mode mode)
234 static int jp_scsi_dispatch_cmd(struct scsi_cmnd *cmd)
242 static int jp_generic_ide_ioctl(ide_drive_t *drive, struct file *file,
243 struct block_device *bdev, unsigned int cmd,
252 /* Return the crash type number, or CT_NONE if the name is invalid */
253 static enum ctype parse_cp_type(const char *what, size_t count)
257 for (i = 0; i < ARRAY_SIZE(cp_type); i++) {
258 if (!strcmp(what, cp_type[i]))
265 static const char *cp_type_to_str(enum ctype type)
267 if (type == CT_NONE || type < 0 || type > ARRAY_SIZE(cp_type))
270 return cp_type[type - 1];
273 static const char *cp_name_to_str(enum cname name)
275 if (name == CN_INVALID || name < 0 || name > ARRAY_SIZE(cp_name))
278 return cp_name[name - 1];
282 static int lkdtm_parse_commandline(void)
287 if (cpoint_count < 1 || recur_count < 1)
290 spin_lock_irqsave(&count_lock, flags);
291 count = cpoint_count;
292 spin_unlock_irqrestore(&count_lock, flags);
294 /* No special parameters */
295 if (!cpoint_type && !cpoint_name)
298 /* Neither or both of these need to be set */
299 if (!cpoint_type || !cpoint_name)
302 cptype = parse_cp_type(cpoint_type, strlen(cpoint_type));
303 if (cptype == CT_NONE)
306 for (i = 0; i < ARRAY_SIZE(cp_name); i++) {
307 if (!strcmp(cpoint_name, cp_name[i])) {
313 /* Could not find a valid crash point */
317 static int recursive_loop(int remaining)
319 char buf[REC_STACK_SIZE];
321 /* Make sure compiler does not optimize this away. */
322 memset(buf, (remaining & 0xff) | 0x1, REC_STACK_SIZE);
326 return recursive_loop(remaining - 1);
329 static void do_nothing(void)
335 /* Must immediately follow do_nothing for size calculations to work out. */
335 static void do_overwritten(void)
337 pr_info("do_overwritten wasn't overwritten!\n");
341 static noinline void corrupt_stack(void)
343 /* Use default char array length that triggers stack protection. */
346 memset((void *)data, 0, 64);
349 static void noinline execute_location(void *dst)
351 void (*func)(void) = dst;
353 pr_info("attempting ok execution at %p\n", do_nothing);
356 memcpy(dst, do_nothing, EXEC_SIZE);
357 flush_icache_range((unsigned long)dst, (unsigned long)dst + EXEC_SIZE);
358 pr_info("attempting bad execution at %p\n", func);
362 static void execute_user_location(void *dst)
364 /* Intentionally crossing kernel/user memory boundary. */
365 void (*func)(void) = dst;
367 pr_info("attempting ok execution at %p\n", do_nothing);
370 if (copy_to_user((void __user *)dst, do_nothing, EXEC_SIZE))
372 flush_icache_range((unsigned long)dst, (unsigned long)dst + EXEC_SIZE);
373 pr_info("attempting bad execution at %p\n", func);
377 static void lkdtm_do_action(enum ctype which)
397 (void) recursive_loop(recur_count);
399 case CT_CORRUPT_STACK:
402 case CT_UNALIGNED_LOAD_STORE_WRITE: {
403 static u8 data[5] __attribute__((aligned(4))) = {1, 2,
406 u32 val = 0x12345678;
408 p = (u32 *)(data + 1);
414 case CT_OVERWRITE_ALLOCATION: {
416 u32 *data = kmalloc(len, GFP_KERNEL);
418 data[1024 / sizeof(u32)] = 0x12345678;
422 case CT_WRITE_AFTER_FREE: {
426 * The slub allocator uses the first word to store the free
427 * pointer in some configurations. Use the middle of the
428 * allocation to avoid running into the freelist
430 size_t offset = (len / sizeof(*base)) / 2;
432 base = kmalloc(len, GFP_KERNEL);
433 pr_info("Allocated memory %p-%p\n", base, &base[offset * 2]);
434 pr_info("Attempting bad write to freed memory at %p\n",
437 base[offset] = 0x0abcdef0;
438 /* Attempt to notice the overwrite. */
439 again = kmalloc(len, GFP_KERNEL);
442 pr_info("Hmm, didn't get the same memory range.\n");
446 case CT_READ_AFTER_FREE: {
447 int *base, *val, saw;
450 * The slub allocator uses the first word to store the free
451 * pointer in some configurations. Use the middle of the
452 * allocation to avoid running into the freelist
454 size_t offset = (len / sizeof(*base)) / 2;
456 base = kmalloc(len, GFP_KERNEL);
460 val = kmalloc(len, GFP_KERNEL);
468 pr_info("Value in memory before free: %x\n", base[offset]);
472 pr_info("Attempting bad read from freed memory\n");
475 /* Good! Poisoning happened, so declare a win. */
476 pr_info("Memory correctly poisoned (%x)\n", saw);
479 pr_info("Memory was not poisoned\n");
484 case CT_WRITE_BUDDY_AFTER_FREE: {
485 unsigned long p = __get_free_page(GFP_KERNEL);
488 pr_info("Writing to the buddy page before free\n");
489 memset((void *)p, 0x3, PAGE_SIZE);
492 pr_info("Attempting bad write to the buddy page after free\n");
493 memset((void *)p, 0x78, PAGE_SIZE);
494 /* Attempt to notice the overwrite. */
495 p = __get_free_page(GFP_KERNEL);
501 case CT_READ_BUDDY_AFTER_FREE: {
502 unsigned long p = __get_free_page(GFP_KERNEL);
509 val = kmalloc(1024, GFP_KERNEL);
517 pr_info("Value in memory before free: %x\n", base[0]);
519 pr_info("Attempting to read from freed memory\n");
522 /* Good! Poisoning happened, so declare a win. */
523 pr_info("Memory correctly poisoned (%x)\n", saw);
526 pr_info("Buddy page was not poisoned\n");
542 /* Must be called twice to trigger. */
543 spin_lock(&lock_me_up);
544 /* Let sparse know we intended to exit holding the lock. */
545 __release(&lock_me_up);
548 set_current_state(TASK_UNINTERRUPTIBLE);
552 execute_location(data_area);
554 case CT_EXEC_STACK: {
555 u8 stack_area[EXEC_SIZE];
556 execute_location(stack_area);
559 case CT_EXEC_KMALLOC: {
560 u32 *kmalloc_area = kmalloc(EXEC_SIZE, GFP_KERNEL);
561 execute_location(kmalloc_area);
565 case CT_EXEC_VMALLOC: {
566 u32 *vmalloc_area = vmalloc(EXEC_SIZE);
567 execute_location(vmalloc_area);
571 case CT_EXEC_USERSPACE: {
572 unsigned long user_addr;
574 user_addr = vm_mmap(NULL, 0, PAGE_SIZE,
575 PROT_READ | PROT_WRITE | PROT_EXEC,
576 MAP_ANONYMOUS | MAP_PRIVATE, 0);
577 if (user_addr >= TASK_SIZE) {
578 pr_warn("Failed to allocate user memory\n");
581 execute_user_location((void *)user_addr);
582 vm_munmap(user_addr, PAGE_SIZE);
585 case CT_ACCESS_USERSPACE: {
586 unsigned long user_addr, tmp = 0;
589 user_addr = vm_mmap(NULL, 0, PAGE_SIZE,
590 PROT_READ | PROT_WRITE | PROT_EXEC,
591 MAP_ANONYMOUS | MAP_PRIVATE, 0);
592 if (user_addr >= TASK_SIZE) {
593 pr_warn("Failed to allocate user memory\n");
597 if (copy_to_user((void __user *)user_addr, &tmp, sizeof(tmp))) {
598 pr_warn("copy_to_user failed\n");
599 vm_munmap(user_addr, PAGE_SIZE);
603 ptr = (unsigned long *)user_addr;
605 pr_info("attempting bad read at %p\n", ptr);
609 pr_info("attempting bad write at %p\n", ptr);
612 vm_munmap(user_addr, PAGE_SIZE);
617 /* Explicitly cast away "const" for the test. */
618 unsigned long *ptr = (unsigned long *)&rodata;
620 pr_info("attempting bad rodata write at %p\n", ptr);
625 case CT_WRITE_RO_AFTER_INIT: {
626 unsigned long *ptr = &ro_after_init;
629 * Verify we were written to during init. Since an Oops
630 * is considered a "success", a failure is to just skip the
633 if ((*ptr & 0xAA) != 0xAA) {
634 pr_info("%p was NOT written during init!?\n", ptr);
638 pr_info("attempting bad ro_after_init write at %p\n", ptr);
643 case CT_WRITE_KERN: {
647 size = (unsigned long)do_overwritten -
648 (unsigned long)do_nothing;
649 ptr = (unsigned char *)do_overwritten;
651 pr_info("attempting bad %zu byte write at %p\n", size, ptr);
652 memcpy(ptr, (unsigned char *)do_nothing, size);
653 flush_icache_range((unsigned long)ptr,
654 (unsigned long)(ptr + size));
659 case CT_WRAP_ATOMIC: {
660 atomic_t under = ATOMIC_INIT(INT_MIN);
661 atomic_t over = ATOMIC_INIT(INT_MAX);
663 pr_info("attempting atomic underflow\n");
665 pr_info("attempting atomic overflow\n");
677 static void lkdtm_handler(void)
682 spin_lock_irqsave(&count_lock, flags);
684 pr_info("Crash point %s of type %s hit, trigger in %d rounds\n",
685 cp_name_to_str(cpoint), cp_type_to_str(cptype), count);
689 count = cpoint_count;
691 spin_unlock_irqrestore(&count_lock, flags);
694 lkdtm_do_action(cptype);
697 static int lkdtm_register_cpoint(enum cname which)
702 if (lkdtm.entry != NULL)
703 unregister_jprobe(&lkdtm);
707 lkdtm_do_action(cptype);
709 case CN_INT_HARDWARE_ENTRY:
710 lkdtm.kp.symbol_name = "do_IRQ";
711 lkdtm.entry = (kprobe_opcode_t*) jp_do_irq;
713 case CN_INT_HW_IRQ_EN:
714 lkdtm.kp.symbol_name = "handle_IRQ_event";
715 lkdtm.entry = (kprobe_opcode_t*) jp_handle_irq_event;
717 case CN_INT_TASKLET_ENTRY:
718 lkdtm.kp.symbol_name = "tasklet_action";
719 lkdtm.entry = (kprobe_opcode_t*) jp_tasklet_action;
722 lkdtm.kp.symbol_name = "ll_rw_block";
723 lkdtm.entry = (kprobe_opcode_t*) jp_ll_rw_block;
726 lkdtm.kp.symbol_name = "shrink_inactive_list";
727 lkdtm.entry = (kprobe_opcode_t*) jp_shrink_inactive_list;
730 lkdtm.kp.symbol_name = "hrtimer_start";
731 lkdtm.entry = (kprobe_opcode_t*) jp_hrtimer_start;
733 case CN_SCSI_DISPATCH_CMD:
734 lkdtm.kp.symbol_name = "scsi_dispatch_cmd";
735 lkdtm.entry = (kprobe_opcode_t*) jp_scsi_dispatch_cmd;
739 lkdtm.kp.symbol_name = "generic_ide_ioctl";
740 lkdtm.entry = (kprobe_opcode_t*) jp_generic_ide_ioctl;
742 pr_info("Crash point not available\n");
747 pr_info("Invalid Crash Point\n");
752 if ((ret = register_jprobe(&lkdtm)) < 0) {
753 pr_info("Couldn't register jprobe\n");
760 static ssize_t do_register_entry(enum cname which, struct file *f,
761 const char __user *user_buf, size_t count, loff_t *off)
766 if (count >= PAGE_SIZE)
769 buf = (char *)__get_free_page(GFP_KERNEL);
772 if (copy_from_user(buf, user_buf, count)) {
773 free_page((unsigned long) buf);
776 /* NUL-terminate and remove the trailing newline */
780 cptype = parse_cp_type(buf, count);
781 free_page((unsigned long) buf);
783 if (cptype == CT_NONE)
786 err = lkdtm_register_cpoint(which);
795 /* Generic read callback that just prints out the available crash types */
796 static ssize_t lkdtm_debugfs_read(struct file *f, char __user *user_buf,
797 size_t count, loff_t *off)
802 buf = (char *)__get_free_page(GFP_KERNEL);
806 n = snprintf(buf, PAGE_SIZE, "Available crash types:\n");
807 for (i = 0; i < ARRAY_SIZE(cp_type); i++)
808 n += snprintf(buf + n, PAGE_SIZE - n, "%s\n", cp_type[i]);
811 out = simple_read_from_buffer(user_buf, count, off,
813 free_page((unsigned long) buf);
818 static int lkdtm_debugfs_open(struct inode *inode, struct file *file)
824 static ssize_t int_hardware_entry(struct file *f, const char __user *buf,
825 size_t count, loff_t *off)
827 return do_register_entry(CN_INT_HARDWARE_ENTRY, f, buf, count, off);
830 static ssize_t int_hw_irq_en(struct file *f, const char __user *buf,
831 size_t count, loff_t *off)
833 return do_register_entry(CN_INT_HW_IRQ_EN, f, buf, count, off);
836 static ssize_t int_tasklet_entry(struct file *f, const char __user *buf,
837 size_t count, loff_t *off)
839 return do_register_entry(CN_INT_TASKLET_ENTRY, f, buf, count, off);
842 static ssize_t fs_devrw_entry(struct file *f, const char __user *buf,
843 size_t count, loff_t *off)
845 return do_register_entry(CN_FS_DEVRW, f, buf, count, off);
848 static ssize_t mem_swapout_entry(struct file *f, const char __user *buf,
849 size_t count, loff_t *off)
851 return do_register_entry(CN_MEM_SWAPOUT, f, buf, count, off);
854 static ssize_t timeradd_entry(struct file *f, const char __user *buf,
855 size_t count, loff_t *off)
857 return do_register_entry(CN_TIMERADD, f, buf, count, off);
860 static ssize_t scsi_dispatch_cmd_entry(struct file *f,
861 const char __user *buf, size_t count, loff_t *off)
863 return do_register_entry(CN_SCSI_DISPATCH_CMD, f, buf, count, off);
866 static ssize_t ide_core_cp_entry(struct file *f, const char __user *buf,
867 size_t count, loff_t *off)
869 return do_register_entry(CN_IDE_CORE_CP, f, buf, count, off);
872 /* Special entry to just crash directly. Available without KPROBEs */
873 static ssize_t direct_entry(struct file *f, const char __user *user_buf,
874 size_t count, loff_t *off)
879 if (count >= PAGE_SIZE)
884 buf = (char *)__get_free_page(GFP_KERNEL);
887 if (copy_from_user(buf, user_buf, count)) {
888 free_page((unsigned long) buf);
891 /* NUL-terminate and remove the trailing newline */
895 type = parse_cp_type(buf, count);
896 free_page((unsigned long) buf);
900 pr_info("Performing direct entry %s\n", cp_type_to_str(type));
901 lkdtm_do_action(type);
909 const struct file_operations fops;
912 static const struct crash_entry crash_entries[] = {
913 {"DIRECT", {.read = lkdtm_debugfs_read,
914 .llseek = generic_file_llseek,
915 .open = lkdtm_debugfs_open,
916 .write = direct_entry} },
917 {"INT_HARDWARE_ENTRY", {.read = lkdtm_debugfs_read,
918 .llseek = generic_file_llseek,
919 .open = lkdtm_debugfs_open,
920 .write = int_hardware_entry} },
921 {"INT_HW_IRQ_EN", {.read = lkdtm_debugfs_read,
922 .llseek = generic_file_llseek,
923 .open = lkdtm_debugfs_open,
924 .write = int_hw_irq_en} },
925 {"INT_TASKLET_ENTRY", {.read = lkdtm_debugfs_read,
926 .llseek = generic_file_llseek,
927 .open = lkdtm_debugfs_open,
928 .write = int_tasklet_entry} },
929 {"FS_DEVRW", {.read = lkdtm_debugfs_read,
930 .llseek = generic_file_llseek,
931 .open = lkdtm_debugfs_open,
932 .write = fs_devrw_entry} },
933 {"MEM_SWAPOUT", {.read = lkdtm_debugfs_read,
934 .llseek = generic_file_llseek,
935 .open = lkdtm_debugfs_open,
936 .write = mem_swapout_entry} },
937 {"TIMERADD", {.read = lkdtm_debugfs_read,
938 .llseek = generic_file_llseek,
939 .open = lkdtm_debugfs_open,
940 .write = timeradd_entry} },
941 {"SCSI_DISPATCH_CMD", {.read = lkdtm_debugfs_read,
942 .llseek = generic_file_llseek,
943 .open = lkdtm_debugfs_open,
944 .write = scsi_dispatch_cmd_entry} },
945 {"IDE_CORE_CP", {.read = lkdtm_debugfs_read,
946 .llseek = generic_file_llseek,
947 .open = lkdtm_debugfs_open,
948 .write = ide_core_cp_entry} },
951 static struct dentry *lkdtm_debugfs_root;
953 static int __init lkdtm_module_init(void)
956 int n_debugfs_entries = 1; /* Assume only the direct entry */
959 /* Make sure we can write to __ro_after_init values during __init */
960 ro_after_init |= 0xAA;
962 /* Register debugfs interface */
963 lkdtm_debugfs_root = debugfs_create_dir("provoke-crash", NULL);
964 if (!lkdtm_debugfs_root) {
965 pr_err("creating root dir failed\n");
969 #ifdef CONFIG_KPROBES
970 n_debugfs_entries = ARRAY_SIZE(crash_entries);
973 for (i = 0; i < n_debugfs_entries; i++) {
974 const struct crash_entry *cur = &crash_entries[i];
977 de = debugfs_create_file(cur->name, 0644, lkdtm_debugfs_root,
980 pr_err("could not create %s\n", cur->name);
985 if (lkdtm_parse_commandline() == -EINVAL) {
986 pr_info("Invalid command\n");
990 if (cpoint != CN_INVALID && cptype != CT_NONE) {
991 ret = lkdtm_register_cpoint(cpoint);
993 pr_info("Invalid crash point %d\n", cpoint);
996 pr_info("Crash point %s of type %s registered\n",
997 cpoint_name, cpoint_type);
999 pr_info("No crash points registered, enable through debugfs\n");
1005 debugfs_remove_recursive(lkdtm_debugfs_root);
1009 static void __exit lkdtm_module_exit(void)
1011 debugfs_remove_recursive(lkdtm_debugfs_root);
1013 unregister_jprobe(&lkdtm);
1014 pr_info("Crash point unregistered\n");
1017 module_init(lkdtm_module_init);
1018 module_exit(lkdtm_module_exit);
1020 MODULE_LICENSE("GPL");
1021 MODULE_DESCRIPTION("Kprobe module for testing crash dumps");