kernel: add panic_on_warn

author Prarit Bhargava <prarit@redhat.com>

Wed, 10 Dec 2014 23:45:50 +0000 (15:45 -0800)

committer Linus Torvalds <torvalds@linux-foundation.org>

Thu, 11 Dec 2014 01:41:10 +0000 (17:41 -0800)
author Prarit Bhargava <prarit@redhat.com>
Wed, 10 Dec 2014 23:45:50 +0000 (15:45 -0800)
committer Linus Torvalds <torvalds@linux-foundation.org>
Thu, 11 Dec 2014 01:41:10 +0000 (17:41 -0800)
diff --git a/Documentation/kdump/kdump.txt b/Documentation/kdump/kdump.txt

index 6c0b9f27e4652c94616ce32643a7fbe32d370eda..bc4bd5a44b88b9abedec6b4d859f1163c3c2a6ac 100644 (file)
--- a/Documentation/kdump/kdump.txt
+++ b/Documentation/kdump/kdump.txt
@@ -471,6 +471,13 @@ format. Crash is available on Dave Anderson's site at the following URL:
  
     http://people.redhat.com/~anderson/
  
+Trigger Kdump on WARN()
+=======================
+
+The kernel parameter panic_on_warn makes every WARN() path call panic().  This
+will cause a kdump to occur at the panic() call.  In cases where a user wants
+to enable this at runtime, /proc/sys/kernel/panic_on_warn can be set to 1
+to achieve the same behaviour.
  
  Contact
  =======
diff --git a/Documentation/kernel-parameters.txt b/Documentation/kernel-parameters.txt

index 838f3776c9249e2cd3d5e17c966f0fb4acdad796..d6eb3636fe5a4c12205e028da84f0e09b7d704ae 100644 (file)
--- a/Documentation/kernel-parameters.txt
+++ b/Documentation/kernel-parameters.txt
@@ -2509,6 +2509,9 @@ bytes respectively. Such letter suffixes can also be entirely omitted.
                         timeout < 0: reboot immediately
                         Format: <timeout>
  
+       panic_on_warn   panic() after printing the WARN() location.  Useful
+                       to cause kdump on a WARN().
+
         crash_kexec_post_notifiers
                         Run kdump after running panic-notifiers and dumping
                         kmsg. This only for the users who doubt kdump always
diff --git a/Documentation/sysctl/kernel.txt b/Documentation/sysctl/kernel.txt

index 57baff5bdb806b3b725bdc7859c385fbdc1cac54..b5d0c8501a189c8e2473bea02502cd6a5932eecd 100644 (file)
--- a/Documentation/sysctl/kernel.txt
+++ b/Documentation/sysctl/kernel.txt
@@ -54,8 +54,9 @@ show up in /proc/sys/kernel:
  - overflowuid
  - panic
  - panic_on_oops
-- panic_on_unrecovered_nmi
  - panic_on_stackoverflow
+- panic_on_unrecovered_nmi
+- panic_on_warn
  - pid_max
  - powersave-nap               [ PPC only ]
  - printk
@@ -527,19 +528,6 @@ the recommended setting is 60.
  
  ==============================================================
  
-panic_on_unrecovered_nmi:
-
-The default Linux behaviour on an NMI of either memory or unknown is
-to continue operation. For many environments such as scientific
-computing it is preferable that the box is taken out and the error
-dealt with than an uncorrected parity/ECC error get propagated.
-
-A small number of systems do generate NMI's for bizarre random reasons
-such as power management so the default is off. That sysctl works like
-the existing panic controls already in that directory.
-
-==============================================================
-
  panic_on_oops:
  
  Controls the kernel's behaviour when an oops or BUG is encountered.
@@ -563,6 +551,30 @@ This file shows up if CONFIG_DEBUG_STACKOVERFLOW is enabled.
  
  ==============================================================
  
+panic_on_unrecovered_nmi:
+
+The default Linux behaviour on an NMI of either memory or unknown is
+to continue operation. For many environments such as scientific
+computing it is preferable that the box is taken out and the error
+dealt with than an uncorrected parity/ECC error get propagated.
+
+A small number of systems do generate NMI's for bizarre random reasons
+such as power management so the default is off. That sysctl works like
+the existing panic controls already in that directory.
+
+==============================================================
+
+panic_on_warn:
+
+Calls panic() in the WARN() path when set to 1.  This is useful to avoid
+a kernel rebuild when attempting to kdump at the location of a WARN().
+
+0: only WARN(), default behaviour.
+
+1: call panic() after printing out WARN() location.
+
+==============================================================
+
  perf_cpu_time_max_percent:
  
  Hints to the kernel how much CPU time it should be allowed to
diff --git a/include/linux/kernel.h b/include/linux/kernel.h

index 446d76a87ba17f8b3116482a8617df1c5972bc1a..233ea8107038a81cf7a4186196bebd2c861422cd 100644 (file)
--- a/include/linux/kernel.h
+++ b/include/linux/kernel.h
@@ -427,6 +427,7 @@ extern int panic_timeout;
  extern int panic_on_oops;
  extern int panic_on_unrecovered_nmi;
  extern int panic_on_io_nmi;
+extern int panic_on_warn;
  extern int sysctl_panic_on_stackoverflow;
  /*
   * Only to be used by arch init code. If the user over-wrote the default
diff --git a/include/uapi/linux/sysctl.h b/include/uapi/linux/sysctl.h

index 43aaba1cc0372c050f5d5caf0903609ed46f73e0..0956373b56db7825c965fa18084bfedb3f21df3c 100644 (file)
--- a/include/uapi/linux/sysctl.h
+++ b/include/uapi/linux/sysctl.h
@@ -153,6 +153,7 @@ enum
         KERN_MAX_LOCK_DEPTH=74, /* int: rtmutex's maximum lock depth */
         KERN_NMI_WATCHDOG=75, /* int: enable/disable nmi watchdog */
         KERN_PANIC_ON_NMI=76, /* int: whether we will panic on an unrecovered */
+       KERN_PANIC_ON_WARN=77, /* int: call panic() in WARN() functions */
  };
  
  
diff --git a/kernel/panic.c b/kernel/panic.c

index cf80672b79246dd439f64cea16d3e631e7d35f2f..4d8d6f906decede78600ef0767770dd713f8b225 100644 (file)
--- a/kernel/panic.c
+++ b/kernel/panic.c
@@ -33,6 +33,7 @@ static int pause_on_oops;
  static int pause_on_oops_flag;
  static DEFINE_SPINLOCK(pause_on_oops_lock);
  static bool crash_kexec_post_notifiers;
+int panic_on_warn __read_mostly;
  
  int panic_timeout = CONFIG_PANIC_TIMEOUT;
  EXPORT_SYMBOL_GPL(panic_timeout);
@@ -428,6 +429,17 @@ static void warn_slowpath_common(const char *file, int line, void *caller,
         if (args)
                 vprintk(args->fmt, args->args);
  
+       if (panic_on_warn) {
+               /*
+                * This thread may hit another WARN() in the panic path.
+                * Resetting this prevents additional WARN() from panicking the
+                * system on this thread.  Other threads are blocked by the
+                * panic_lock spinlock in panic().
+                */
+               panic_on_warn = 0;
+               panic("panic_on_warn set ...\n");
+       }
+
         print_modules();
         dump_stack();
         print_oops_end_marker();
@@ -485,6 +497,7 @@ EXPORT_SYMBOL(__stack_chk_fail);
  
  core_param(panic, panic_timeout, int, 0644);
  core_param(pause_on_oops, pause_on_oops, int, 0644);
+core_param(panic_on_warn, panic_on_warn, int, 0644);
  
  static int __init setup_crash_kexec_post_notifiers(char *s)
  {
diff --git a/kernel/sysctl.c b/kernel/sysctl.c

index 15f2511a1b7c6e04a48f99c1b6a402f008607ba3..7c54ff79afd7f053c8ce5a943d4cf7fb9d8acb2b 100644 (file)
--- a/kernel/sysctl.c
+++ b/kernel/sysctl.c
@@ -1104,6 +1104,15 @@ static struct ctl_table kern_table[] = {
                 .proc_handler   = proc_dointvec,
         },
  #endif
+       {
+               .procname       = "panic_on_warn",
+               .data           = &panic_on_warn,
+               .maxlen         = sizeof(int),
+               .mode           = 0644,
+               .proc_handler   = proc_dointvec_minmax,
+               .extra1         = &zero,
+               .extra2         = &one,
+       },
         { }
  };
  
diff --git a/kernel/sysctl_binary.c b/kernel/sysctl_binary.c

index 9a4f750a296329861b95672dc00cfa4dc2ef515f..7e7746a42a623e66034b73c1e78f017d469b9f53 100644 (file)
--- a/kernel/sysctl_binary.c
+++ b/kernel/sysctl_binary.c
@@ -137,6 +137,7 @@ static const struct bin_table bin_kern_table[] = {
         { CTL_INT,      KERN_COMPAT_LOG,                "compat-log" },
         { CTL_INT,      KERN_MAX_LOCK_DEPTH,            "max_lock_depth" },
         { CTL_INT,      KERN_PANIC_ON_NMI,              "panic_on_unrecovered_nmi" },
+       { CTL_INT,      KERN_PANIC_ON_WARN,             "panic_on_warn" },
         {}
  };
author	Prarit Bhargava <prarit@redhat.com>
	Wed, 10 Dec 2014 23:45:50 +0000 (15:45 -0800)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Thu, 11 Dec 2014 01:41:10 +0000 (17:41 -0800)
Documentation/kdump/kdump.txt		patch \| blob \| blame \| history
Documentation/kernel-parameters.txt		patch \| blob \| blame \| history
Documentation/sysctl/kernel.txt		patch \| blob \| blame \| history
include/linux/kernel.h		patch \| blob \| blame \| history
include/uapi/linux/sysctl.h		patch \| blob \| blame \| history
kernel/panic.c		patch \| blob \| blame \| history
kernel/sysctl.c		patch \| blob \| blame \| history
kernel/sysctl_binary.c		patch \| blob \| blame \| history