watchdog/hardlockup: detect hard lockups using secondary (buddy) CPUs

author Douglas Anderson <dianders@chromium.org>

Fri, 19 May 2023 17:18:38 +0000 (10:18 -0700)

committer Andrew Morton <akpm@linux-foundation.org>

Sat, 10 Jun 2023 00:44:21 +0000 (17:44 -0700)
author Douglas Anderson <dianders@chromium.org>
Fri, 19 May 2023 17:18:38 +0000 (10:18 -0700)
committer Andrew Morton <akpm@linux-foundation.org>
Sat, 10 Jun 2023 00:44:21 +0000 (17:44 -0700)
diff --git a/include/linux/nmi.h b/include/linux/nmi.h

index e23b4dc..1cdadc6 100644 (file)
--- a/include/linux/nmi.h
+++ b/include/linux/nmi.h
@@ -85,8 +85,9 @@ extern unsigned int hardlockup_panic;
  static inline void hardlockup_detector_disable(void) {}
  #endif
  
-#if defined(CONFIG_HARDLOCKUP_DETECTOR_PERF)
+#if defined(CONFIG_HARDLOCKUP_DETECTOR_COUNTS_HRTIMER)
  void arch_touch_nmi_watchdog(void);
+void watchdog_hardlockup_touch_cpu(unsigned int cpu);
  void watchdog_hardlockup_check(unsigned int cpu, struct pt_regs *regs);
  #elif !defined(CONFIG_HAVE_NMI_WATCHDOG)
  static inline void arch_touch_nmi_watchdog(void) { }
@@ -116,6 +117,12 @@ void watchdog_hardlockup_disable(unsigned int cpu);
  
  void lockup_detector_reconfigure(void);
  
+#ifdef CONFIG_HARDLOCKUP_DETECTOR_BUDDY
+void watchdog_buddy_check_hardlockup(unsigned long hrtimer_interrupts);
+#else
+static inline void watchdog_buddy_check_hardlockup(unsigned long hrtimer_interrupts) {}
+#endif
+
  /**
   * touch_nmi_watchdog - manually reset the hardlockup watchdog timeout.
   *
diff --git a/kernel/Makefile b/kernel/Makefile

index 7eb7203..f9e3fd9 100644 (file)
--- a/kernel/Makefile
+++ b/kernel/Makefile
@@ -91,6 +91,7 @@ obj-$(CONFIG_FAIL_FUNCTION) += fail_function.o
  obj-$(CONFIG_KGDB) += debug/
  obj-$(CONFIG_DETECT_HUNG_TASK) += hung_task.o
  obj-$(CONFIG_LOCKUP_DETECTOR) += watchdog.o
+obj-$(CONFIG_HARDLOCKUP_DETECTOR_BUDDY) += watchdog_buddy.o
  obj-$(CONFIG_HARDLOCKUP_DETECTOR_PERF) += watchdog_perf.o
  obj-$(CONFIG_SECCOMP) += seccomp.o
  obj-$(CONFIG_RELAY) += relay.o
diff --git a/kernel/watchdog.c b/kernel/watchdog.c

index e67125f..10947c8 100644 (file)
--- a/kernel/watchdog.c
+++ b/kernel/watchdog.c
@@ -85,7 +85,7 @@ __setup("nmi_watchdog=", hardlockup_panic_setup);
  
  #endif /* CONFIG_HARDLOCKUP_DETECTOR */
  
-#if defined(CONFIG_HARDLOCKUP_DETECTOR_PERF)
+#if defined(CONFIG_HARDLOCKUP_DETECTOR_COUNTS_HRTIMER)
  
  static DEFINE_PER_CPU(atomic_t, hrtimer_interrupts);
  static DEFINE_PER_CPU(int, hrtimer_interrupts_saved);
@@ -106,6 +106,14 @@ notrace void arch_touch_nmi_watchdog(void)
  }
  EXPORT_SYMBOL(arch_touch_nmi_watchdog);
  
+void watchdog_hardlockup_touch_cpu(unsigned int cpu)
+{
+       per_cpu(watchdog_hardlockup_touched, cpu) = true;
+
+       /* Match with smp_rmb() in watchdog_hardlockup_check() */
+       smp_wmb();
+}
+
  static bool is_hardlockup(unsigned int cpu)
  {
         int hrint = atomic_read(&per_cpu(hrtimer_interrupts, cpu));
@@ -123,13 +131,16 @@ static bool is_hardlockup(unsigned int cpu)
         return false;
  }
  
-static void watchdog_hardlockup_kick(void)
+static unsigned long watchdog_hardlockup_kick(void)
  {
-       atomic_inc(raw_cpu_ptr(&hrtimer_interrupts));
+       return atomic_inc_return(raw_cpu_ptr(&hrtimer_interrupts));
  }
  
  void watchdog_hardlockup_check(unsigned int cpu, struct pt_regs *regs)
  {
+       /* Match with smp_wmb() in watchdog_hardlockup_touch_cpu() */
+       smp_rmb();
+
         if (per_cpu(watchdog_hardlockup_touched, cpu)) {
                 per_cpu(watchdog_hardlockup_touched, cpu) = false;
                 return;
@@ -180,11 +191,11 @@ void watchdog_hardlockup_check(unsigned int cpu, struct pt_regs *regs)
         }
  }
  
-#else /* CONFIG_HARDLOCKUP_DETECTOR_PERF */
+#else /* CONFIG_HARDLOCKUP_DETECTOR_COUNTS_HRTIMER */
  
-static inline void watchdog_hardlockup_kick(void) { }
+static inline unsigned long watchdog_hardlockup_kick(void) { return 0; }
  
-#endif /* !CONFIG_HARDLOCKUP_DETECTOR_PERF */
+#endif /* !CONFIG_HARDLOCKUP_DETECTOR_COUNTS_HRTIMER */
  
  /*
   * These functions can be overridden based on the configured hardlockdup detector.
@@ -443,11 +454,15 @@ static enum hrtimer_restart watchdog_timer_fn(struct hrtimer *hrtimer)
         struct pt_regs *regs = get_irq_regs();
         int duration;
         int softlockup_all_cpu_backtrace = sysctl_softlockup_all_cpu_backtrace;
+       unsigned long hrtimer_interrupts;
  
         if (!watchdog_enabled)
                 return HRTIMER_NORESTART;
  
-       watchdog_hardlockup_kick();
+       hrtimer_interrupts = watchdog_hardlockup_kick();
+
+       /* test for hardlockups */
+       watchdog_buddy_check_hardlockup(hrtimer_interrupts);
  
         /* kick the softlockup detector */
         if (completion_done(this_cpu_ptr(&softlockup_completion))) {
diff --git a/kernel/watchdog_buddy.c b/kernel/watchdog_buddy.c

new file mode 100644 (file)

index 0000000..fee45af
--- /dev/null
+++ b/kernel/watchdog_buddy.c
@@ -0,0 +1,93 @@
+// SPDX-License-Identifier: GPL-2.0
+
+#include <linux/cpu.h>
+#include <linux/cpumask.h>
+#include <linux/kernel.h>
+#include <linux/nmi.h>
+#include <linux/percpu-defs.h>
+
+static cpumask_t __read_mostly watchdog_cpus;
+
+static unsigned int watchdog_next_cpu(unsigned int cpu)
+{
+       cpumask_t cpus = watchdog_cpus;
+       unsigned int next_cpu;
+
+       next_cpu = cpumask_next(cpu, &cpus);
+       if (next_cpu >= nr_cpu_ids)
+               next_cpu = cpumask_first(&cpus);
+
+       if (next_cpu == cpu)
+               return nr_cpu_ids;
+
+       return next_cpu;
+}
+
+int __init watchdog_hardlockup_probe(void)
+{
+       return 0;
+}
+
+void watchdog_hardlockup_enable(unsigned int cpu)
+{
+       unsigned int next_cpu;
+
+       /*
+        * The new CPU will be marked online before the hrtimer interrupt
+        * gets a chance to run on it. If another CPU tests for a
+        * hardlockup on the new CPU before it has run its the hrtimer
+        * interrupt, it will get a false positive. Touch the watchdog on
+        * the new CPU to delay the check for at least 3 sampling periods
+        * to guarantee one hrtimer has run on the new CPU.
+        */
+       watchdog_hardlockup_touch_cpu(cpu);
+
+       /*
+        * We are going to check the next CPU. Our watchdog_hrtimer
+        * need not be zero if the CPU has already been online earlier.
+        * Touch the watchdog on the next CPU to avoid false positive
+        * if we try to check it in less then 3 interrupts.
+        */
+       next_cpu = watchdog_next_cpu(cpu);
+       if (next_cpu < nr_cpu_ids)
+               watchdog_hardlockup_touch_cpu(next_cpu);
+
+       cpumask_set_cpu(cpu, &watchdog_cpus);
+}
+
+void watchdog_hardlockup_disable(unsigned int cpu)
+{
+       unsigned int next_cpu = watchdog_next_cpu(cpu);
+
+       /*
+        * Offlining this CPU will cause the CPU before this one to start
+        * checking the one after this one. If this CPU just finished checking
+        * the next CPU and updating hrtimer_interrupts_saved, and then the
+        * previous CPU checks it within one sample period, it will trigger a
+        * false positive. Touch the watchdog on the next CPU to prevent it.
+        */
+       if (next_cpu < nr_cpu_ids)
+               watchdog_hardlockup_touch_cpu(next_cpu);
+
+       cpumask_clear_cpu(cpu, &watchdog_cpus);
+}
+
+void watchdog_buddy_check_hardlockup(unsigned long hrtimer_interrupts)
+{
+       unsigned int next_cpu;
+
+       /*
+        * Test for hardlockups every 3 samples. The sample period is
+        *  watchdog_thresh * 2 / 5, so 3 samples gets us back to slightly over
+        *  watchdog_thresh (over by 20%).
+        */
+       if (hrtimer_interrupts % 3 != 0)
+               return;
+
+       /* check for a hardlockup on the next CPU */
+       next_cpu = watchdog_next_cpu(smp_processor_id());
+       if (next_cpu >= nr_cpu_ids)
+               return;
+
+       watchdog_hardlockup_check(next_cpu, NULL);
+}
diff --git a/lib/Kconfig.debug b/lib/Kconfig.debug

index ce51d4d..abcad05 100644 (file)
--- a/lib/Kconfig.debug
+++ b/lib/Kconfig.debug
@@ -1035,10 +1035,55 @@ config BOOTPARAM_SOFTLOCKUP_PANIC
  
           Say N if unsure.
  
-config HARDLOCKUP_DETECTOR_PERF
+# Both the "perf" and "buddy" hardlockup detectors count hrtimer
+# interrupts. This config enables functions managing this common code.
+config HARDLOCKUP_DETECTOR_COUNTS_HRTIMER
         bool
         select SOFTLOCKUP_DETECTOR
  
+config HARDLOCKUP_DETECTOR_PERF
+       bool
+       depends on HAVE_HARDLOCKUP_DETECTOR_PERF
+       select HARDLOCKUP_DETECTOR_COUNTS_HRTIMER
+
+config HARDLOCKUP_DETECTOR_BUDDY
+       bool
+       depends on SMP
+       select HARDLOCKUP_DETECTOR_COUNTS_HRTIMER
+
+# For hardlockup detectors you can have one directly provided by the arch
+# or use a "non-arch" one. If you're using a "non-arch" one that is
+# further divided the perf hardlockup detector (which, confusingly, needs
+# arch-provided perf support) and the buddy hardlockup detector (which just
+# needs SMP). In either case, using the "non-arch" code conflicts with
+# the NMI watchdog code (which is sometimes used directly and sometimes used
+# by the arch-provided hardlockup detector).
+config HAVE_HARDLOCKUP_DETECTOR_NON_ARCH
+       bool
+       depends on (HAVE_HARDLOCKUP_DETECTOR_PERF || SMP) && !HAVE_NMI_WATCHDOG
+       default y
+
+config HARDLOCKUP_DETECTOR_PREFER_BUDDY
+       bool "Prefer the buddy CPU hardlockup detector"
+       depends on HAVE_HARDLOCKUP_DETECTOR_NON_ARCH && HAVE_HARDLOCKUP_DETECTOR_PERF && SMP
+       help
+         Say Y here to prefer the buddy hardlockup detector over the perf one.
+
+         With the buddy detector, each CPU uses its softlockup hrtimer
+         to check that the next CPU is processing hrtimer interrupts by
+         verifying that a counter is increasing.
+
+         This hardlockup detector is useful on systems that don't have
+         an arch-specific hardlockup detector or if resources needed
+         for the hardlockup detector are better used for other things.
+
+# This will select the appropriate non-arch hardlockdup detector
+config HARDLOCKUP_DETECTOR_NON_ARCH
+       bool
+       depends on HAVE_HARDLOCKUP_DETECTOR_NON_ARCH
+       select HARDLOCKUP_DETECTOR_BUDDY if !HAVE_HARDLOCKUP_DETECTOR_PERF || HARDLOCKUP_DETECTOR_PREFER_BUDDY
+       select HARDLOCKUP_DETECTOR_PERF if HAVE_HARDLOCKUP_DETECTOR_PERF && !HARDLOCKUP_DETECTOR_PREFER_BUDDY
+
  #
  # Enables a timestamp based low pass filter to compensate for perf based
  # hard lockup detection which runs too fast due to turbo modes.
@@ -1053,9 +1098,10 @@ config HARDLOCKUP_CHECK_TIMESTAMP
  config HARDLOCKUP_DETECTOR
         bool "Detect Hard Lockups"
         depends on DEBUG_KERNEL && !S390
-       depends on HAVE_HARDLOCKUP_DETECTOR_PERF || HAVE_HARDLOCKUP_DETECTOR_ARCH
+       depends on HAVE_HARDLOCKUP_DETECTOR_NON_ARCH || HAVE_HARDLOCKUP_DETECTOR_ARCH
         select LOCKUP_DETECTOR
-       select HARDLOCKUP_DETECTOR_PERF if HAVE_HARDLOCKUP_DETECTOR_PERF
+       select HARDLOCKUP_DETECTOR_NON_ARCH if HAVE_HARDLOCKUP_DETECTOR_NON_ARCH
+
         help
           Say Y here to enable the kernel to act as a watchdog to detect
           hard lockups.
author	Douglas Anderson <dianders@chromium.org>
	Fri, 19 May 2023 17:18:38 +0000 (10:18 -0700)
committer	Andrew Morton <akpm@linux-foundation.org>
	Sat, 10 Jun 2023 00:44:21 +0000 (17:44 -0700)
include/linux/nmi.h		patch \| blob \| history
kernel/Makefile		patch \| blob \| history
kernel/watchdog.c		patch \| blob \| history
kernel/watchdog_buddy.c	[new file with mode: 0644]	patch \| blob
lib/Kconfig.debug		patch \| blob \| history