mm: memory-failure: add memory failure stats to sysfs

author Jiaqi Yan <jiaqiyan@google.com>

Fri, 20 Jan 2023 03:46:20 +0000 (03:46 +0000)

committer Andrew Morton <akpm@linux-foundation.org>

Fri, 3 Feb 2023 06:33:28 +0000 (22:33 -0800)
author Jiaqi Yan <jiaqiyan@google.com>
Fri, 20 Jan 2023 03:46:20 +0000 (03:46 +0000)
committer Andrew Morton <akpm@linux-foundation.org>
Fri, 3 Feb 2023 06:33:28 +0000 (22:33 -0800)
diff --git a/drivers/base/node.c b/drivers/base/node.c

index faf3597a96da9d7b9122bda47687038254f2c793..b46db17124f346aff070bf839b606046720b9854 100644 (file)
--- a/drivers/base/node.c
+++ b/drivers/base/node.c
@@ -586,6 +586,9 @@ static const struct attribute_group *node_dev_groups[] = {
         &node_dev_group,
  #ifdef CONFIG_HAVE_ARCH_NODE_DEV_GROUP
         &arch_node_dev_group,
+#endif
+#ifdef CONFIG_MEMORY_FAILURE
+       &memory_failure_attr_group,
  #endif
         NULL
  };
diff --git a/include/linux/mm.h b/include/linux/mm.h

index 836b96e08a143e64cf19c2870e5bc5b79abc4441..c9db257f09b3072facd0b2c31dfe89966c42eec9 100644 (file)
--- a/include/linux/mm.h
+++ b/include/linux/mm.h
@@ -3455,6 +3455,11 @@ enum mf_action_page_type {
         MF_MSG_UNKNOWN,
  };
  
+/*
+ * Sysfs entries for memory failure handling statistics.
+ */
+extern const struct attribute_group memory_failure_attr_group;
+
  #if defined(CONFIG_TRANSPARENT_HUGEPAGE) || defined(CONFIG_HUGETLBFS)
  extern void clear_huge_page(struct page *page,
                             unsigned long addr_hint,
diff --git a/include/linux/mmzone.h b/include/linux/mmzone.h

index 977be526c93928f6ea3409c2c80684ae75601786..9fb1b03b83b2308f5489bd908f774cb83ba537e2 100644 (file)
--- a/include/linux/mmzone.h
+++ b/include/linux/mmzone.h
@@ -1212,6 +1212,31 @@ struct deferred_split {
  };
  #endif
  
+#ifdef CONFIG_MEMORY_FAILURE
+/*
+ * Per NUMA node memory failure handling statistics.
+ */
+struct memory_failure_stats {
+       /*
+        * Number of raw pages poisoned.
+        * Cases not accounted: memory outside kernel control, offline page,
+        * arch-specific memory_failure (SGX), hwpoison_filter() filtered
+        * error events, and unpoison actions from hwpoison_unpoison.
+        */
+       unsigned long total;
+       /*
+        * Recovery results of poisoned raw pages handled by memory_failure,
+        * in sync with mf_result.
+        * total = ignored + failed + delayed + recovered.
+        * sum of total over nodes * PAGE_SIZE = HardwareCorrupted in /proc/meminfo.
+        */
+       unsigned long ignored;
+       unsigned long failed;
+       unsigned long delayed;
+       unsigned long recovered;
+};
+#endif
+
  /*
   * On NUMA machines, each NUMA node would have a pg_data_t to describe
   * it's memory layout. On UMA machines there is a single pglist_data which
@@ -1357,6 +1382,9 @@ typedef struct pglist_data {
  #ifdef CONFIG_NUMA
         struct memory_tier __rcu *memtier;
  #endif
+#ifdef CONFIG_MEMORY_FAILURE
+       struct memory_failure_stats mf_stats;
+#endif
  } pg_data_t;
  
  #define node_present_pages(nid)        (NODE_DATA(nid)->node_present_pages)
diff --git a/mm/memory-failure.c b/mm/memory-failure.c

index 0a382191737f3421a525466647caa216c45bc826..44eec2e93a0b9e3fb23563d04cabd86e014d06dd 100644 (file)
--- a/mm/memory-failure.c
+++ b/mm/memory-failure.c
@@ -87,6 +87,41 @@ inline void num_poisoned_pages_sub(unsigned long pfn, long i)
                 memblk_nr_poison_sub(pfn, i);
  }
  
+/**
+ * MF_ATTR_RO - Define a read-only sysfs attribute for one memory failure stat.
+ * @_name: memory_failure_stats field to show; also names the sysfs file.
+ */
+#define MF_ATTR_RO(_name)                                      \
+static ssize_t _name##_show(struct device *dev,                        \
+                           struct device_attribute *attr,      \
+                           char *buf)                          \
+{                                                              \
+       struct memory_failure_stats *mf_stats =                 \
+               &NODE_DATA(dev->id)->mf_stats;                  \
+       return sysfs_emit(buf, "%lu\n", mf_stats->_name);       \
+}                                                              \
+static DEVICE_ATTR_RO(_name)
+
+MF_ATTR_RO(total);
+MF_ATTR_RO(ignored);
+MF_ATTR_RO(failed);
+MF_ATTR_RO(delayed);
+MF_ATTR_RO(recovered);
+
+static struct attribute *memory_failure_attr[] = {
+       &dev_attr_total.attr,
+       &dev_attr_ignored.attr,
+       &dev_attr_failed.attr,
+       &dev_attr_delayed.attr,
+       &dev_attr_recovered.attr,
+       NULL,
+};
+
+const struct attribute_group memory_failure_attr_group = {
+       .name = "memory_failure",
+       .attrs = memory_failure_attr,
+};
+
  /*
   * Return values:
   *   1:   the page is dissolved (if needed) and taken off from buddy,
author	Jiaqi Yan <jiaqiyan@google.com>
	Fri, 20 Jan 2023 03:46:20 +0000 (03:46 +0000)
committer	Andrew Morton <akpm@linux-foundation.org>
	Fri, 3 Feb 2023 06:33:28 +0000 (22:33 -0800)
drivers/base/node.c		patch \| blob \| history
include/linux/mm.h		patch \| blob \| history
include/linux/mmzone.h		patch \| blob \| history
mm/memory-failure.c		patch \| blob \| history