mm: adjust shuffle code to allow for future coalescing

author Alexander Duyck <alexander.h.duyck@linux.intel.com>

Tue, 7 Apr 2020 03:04:45 +0000 (20:04 -0700)

committer Linus Torvalds <torvalds@linux-foundation.org>

Tue, 7 Apr 2020 17:43:38 +0000 (10:43 -0700)
author Alexander Duyck <alexander.h.duyck@linux.intel.com>
Tue, 7 Apr 2020 03:04:45 +0000 (20:04 -0700)
committer Linus Torvalds <torvalds@linux-foundation.org>
Tue, 7 Apr 2020 17:43:38 +0000 (10:43 -0700)
diff --git a/include/linux/mmzone.h b/include/linux/mmzone.h

index e84d448988b6594f67c042111953cc4a0991671d..c023d7968b14d7b8d0de8658a14f8319685fd2db 100644 (file)
--- a/include/linux/mmzone.h
+++ b/include/linux/mmzone.h
@@ -116,18 +116,6 @@ static inline void add_to_free_area_tail(struct page *page, struct free_area *ar
         area->nr_free++;
  }
  
-#ifdef CONFIG_SHUFFLE_PAGE_ALLOCATOR
-/* Used to preserve page allocation order entropy */
-void add_to_free_area_random(struct page *page, struct free_area *area,
-               int migratetype);
-#else
-static inline void add_to_free_area_random(struct page *page,
-               struct free_area *area, int migratetype)
-{
-       add_to_free_area(page, area, migratetype);
-}
-#endif
-
  /* Used for pages which are on another list */
  static inline void move_to_free_area(struct page *page, struct free_area *area,
                              int migratetype)
diff --git a/mm/page_alloc.c b/mm/page_alloc.c

index e5f76da8cd4e753fac9e466a1bd9531b2e0dabca..f2b8cb8f995f389f4c18c2e9c0da5ce531518f9f 100644 (file)
--- a/mm/page_alloc.c
+++ b/mm/page_alloc.c
@@ -864,6 +864,36 @@ compaction_capture(struct capture_control *capc, struct page *page,
  }
  #endif /* CONFIG_COMPACTION */
  
+/*
+ * If this is not the largest possible page, check if the buddy
+ * of the next-highest order is free. If it is, it's possible
+ * that pages are being freed that will coalesce soon. In that
+ * case, return true so the caller adds the free page to the tail
+ * of the list, where it's less likely to be used soon and more
+ * likely to be merged as a higher-order page.
+ */
+static inline bool
+buddy_merge_likely(unsigned long pfn, unsigned long buddy_pfn,
+                  struct page *page, unsigned int order)
+{
+       struct page *higher_page, *higher_buddy;
+       unsigned long combined_pfn;
+
+       if (order >= MAX_ORDER - 2)
+               return false;
+
+       if (!pfn_valid_within(buddy_pfn))
+               return false;
+
+       combined_pfn = buddy_pfn & pfn;
+       higher_page = page + (combined_pfn - pfn);
+       buddy_pfn = __find_buddy_pfn(combined_pfn, order + 1);
+       higher_buddy = higher_page + (buddy_pfn - combined_pfn);
+
+       return pfn_valid_within(buddy_pfn) &&
+              page_is_buddy(higher_page, higher_buddy, order + 1);
+}
+
  /*
   * Freeing function for a buddy system allocator.
   *
@@ -893,11 +923,13 @@ static inline void __free_one_page(struct page *page,
                 struct zone *zone, unsigned int order,
                 int migratetype)
  {
-       unsigned long combined_pfn;
+       struct capture_control *capc = task_capc(zone);
         unsigned long uninitialized_var(buddy_pfn);
-       struct page *buddy;
+       unsigned long combined_pfn;
+       struct free_area *area;
         unsigned int max_order;
-       struct capture_control *capc = task_capc(zone);
+       struct page *buddy;
+       bool to_tail;
  
         max_order = min_t(unsigned int, MAX_ORDER, pageblock_order + 1);
  
@@ -966,35 +998,16 @@ continue_merging:
  done_merging:
         set_page_order(page, order);
  
-       /*
-        * If this is not the largest possible page, check if the buddy
-        * of the next-highest order is free. If it is, it's possible
-        * that pages are being freed that will coalesce soon. In case,
-        * that is happening, add the free page to the tail of the list
-        * so it's less likely to be used soon and more likely to be merged
-        * as a higher order page
-        */
-       if ((order < MAX_ORDER-2) && pfn_valid_within(buddy_pfn)
-                       && !is_shuffle_order(order)) {
-               struct page *higher_page, *higher_buddy;
-               combined_pfn = buddy_pfn & pfn;
-               higher_page = page + (combined_pfn - pfn);
-               buddy_pfn = __find_buddy_pfn(combined_pfn, order + 1);
-               higher_buddy = higher_page + (buddy_pfn - combined_pfn);
-               if (pfn_valid_within(buddy_pfn) &&
-                   page_is_buddy(higher_page, higher_buddy, order + 1)) {
-                       add_to_free_area_tail(page, &zone->free_area[order],
-                                             migratetype);
-                       return;
-               }
-       }
-
+       area = &zone->free_area[order];
         if (is_shuffle_order(order))
-               add_to_free_area_random(page, &zone->free_area[order],
-                               migratetype);
+               to_tail = shuffle_pick_tail();
         else
-               add_to_free_area(page, &zone->free_area[order], migratetype);
+               to_tail = buddy_merge_likely(pfn, buddy_pfn, page, order);
  
+       if (to_tail)
+               add_to_free_area_tail(page, area, migratetype);
+       else
+               add_to_free_area(page, area, migratetype);
  }
  
  /*
diff --git a/mm/shuffle.c b/mm/shuffle.c

index c716059cbd3cca310c88597431ba44c4340362fd..44406d9977c7779ab347dda835608046882569d7 100644 (file)
--- a/mm/shuffle.c
+++ b/mm/shuffle.c
@@ -183,11 +183,11 @@ void __meminit __shuffle_free_memory(pg_data_t *pgdat)
                 shuffle_zone(z);
  }
  
-void add_to_free_area_random(struct page *page, struct free_area *area,
-               int migratetype)
+bool shuffle_pick_tail(void)
  {
         static u64 rand;
         static u8 rand_bits;
+       bool ret;
  
         /*
          * The lack of locking is deliberate. If 2 threads race to
@@ -198,10 +198,10 @@ void add_to_free_area_random(struct page *page, struct free_area *area,
                 rand = get_random_u64();
         }
  
-       if (rand & 1)
-               add_to_free_area(page, area, migratetype);
-       else
-               add_to_free_area_tail(page, area, migratetype);
+       ret = rand & 1;
+
         rand_bits--;
         rand >>= 1;
+
+       return ret;
  }
diff --git a/mm/shuffle.h b/mm/shuffle.h

index 777a257a0d2f9346f10e68db9da34789fd5a3711..4d79f03b6658ff29799a0b3f47c9a5de2d593475 100644 (file)
--- a/mm/shuffle.h
+++ b/mm/shuffle.h
@@ -22,6 +22,7 @@ enum mm_shuffle_ctl {
  DECLARE_STATIC_KEY_FALSE(page_alloc_shuffle_key);
  extern void page_alloc_shuffle(enum mm_shuffle_ctl ctl);
  extern void __shuffle_free_memory(pg_data_t *pgdat);
+extern bool shuffle_pick_tail(void);
  static inline void shuffle_free_memory(pg_data_t *pgdat)
  {
         if (!static_branch_unlikely(&page_alloc_shuffle_key))
@@ -44,6 +45,11 @@ static inline bool is_shuffle_order(int order)
         return order >= SHUFFLE_ORDER;
  }
  #else
+static inline bool shuffle_pick_tail(void)
+{
+       return false;
+}
+
  static inline void shuffle_free_memory(pg_data_t *pgdat)
  {
  }
author	Alexander Duyck <alexander.h.duyck@linux.intel.com>
	Tue, 7 Apr 2020 03:04:45 +0000 (20:04 -0700)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Tue, 7 Apr 2020 17:43:38 +0000 (10:43 -0700)
include/linux/mmzone.h		patch \| blob \| history
mm/page_alloc.c		patch \| blob \| history
mm/shuffle.c		patch \| blob \| history
mm/shuffle.h		patch \| blob \| history