mm: add CONFIG_PAGE_BLOCK_ORDER to select page block order

author Juan Yescas <jyescas@google.com>

Wed, 21 May 2025 21:57:45 +0000 (14:57 -0700)

committer Andrew Morton <akpm@linux-foundation.org>

Sun, 1 Jun 2025 05:46:13 +0000 (22:46 -0700)
author Juan Yescas <jyescas@google.com>
Wed, 21 May 2025 21:57:45 +0000 (14:57 -0700)
committer Andrew Morton <akpm@linux-foundation.org>
Sun, 1 Jun 2025 05:46:13 +0000 (22:46 -0700)
diff --git a/include/linux/mmzone.h b/include/linux/mmzone.h

index b19a98c20de8a47a0f1f626128442fd91c0f2f4a..87a667533d6d44ddb7e8f1d817d06ec072a7bfa9 100644 (file)
--- a/include/linux/mmzone.h
+++ b/include/linux/mmzone.h
@@ -37,6 +37,22 @@
  
  #define NR_PAGE_ORDERS (MAX_PAGE_ORDER + 1)
  
+/* Defines the order for the number of pages that have a migrate type. */
+#ifndef CONFIG_PAGE_BLOCK_ORDER
+#define PAGE_BLOCK_ORDER MAX_PAGE_ORDER
+#else
+#define PAGE_BLOCK_ORDER CONFIG_PAGE_BLOCK_ORDER
+#endif /* CONFIG_PAGE_BLOCK_ORDER */
+
+/*
+ * MAX_PAGE_ORDER, which defines the max order of pages to be allocated
+ * by the buddy allocator, has to be larger than or equal to PAGE_BLOCK_ORDER,
+ * which defines the order for the number of pages that can have a migrate type.
+ */
+#if (PAGE_BLOCK_ORDER > MAX_PAGE_ORDER)
+#error MAX_PAGE_ORDER must be >= PAGE_BLOCK_ORDER
+#endif
+
  /*
   * PAGE_ALLOC_COSTLY_ORDER is the order at which allocations are deemed
   * costly to service.  That is between allocation orders which should
diff --git a/include/linux/pageblock-flags.h b/include/linux/pageblock-flags.h

index fc6b9c87cb0a8c9f44326d4739b9bff98c5e0d65..e73a4292ef02e318019cf046187281411f01ec6a 100644 (file)
--- a/include/linux/pageblock-flags.h
+++ b/include/linux/pageblock-flags.h
@@ -41,18 +41,18 @@ extern unsigned int pageblock_order;
   * Huge pages are a constant size, but don't exceed the maximum allocation
   * granularity.
   */
-#define pageblock_order                MIN_T(unsigned int, HUGETLB_PAGE_ORDER, MAX_PAGE_ORDER)
+#define pageblock_order                MIN_T(unsigned int, HUGETLB_PAGE_ORDER, PAGE_BLOCK_ORDER)
  
  #endif /* CONFIG_HUGETLB_PAGE_SIZE_VARIABLE */
  
  #elif defined(CONFIG_TRANSPARENT_HUGEPAGE)
  
-#define pageblock_order                MIN_T(unsigned int, HPAGE_PMD_ORDER, MAX_PAGE_ORDER)
+#define pageblock_order                MIN_T(unsigned int, HPAGE_PMD_ORDER, PAGE_BLOCK_ORDER)
  
  #else /* CONFIG_TRANSPARENT_HUGEPAGE */
  
-/* If huge pages are not used, group by MAX_ORDER_NR_PAGES */
-#define pageblock_order                MAX_PAGE_ORDER
+/* If huge pages are not used, group by PAGE_BLOCK_ORDER */
+#define pageblock_order                PAGE_BLOCK_ORDER
  
  #endif /* CONFIG_HUGETLB_PAGE */
  
diff --git a/mm/Kconfig b/mm/Kconfig

index bd08e151fa1bc51b6535bbc9c793ec55639a6f58..f8bb8f070d0d8f47e5dd15205af9bcfbcf7177c9 100644 (file)
--- a/mm/Kconfig
+++ b/mm/Kconfig
@@ -993,6 +993,40 @@ config CMA_AREAS
  
           If unsure, leave the default value "8" in UMA and "20" in NUMA.
  
+#
+# Select this config option from the architecture Kconfig, if available, to set
+# the max page order for physically contiguous allocations.
+#
+config ARCH_FORCE_MAX_ORDER
+       int
+
+#
+# When ARCH_FORCE_MAX_ORDER is not defined,
+# the default page block order is MAX_PAGE_ORDER (10) as per
+# include/linux/mmzone.h.
+#
+config PAGE_BLOCK_ORDER
+       int "Page Block Order"
+       range 1 10 if ARCH_FORCE_MAX_ORDER = 0
+       default 10 if ARCH_FORCE_MAX_ORDER = 0
+       range 1 ARCH_FORCE_MAX_ORDER if ARCH_FORCE_MAX_ORDER != 0
+       default ARCH_FORCE_MAX_ORDER if ARCH_FORCE_MAX_ORDER != 0
+       help
+         The page block order refers to the power of two number of pages that
+         are physically contiguous and can have a migrate type associated with
+         them. The maximum size of the page block order is limited by
+         ARCH_FORCE_MAX_ORDER.
+
+         This config allows overriding the default page block order when the
+         page block order is required to be smaller than ARCH_FORCE_MAX_ORDER
+         or MAX_PAGE_ORDER.
+
+         Reducing pageblock order can negatively impact THP generation
+         success rate. If your workloads use THP heavily, please use this
+         option with caution.
+
+         Don't change if unsure.
+
  config MEM_SOFT_DIRTY
         bool "Track memory changes"
         depends on CHECKPOINT_RESTORE && HAVE_ARCH_SOFT_DIRTY && PROC_FS
diff --git a/mm/mm_init.c b/mm/mm_init.c

index 1c5444e188f829d9003bdf2b48f12ee10673e328..8684fa851b84f12eedfab30006a772520d38be17 100644 (file)
--- a/mm/mm_init.c
+++ b/mm/mm_init.c
@@ -1509,7 +1509,7 @@ static inline void setup_usemap(struct zone *zone) {}
  /* Initialise the number of pages represented by NR_PAGEBLOCK_BITS */
  void __init set_pageblock_order(void)
  {
-       unsigned int order = MAX_PAGE_ORDER;
+       unsigned int order = PAGE_BLOCK_ORDER;
  
         /* Check that pageblock_nr_pages has not already been setup */
         if (pageblock_order)
author	Juan Yescas <jyescas@google.com>
	Wed, 21 May 2025 21:57:45 +0000 (14:57 -0700)
committer	Andrew Morton <akpm@linux-foundation.org>
	Sun, 1 Jun 2025 05:46:13 +0000 (22:46 -0700)
include/linux/mmzone.h		patch \| blob \| blame \| history
include/linux/pageblock-flags.h		patch \| blob \| blame \| history
mm/Kconfig		patch \| blob \| blame \| history
mm/mm_init.c		patch \| blob \| blame \| history