mm/hugetlb: use separate nodemask for bootmem allocations
Author:     Frank van der Linden <fvdl@google.com>
AuthorDate: Wed, 2 Apr 2025 20:56:13 +0000 (20:56 +0000)
Commit:     Andrew Morton <akpm@linux-foundation.org>
CommitDate: Tue, 13 May 2025 06:50:35 +0000 (23:50 -0700)
Hugetlb boot allocation has used online nodes for allocation since commit
de55996d7188 ("mm/hugetlb: use online nodes for bootmem allocation").
This was needed to be able to do the allocations earlier in boot, before
N_MEMORY was set.

This might lead to a different distribution of gigantic hugepages across
NUMA nodes if there are memoryless nodes in the system.

What happens is that the memoryless nodes are tried, but then the memblock
allocation fails there and falls back, which usually means that the node
with the highest available physical address will be used (top-down
allocation).  While this still ends up with the same total number of
hugetlb pages, they might not be distributed across nodes in the same way:
the fallback for each memoryless node might not come from the same node
that the round-robin allocation across N_MEMORY nodes would have picked.

While administrators who rely on having a specific number of hugepages per
node should use the hugepages=N:X syntax, it's better not to change the
old behavior for the plain hugepages=N case.
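
For illustration (node numbers and counts below are made up), the two
forms on the kernel command line look like:

    default_hugepagesz=1G hugepagesz=1G hugepages=4          (4 pages, spread round-robin)
    default_hugepagesz=1G hugepagesz=1G hugepages=0:2,1:2    (2 pages on node 0, 2 on node 1)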

To do this, construct a nodemask for hugetlb bootmem purposes only,
containing nodes that have memory.  Then use that for round-robin bootmem
allocations.
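
In code terms, a condensed sketch of that construction (the real version
is hugetlb_bootmem_set_nodes() in the diff below):

	/* mark every node that contributes at least one memblock range */
	for_each_mem_pfn_range(i, MAX_NUMNODES, &start_pfn, &end_pfn, &nid)
		if (end_pfn > start_pfn)	/* node actually has memory */
			node_set(nid, hugetlb_bootmem_nodes);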

This saves some cycles.  As an added advantage, hugetlb_cma can use the
same nodemask, which avoids the older issue of pointlessly trying to
create a CMA area for memoryless nodes (which also made the per-node CMA
area size too small, since the requested total was divided across all
online nodes).
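
As an illustration (numbers are made up): with hugetlb_cma=3G on a machine
with four online nodes of which one is memoryless, the old code divided
the total by nr_online_nodes and tried to reserve 768 MiB on each of the
four nodes, including the memoryless one where the reservation cannot
succeed; with the bootmem nodemask the total is divided by the three nodes
that actually have memory, giving 1 GiB per node.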

Link: https://lkml.kernel.org/r/20250402205613.3086864-1-fvdl@google.com
Fixes: de55996d7188 ("mm/hugetlb: use online nodes for bootmem allocation")
Signed-off-by: Frank van der Linden <fvdl@google.com>
Reviewed-by: Oscar Salvador <osalvador@suse.de>
Reviewed-by: Luiz Capitulino <luizcap@redhat.com>
Cc: David Hildenbrand <david@redhat.com>
Cc: Muchun Song <muchun.song@linux.dev>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
include/linux/hugetlb.h
mm/hugetlb.c
mm/hugetlb_cma.c

diff --git a/include/linux/hugetlb.h b/include/linux/hugetlb.h
index a57bed83c657b1bd95f68ccd1b896a4279c6af6a..23ebf49c5d6a4025f73cc1fcf73305fa81d7e61a 100644
--- a/include/linux/hugetlb.h
+++ b/include/linux/hugetlb.h
@@ -14,6 +14,7 @@
 #include <linux/pgtable.h>
 #include <linux/gfp.h>
 #include <linux/userfaultfd_k.h>
+#include <linux/nodemask.h>
 
 struct ctl_table;
 struct user_struct;
@@ -176,6 +177,8 @@ extern struct list_head huge_boot_pages[MAX_NUMNODES];
 
 void hugetlb_bootmem_alloc(void);
 bool hugetlb_bootmem_allocated(void);
+extern nodemask_t hugetlb_bootmem_nodes;
+void hugetlb_bootmem_set_nodes(void);
 
 /* arch callbacks */
 
diff --git a/mm/hugetlb.c b/mm/hugetlb.c
index 351254ad6ef87a328e6d7fbf12dc4df821253373..0057d1f1dc9a703568e1741f2afa95ea49fb35e5 100644
--- a/mm/hugetlb.c
+++ b/mm/hugetlb.c
@@ -58,6 +58,7 @@ int hugetlb_max_hstate __read_mostly;
 unsigned int default_hstate_idx;
 struct hstate hstates[HUGE_MAX_HSTATE];
 
+__initdata nodemask_t hugetlb_bootmem_nodes;
 __initdata struct list_head huge_boot_pages[MAX_NUMNODES];
 static unsigned long hstate_boot_nrinvalid[HUGE_MAX_HSTATE] __initdata;
 
@@ -3219,7 +3220,8 @@ int __alloc_bootmem_huge_page(struct hstate *h, int nid)
        }
 
        /* allocate from next node when distributing huge pages */
-       for_each_node_mask_to_alloc(&h->next_nid_to_alloc, nr_nodes, node, &node_states[N_ONLINE]) {
+       for_each_node_mask_to_alloc(&h->next_nid_to_alloc, nr_nodes, node,
+                                   &hugetlb_bootmem_nodes) {
                m = alloc_bootmem(h, node, false);
                if (!m)
                        return 0;
@@ -3683,6 +3685,15 @@ static void __init hugetlb_init_hstates(void)
        struct hstate *h, *h2;
 
        for_each_hstate(h) {
+               /*
+                * Always reset to first_memory_node here, even if
+                * next_nid_to_alloc was set before - we can't
+                * reference hugetlb_bootmem_nodes after init, and
+                * first_memory_node is right for all further allocations.
+                */
+               h->next_nid_to_alloc = first_memory_node;
+               h->next_nid_to_free = first_memory_node;
+
                /* oversize hugepages were init'ed in early boot */
                if (!hstate_is_gigantic(h))
                        hugetlb_hstate_alloc_pages(h);
@@ -4995,6 +5006,20 @@ static int __init default_hugepagesz_setup(char *s)
 }
 hugetlb_early_param("default_hugepagesz", default_hugepagesz_setup);
 
+void __init hugetlb_bootmem_set_nodes(void)
+{
+       int i, nid;
+       unsigned long start_pfn, end_pfn;
+
+       if (!nodes_empty(hugetlb_bootmem_nodes))
+               return;
+
+       for_each_mem_pfn_range(i, MAX_NUMNODES, &start_pfn, &end_pfn, &nid) {
+               if (end_pfn > start_pfn)
+                       node_set(nid, hugetlb_bootmem_nodes);
+       }
+}
+
 static bool __hugetlb_bootmem_allocated __initdata;
 
 bool __init hugetlb_bootmem_allocated(void)
@@ -5010,6 +5035,8 @@ void __init hugetlb_bootmem_alloc(void)
        if (__hugetlb_bootmem_allocated)
                return;
 
+       hugetlb_bootmem_set_nodes();
+
        for (i = 0; i < MAX_NUMNODES; i++)
                INIT_LIST_HEAD(&huge_boot_pages[i]);
 
@@ -5017,7 +5044,6 @@ void __init hugetlb_bootmem_alloc(void)
 
        for_each_hstate(h) {
                h->next_nid_to_alloc = first_online_node;
-               h->next_nid_to_free = first_online_node;
 
                if (hstate_is_gigantic(h))
                        hugetlb_hstate_alloc_pages(h);
diff --git a/mm/hugetlb_cma.c b/mm/hugetlb_cma.c
index e0f2d5c3a84c24a9ff3fd2b6931ed9b3f8daae23..f58ef4969e7a1c57a1ab818cc52343d7b00c26fa 100644
--- a/mm/hugetlb_cma.c
+++ b/mm/hugetlb_cma.c
@@ -66,7 +66,7 @@ hugetlb_cma_alloc_bootmem(struct hstate *h, int *nid, bool node_exact)
                if (node_exact)
                        return NULL;
 
-               for_each_online_node(node) {
+               for_each_node_mask(node, hugetlb_bootmem_nodes) {
                        cma = hugetlb_cma[node];
                        if (!cma || node == *nid)
                                continue;
@@ -153,11 +153,13 @@ void __init hugetlb_cma_reserve(int order)
        if (!hugetlb_cma_size)
                return;
 
+       hugetlb_bootmem_set_nodes();
+
        for (nid = 0; nid < MAX_NUMNODES; nid++) {
                if (hugetlb_cma_size_in_node[nid] == 0)
                        continue;
 
-               if (!node_online(nid)) {
+               if (!node_isset(nid, hugetlb_bootmem_nodes)) {
                        pr_warn("hugetlb_cma: invalid node %d specified\n", nid);
                        hugetlb_cma_size -= hugetlb_cma_size_in_node[nid];
                        hugetlb_cma_size_in_node[nid] = 0;
@@ -190,13 +192,14 @@ void __init hugetlb_cma_reserve(int order)
                 * If 3 GB area is requested on a machine with 4 numa nodes,
                 * let's allocate 1 GB on first three nodes and ignore the last one.
                 */
-               per_node = DIV_ROUND_UP(hugetlb_cma_size, nr_online_nodes);
+               per_node = DIV_ROUND_UP(hugetlb_cma_size,
+                                       nodes_weight(hugetlb_bootmem_nodes));
                pr_info("hugetlb_cma: reserve %lu MiB, up to %lu MiB per node\n",
                        hugetlb_cma_size / SZ_1M, per_node / SZ_1M);
        }
 
        reserved = 0;
-       for_each_online_node(nid) {
+       for_each_node_mask(nid, hugetlb_bootmem_nodes) {
                int res;
                char name[CMA_MAX_NAME];