1 /* SPDX-License-Identifier: GPL-2.0 */
5 #include <linux/gfp_types.h>
7 #include <linux/mmzone.h>
8 #include <linux/topology.h>
9 #include <linux/alloc_tag.h>
10 #include <linux/cleanup.h>
11 #include <linux/sched.h>
13 struct vm_area_struct
;
16 /* Helper macro to avoid gfp flags if they are the default one */
17 #define __default_gfp(a,b,...) b
18 #define default_gfp(...) __default_gfp(,##__VA_ARGS__,GFP_KERNEL)
20 /* Convert GFP flags to their corresponding migrate type */
21 #define GFP_MOVABLE_MASK (__GFP_RECLAIMABLE|__GFP_MOVABLE)
22 #define GFP_MOVABLE_SHIFT 3
24 static inline int gfp_migratetype(const gfp_t gfp_flags
)
26 VM_WARN_ON((gfp_flags
& GFP_MOVABLE_MASK
) == GFP_MOVABLE_MASK
);
27 BUILD_BUG_ON((1UL << GFP_MOVABLE_SHIFT
) != ___GFP_MOVABLE
);
28 BUILD_BUG_ON((___GFP_MOVABLE
>> GFP_MOVABLE_SHIFT
) != MIGRATE_MOVABLE
);
29 BUILD_BUG_ON((___GFP_RECLAIMABLE
>> GFP_MOVABLE_SHIFT
) != MIGRATE_RECLAIMABLE
);
30 BUILD_BUG_ON(((___GFP_MOVABLE
| ___GFP_RECLAIMABLE
) >>
31 GFP_MOVABLE_SHIFT
) != MIGRATE_HIGHATOMIC
);
33 if (unlikely(page_group_by_mobility_disabled
))
34 return MIGRATE_UNMOVABLE
;
36 /* Group based on mobility */
37 return (__force
unsigned long)(gfp_flags
& GFP_MOVABLE_MASK
) >> GFP_MOVABLE_SHIFT
;
39 #undef GFP_MOVABLE_MASK
40 #undef GFP_MOVABLE_SHIFT
42 static inline bool gfpflags_allow_blocking(const gfp_t gfp_flags
)
44 return !!(gfp_flags
& __GFP_DIRECT_RECLAIM
);
47 static inline bool gfpflags_allow_spinning(const gfp_t gfp_flags
)
50 * !__GFP_DIRECT_RECLAIM -> direct claim is not allowed.
51 * !__GFP_KSWAPD_RECLAIM -> it's not safe to wake up kswapd.
52 * All GFP_* flags including GFP_NOWAIT use one or both flags.
53 * alloc_pages_nolock() is the only API that doesn't specify either flag.
55 * This is stronger than GFP_NOWAIT or GFP_ATOMIC because
56 * those are guaranteed to never block on a sleeping lock.
57 * Here we are enforcing that the allocation doesn't ever spin
58 * on any locks (i.e. only trylocks). There is no high level
59 * GFP_$FOO flag for this use in alloc_pages_nolock() as the
60 * regular page allocator doesn't fully support this
63 return !!(gfp_flags
& __GFP_RECLAIM
);
67 #define OPT_ZONE_HIGHMEM ZONE_HIGHMEM
69 #define OPT_ZONE_HIGHMEM ZONE_NORMAL
72 #ifdef CONFIG_ZONE_DMA
73 #define OPT_ZONE_DMA ZONE_DMA
75 #define OPT_ZONE_DMA ZONE_NORMAL
78 #ifdef CONFIG_ZONE_DMA32
79 #define OPT_ZONE_DMA32 ZONE_DMA32
81 #define OPT_ZONE_DMA32 ZONE_NORMAL
85 * GFP_ZONE_TABLE is a word size bitstring that is used for looking up the
86 * zone to use given the lowest 4 bits of gfp_t. Entries are GFP_ZONES_SHIFT
87 * bits long and there are 16 of them to cover all possible combinations of
88 * __GFP_DMA, __GFP_DMA32, __GFP_MOVABLE and __GFP_HIGHMEM.
90 * The zone fallback order is MOVABLE=>HIGHMEM=>NORMAL=>DMA32=>DMA.
91 * But GFP_MOVABLE is not only a zone specifier but also an allocation
92 * policy. Therefore __GFP_MOVABLE plus another zone selector is valid.
93 * Only 1 bit of the lowest 3 bits (DMA,DMA32,HIGHMEM) can be set to "1".
98 * 0x1 => DMA or NORMAL
99 * 0x2 => HIGHMEM or NORMAL
100 * 0x3 => BAD (DMA+HIGHMEM)
101 * 0x4 => DMA32 or NORMAL
102 * 0x5 => BAD (DMA+DMA32)
103 * 0x6 => BAD (HIGHMEM+DMA32)
104 * 0x7 => BAD (HIGHMEM+DMA32+DMA)
105 * 0x8 => NORMAL (MOVABLE+0)
106 * 0x9 => DMA or NORMAL (MOVABLE+DMA)
107 * 0xa => MOVABLE (Movable is valid only if HIGHMEM is set too)
108 * 0xb => BAD (MOVABLE+HIGHMEM+DMA)
109 * 0xc => DMA32 or NORMAL (MOVABLE+DMA32)
110 * 0xd => BAD (MOVABLE+DMA32+DMA)
111 * 0xe => BAD (MOVABLE+DMA32+HIGHMEM)
112 * 0xf => BAD (MOVABLE+DMA32+HIGHMEM+DMA)
114 * GFP_ZONES_SHIFT must be <= 2 on 32 bit platforms.
117 #if defined(CONFIG_ZONE_DEVICE) && (MAX_NR_ZONES-1) <= 4
118 /* ZONE_DEVICE is not a valid GFP zone specifier */
119 #define GFP_ZONES_SHIFT 2
121 #define GFP_ZONES_SHIFT ZONES_SHIFT
124 #if 16 * GFP_ZONES_SHIFT > BITS_PER_LONG
125 #error GFP_ZONES_SHIFT too large to create GFP_ZONE_TABLE integer
128 #define GFP_ZONE_TABLE ( \
129 (ZONE_NORMAL << 0 * GFP_ZONES_SHIFT) \
130 | (OPT_ZONE_DMA << ___GFP_DMA * GFP_ZONES_SHIFT) \
131 | (OPT_ZONE_HIGHMEM << ___GFP_HIGHMEM * GFP_ZONES_SHIFT) \
132 | (OPT_ZONE_DMA32 << ___GFP_DMA32 * GFP_ZONES_SHIFT) \
133 | (ZONE_NORMAL << ___GFP_MOVABLE * GFP_ZONES_SHIFT) \
134 | (OPT_ZONE_DMA << (___GFP_MOVABLE | ___GFP_DMA) * GFP_ZONES_SHIFT) \
135 | (ZONE_MOVABLE << (___GFP_MOVABLE | ___GFP_HIGHMEM) * GFP_ZONES_SHIFT)\
136 | (OPT_ZONE_DMA32 << (___GFP_MOVABLE | ___GFP_DMA32) * GFP_ZONES_SHIFT)\
140 * GFP_ZONE_BAD is a bitmap for all combinations of __GFP_DMA, __GFP_DMA32
141 * __GFP_HIGHMEM and __GFP_MOVABLE that are not permitted. One flag per
142 * entry starting with bit 0. Bit is set if the combination is not
145 #define GFP_ZONE_BAD ( \
146 1 << (___GFP_DMA | ___GFP_HIGHMEM) \
147 | 1 << (___GFP_DMA | ___GFP_DMA32) \
148 | 1 << (___GFP_DMA32 | ___GFP_HIGHMEM) \
149 | 1 << (___GFP_DMA | ___GFP_DMA32 | ___GFP_HIGHMEM) \
150 | 1 << (___GFP_MOVABLE | ___GFP_HIGHMEM | ___GFP_DMA) \
151 | 1 << (___GFP_MOVABLE | ___GFP_DMA32 | ___GFP_DMA) \
152 | 1 << (___GFP_MOVABLE | ___GFP_DMA32 | ___GFP_HIGHMEM) \
153 | 1 << (___GFP_MOVABLE | ___GFP_DMA32 | ___GFP_DMA | ___GFP_HIGHMEM) \
156 static inline enum zone_type
gfp_zone(gfp_t flags
)
159 int bit
= (__force
int) (flags
& GFP_ZONEMASK
);
161 z
= (GFP_ZONE_TABLE
>> (bit
* GFP_ZONES_SHIFT
)) &
162 ((1 << GFP_ZONES_SHIFT
) - 1);
163 VM_BUG_ON((GFP_ZONE_BAD
>> bit
) & 1);
168 * There is only one page-allocator function, and two main namespaces to
169 * it. The alloc_page*() variants return 'struct page *' and as such
170 * can allocate highmem pages, the *get*page*() variants return
171 * virtual kernel addresses to the allocated page(s).
174 static inline int gfp_zonelist(gfp_t flags
)
177 if (unlikely(flags
& __GFP_THISNODE
))
178 return ZONELIST_NOFALLBACK
;
180 return ZONELIST_FALLBACK
;
184 * gfp flag masking for nested internal allocations.
186 * For code that needs to do allocations inside the public allocation API (e.g.
187 * memory allocation tracking code) the allocations need to obey the caller
188 * allocation context constrains to prevent allocation context mismatches (e.g.
189 * GFP_KERNEL allocations in GFP_NOFS contexts) from potential deadlock
192 * It is also assumed that these nested allocations are for internal kernel
193 * object storage purposes only and are not going to be used for DMA, etc. Hence
194 * we strip out all the zone information and leave just the context information
197 * Further, internal allocations must fail before the higher level allocation
198 * can fail, so we must make them fail faster and fail silently. We also don't
199 * want them to deplete emergency reserves. Hence nested allocations must be
200 * prepared for these allocations to fail.
202 static inline gfp_t
gfp_nested_mask(gfp_t flags
)
204 return ((flags
& (GFP_KERNEL
| GFP_ATOMIC
| __GFP_NOLOCKDEP
)) |
205 (__GFP_NORETRY
| __GFP_NOMEMALLOC
| __GFP_NOWARN
));
209 * We get the zone list from the current node and the gfp_mask.
210 * This zone list contains a maximum of MAX_NUMNODES*MAX_NR_ZONES zones.
211 * There are two zonelists per node, one for all zones with memory and
212 * one containing just zones from the node the zonelist belongs to.
214 * For the case of non-NUMA systems the NODE_DATA() gets optimized to
215 * &contig_page_data at compile-time.
217 static inline struct zonelist
*node_zonelist(int nid
, gfp_t flags
)
219 return NODE_DATA(nid
)->node_zonelists
+ gfp_zonelist(flags
);
222 #ifndef HAVE_ARCH_FREE_PAGE
223 static inline void arch_free_page(struct page
*page
, int order
) { }
225 #ifndef HAVE_ARCH_ALLOC_PAGE
226 static inline void arch_alloc_page(struct page
*page
, int order
) { }
229 struct page
*__alloc_pages_noprof(gfp_t gfp
, unsigned int order
, int preferred_nid
,
230 nodemask_t
*nodemask
);
231 #define __alloc_pages(...) alloc_hooks(__alloc_pages_noprof(__VA_ARGS__))
233 struct folio
*__folio_alloc_noprof(gfp_t gfp
, unsigned int order
, int preferred_nid
,
234 nodemask_t
*nodemask
);
235 #define __folio_alloc(...) alloc_hooks(__folio_alloc_noprof(__VA_ARGS__))
237 unsigned long alloc_pages_bulk_noprof(gfp_t gfp
, int preferred_nid
,
238 nodemask_t
*nodemask
, int nr_pages
,
239 struct page
**page_array
);
240 #define __alloc_pages_bulk(...) alloc_hooks(alloc_pages_bulk_noprof(__VA_ARGS__))
242 void free_pages_bulk(struct page
**page_array
, unsigned long nr_pages
);
244 unsigned long alloc_pages_bulk_mempolicy_noprof(gfp_t gfp
,
245 unsigned long nr_pages
,
246 struct page
**page_array
);
247 #define alloc_pages_bulk_mempolicy(...) \
248 alloc_hooks(alloc_pages_bulk_mempolicy_noprof(__VA_ARGS__))
250 /* Bulk allocate order-0 pages */
251 #define alloc_pages_bulk(_gfp, _nr_pages, _page_array) \
252 __alloc_pages_bulk(_gfp, numa_mem_id(), NULL, _nr_pages, _page_array)
254 static inline unsigned long
255 alloc_pages_bulk_node_noprof(gfp_t gfp
, int nid
, unsigned long nr_pages
,
256 struct page
**page_array
)
258 if (nid
== NUMA_NO_NODE
)
261 return alloc_pages_bulk_noprof(gfp
, nid
, NULL
, nr_pages
, page_array
);
264 #define alloc_pages_bulk_node(...) \
265 alloc_hooks(alloc_pages_bulk_node_noprof(__VA_ARGS__))
267 static inline void warn_if_node_offline(int this_node
, gfp_t gfp_mask
)
269 gfp_t warn_gfp
= gfp_mask
& (__GFP_THISNODE
|__GFP_NOWARN
);
271 if (warn_gfp
!= (__GFP_THISNODE
|__GFP_NOWARN
))
274 if (node_online(this_node
))
277 pr_warn("%pGg allocation from offline node %d\n", &gfp_mask
, this_node
);
282 * Allocate pages, preferring the node given as nid. The node must be valid and
283 * online. For more general interface, see alloc_pages_node().
285 static inline struct page
*
286 __alloc_pages_node_noprof(int nid
, gfp_t gfp_mask
, unsigned int order
)
288 VM_BUG_ON(nid
< 0 || nid
>= MAX_NUMNODES
);
289 warn_if_node_offline(nid
, gfp_mask
);
291 return __alloc_pages_noprof(gfp_mask
, order
, nid
, NULL
);
294 #define __alloc_pages_node(...) alloc_hooks(__alloc_pages_node_noprof(__VA_ARGS__))
297 struct folio
*__folio_alloc_node_noprof(gfp_t gfp
, unsigned int order
, int nid
)
299 VM_BUG_ON(nid
< 0 || nid
>= MAX_NUMNODES
);
300 warn_if_node_offline(nid
, gfp
);
302 return __folio_alloc_noprof(gfp
, order
, nid
, NULL
);
305 #define __folio_alloc_node(...) alloc_hooks(__folio_alloc_node_noprof(__VA_ARGS__))
308 * Allocate pages, preferring the node given as nid. When nid == NUMA_NO_NODE,
309 * prefer the current CPU's closest node. Otherwise node must be valid and
312 static inline struct page
*alloc_pages_node_noprof(int nid
, gfp_t gfp_mask
,
315 if (nid
== NUMA_NO_NODE
)
318 return __alloc_pages_node_noprof(nid
, gfp_mask
, order
);
321 #define alloc_pages_node(...) alloc_hooks(alloc_pages_node_noprof(__VA_ARGS__))
324 struct page
*alloc_pages_noprof(gfp_t gfp
, unsigned int order
);
325 struct folio
*folio_alloc_noprof(gfp_t gfp
, unsigned int order
);
326 struct folio
*folio_alloc_mpol_noprof(gfp_t gfp
, unsigned int order
,
327 struct mempolicy
*mpol
, pgoff_t ilx
, int nid
);
328 struct folio
*vma_alloc_folio_noprof(gfp_t gfp
, int order
, struct vm_area_struct
*vma
,
331 static inline struct page
*alloc_pages_noprof(gfp_t gfp_mask
, unsigned int order
)
333 return alloc_pages_node_noprof(numa_node_id(), gfp_mask
, order
);
335 static inline struct folio
*folio_alloc_noprof(gfp_t gfp
, unsigned int order
)
337 return __folio_alloc_node_noprof(gfp
, order
, numa_node_id());
339 static inline struct folio
*folio_alloc_mpol_noprof(gfp_t gfp
, unsigned int order
,
340 struct mempolicy
*mpol
, pgoff_t ilx
, int nid
)
342 return folio_alloc_noprof(gfp
, order
);
344 static inline struct folio
*vma_alloc_folio_noprof(gfp_t gfp
, int order
,
345 struct vm_area_struct
*vma
, unsigned long addr
)
347 return folio_alloc_noprof(gfp
, order
);
351 #define alloc_pages(...) alloc_hooks(alloc_pages_noprof(__VA_ARGS__))
352 #define folio_alloc(...) alloc_hooks(folio_alloc_noprof(__VA_ARGS__))
353 #define folio_alloc_mpol(...) alloc_hooks(folio_alloc_mpol_noprof(__VA_ARGS__))
354 #define vma_alloc_folio(...) alloc_hooks(vma_alloc_folio_noprof(__VA_ARGS__))
356 #define alloc_page(gfp_mask) alloc_pages(gfp_mask, 0)
358 static inline struct page
*alloc_page_vma_noprof(gfp_t gfp
,
359 struct vm_area_struct
*vma
, unsigned long addr
)
361 struct folio
*folio
= vma_alloc_folio_noprof(gfp
, 0, vma
, addr
);
365 #define alloc_page_vma(...) alloc_hooks(alloc_page_vma_noprof(__VA_ARGS__))
367 struct page
*alloc_pages_nolock_noprof(gfp_t gfp_flags
, int nid
, unsigned int order
);
368 #define alloc_pages_nolock(...) alloc_hooks(alloc_pages_nolock_noprof(__VA_ARGS__))
370 extern unsigned long get_free_pages_noprof(gfp_t gfp_mask
, unsigned int order
);
371 #define __get_free_pages(...) alloc_hooks(get_free_pages_noprof(__VA_ARGS__))
373 extern unsigned long get_zeroed_page_noprof(gfp_t gfp_mask
);
374 #define get_zeroed_page(...) alloc_hooks(get_zeroed_page_noprof(__VA_ARGS__))
376 void *alloc_pages_exact_noprof(size_t size
, gfp_t gfp_mask
) __alloc_size(1);
377 #define alloc_pages_exact(...) alloc_hooks(alloc_pages_exact_noprof(__VA_ARGS__))
379 void free_pages_exact(void *virt
, size_t size
);
381 __meminit
void *alloc_pages_exact_nid_noprof(int nid
, size_t size
, gfp_t gfp_mask
) __alloc_size(2);
382 #define alloc_pages_exact_nid(...) \
383 alloc_hooks(alloc_pages_exact_nid_noprof(__VA_ARGS__))
385 #define __get_free_page(gfp_mask) \
386 __get_free_pages((gfp_mask), 0)
388 #define __get_dma_pages(gfp_mask, order) \
389 __get_free_pages((gfp_mask) | GFP_DMA, (order))
391 extern void __free_pages(struct page
*page
, unsigned int order
);
392 extern void free_pages_nolock(struct page
*page
, unsigned int order
);
393 extern void free_pages(unsigned long addr
, unsigned int order
);
395 #define __free_page(page) __free_pages((page), 0)
396 #define free_page(addr) free_pages((addr), 0)
398 void page_alloc_init_cpuhp(void);
399 bool decay_pcp_high(struct zone
*zone
, struct per_cpu_pages
*pcp
);
400 void drain_zone_pages(struct zone
*zone
, struct per_cpu_pages
*pcp
);
401 void drain_all_pages(struct zone
*zone
);
402 void drain_local_pages(struct zone
*zone
);
404 void page_alloc_init_late(void);
405 void setup_pcp_cacheinfo(unsigned int cpu
);
408 * gfp_allowed_mask is set to GFP_BOOT_MASK during early boot to restrict what
409 * GFP flags are used before interrupts are enabled. Once interrupts are
410 * enabled, it is set to __GFP_BITS_MASK while the system is running. During
411 * hibernation, it is used by PM to avoid I/O during memory allocation while
412 * devices are suspended.
414 extern gfp_t gfp_allowed_mask
;
416 /* Returns true if the gfp_mask allows use of ALLOC_NO_WATERMARK */
417 bool gfp_pfmemalloc_allowed(gfp_t gfp_mask
);
419 /* A helper for checking if gfp includes all the specified flags */
420 static inline bool gfp_has_flags(gfp_t gfp
, gfp_t flags
)
422 return (gfp
& flags
) == flags
;
425 static inline bool gfp_has_io_fs(gfp_t gfp
)
427 return gfp_has_flags(gfp
, __GFP_IO
| __GFP_FS
);
431 * Check if the gfp flags allow compaction - GFP_NOIO is a really
432 * tricky context because the migration might require IO.
434 static inline bool gfp_compaction_allowed(gfp_t gfp_mask
)
436 return IS_ENABLED(CONFIG_COMPACTION
) && (gfp_mask
& __GFP_IO
);
439 extern gfp_t
vma_thp_gfp_mask(struct vm_area_struct
*vma
);
441 #ifdef CONFIG_CONTIG_ALLOC
443 typedef unsigned int __bitwise acr_flags_t
;
444 #define ACR_FLAGS_NONE ((__force acr_flags_t)0) // ordinary allocation request
445 #define ACR_FLAGS_CMA ((__force acr_flags_t)BIT(0)) // allocate for CMA
447 /* The below functions must be run on a range from a single zone. */
448 int alloc_contig_frozen_range_noprof(unsigned long start
, unsigned long end
,
449 acr_flags_t alloc_flags
, gfp_t gfp_mask
);
450 #define alloc_contig_frozen_range(...) \
451 alloc_hooks(alloc_contig_frozen_range_noprof(__VA_ARGS__))
453 int alloc_contig_range_noprof(unsigned long start
, unsigned long end
,
454 acr_flags_t alloc_flags
, gfp_t gfp_mask
);
455 #define alloc_contig_range(...) \
456 alloc_hooks(alloc_contig_range_noprof(__VA_ARGS__))
458 struct page
*alloc_contig_frozen_pages_noprof(unsigned long nr_pages
,
459 gfp_t gfp_mask
, int nid
, nodemask_t
*nodemask
);
460 #define alloc_contig_frozen_pages(...) \
461 alloc_hooks(alloc_contig_frozen_pages_noprof(__VA_ARGS__))
463 struct page
*alloc_contig_pages_noprof(unsigned long nr_pages
, gfp_t gfp_mask
,
464 int nid
, nodemask_t
*nodemask
);
465 #define alloc_contig_pages(...) \
466 alloc_hooks(alloc_contig_pages_noprof(__VA_ARGS__))
468 void free_contig_frozen_range(unsigned long pfn
, unsigned long nr_pages
);
469 void free_contig_range(unsigned long pfn
, unsigned long nr_pages
);
472 void __free_contig_range(unsigned long pfn
, unsigned long nr_pages
);
474 DEFINE_FREE(free_page
, void *, free_page((unsigned long)_T
))
476 #endif /* __LINUX_GFP_H */