xref: /linux-6.15/include/linux/memory_hotplug.h (revision 2444172c)
1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef __LINUX_MEMORY_HOTPLUG_H
3 #define __LINUX_MEMORY_HOTPLUG_H
4 
5 #include <linux/mmzone.h>
6 #include <linux/spinlock.h>
7 #include <linux/notifier.h>
8 #include <linux/bug.h>
9 
10 struct page;
11 struct zone;
12 struct pglist_data;
13 struct mem_section;
14 struct memory_group;
15 struct resource;
16 struct vmem_altmap;
17 struct dev_pagemap;
18 
19 #ifdef CONFIG_HAVE_ARCH_NODEDATA_EXTENSION
20 /*
21  * For supporting node-hotadd, we have to allocate a new pgdat.
22  *
23  * If an arch has generic style NODE_DATA(),
24  * node_data[nid] = kzalloc() works well. But it depends on the architecture.
25  *
26  * In general, generic_alloc_nodedata() is used.
27  *
28  */
29 extern pg_data_t *arch_alloc_nodedata(int nid);
30 extern void arch_refresh_nodedata(int nid, pg_data_t *pgdat);
31 
32 #else /* CONFIG_HAVE_ARCH_NODEDATA_EXTENSION */
33 
/* No arch override here: node data allocation goes to the generic helper. */
#define arch_alloc_nodedata(nid) generic_alloc_nodedata(nid)
35 
36 #ifdef CONFIG_NUMA
/*
 * Generic allocation of a pgdat for a node.
 *
 * XXX: node-aware allocation cannot yet be used to take the memory from the
 *	new node itself, because the pgdat for that node has not been
 *	allocated/initialized at this point. Using the new node's own memory
 *	will need more consideration.
 *
 * @nid is accepted for symmetry with arch_alloc_nodedata() but is not used.
 * The allocation size comes from the pg_data_t type, so the macro does not
 * rely on a variable called "pgdat" being in scope at the call site.
 */
#define generic_alloc_nodedata(nid)				\
({								\
	memblock_alloc(sizeof(pg_data_t), SMP_CACHE_BYTES);	\
})
46 
47 extern pg_data_t *node_data[];
48 static inline void arch_refresh_nodedata(int nid, pg_data_t *pgdat)
49 {
50 	node_data[nid] = pgdat;
51 }
52 
53 #else /* !CONFIG_NUMA */
54 
55 /* never called */
56 static inline pg_data_t *generic_alloc_nodedata(int nid)
57 {
58 	BUG();
59 	return NULL;
60 }
61 static inline void arch_refresh_nodedata(int nid, pg_data_t *pgdat)
62 {
63 }
64 #endif /* CONFIG_NUMA */
65 #endif /* CONFIG_HAVE_ARCH_NODEDATA_EXTENSION */
66 
67 #ifdef CONFIG_MEMORY_HOTPLUG
68 struct page *pfn_to_online_page(unsigned long pfn);
69 
/* Operation types controlling the zone type of onlined and offlined memory. */
enum {
	MMOP_OFFLINE		= 0,	/* Offline the memory. */
	MMOP_ONLINE		= 1,	/* Online the memory. Zone depends, see default_zone_for_pfn(). */
	MMOP_ONLINE_KERNEL	= 2,	/* Online the memory to ZONE_NORMAL. */
	MMOP_ONLINE_MOVABLE	= 3,	/* Online the memory to ZONE_MOVABLE. */
};
81 
82 /* Flags for add_memory() and friends to specify memory hotplug details. */
83 typedef int __bitwise mhp_t;
84 
85 /* No special request */
86 #define MHP_NONE		((__force mhp_t)0)
87 /*
88  * Allow merging of the added System RAM resource with adjacent,
89  * mergeable resources. After a successful call to add_memory_resource()
90  * with this flag set, the resource pointer must no longer be used as it
91  * might be stale, or the resource might have changed.
92  */
93 #define MHP_MERGE_RESOURCE	((__force mhp_t)BIT(0))
94 
95 /*
96  * We want memmap (struct page array) to be self contained.
97  * To do so, we will use the beginning of the hot-added range to build
98  * the page tables for the memmap array that describes the entire range.
99  * Only selected architectures support it with SPARSE_VMEMMAP.
100  * This is only a hint, the core kernel can decide to not do this based on
101  * different alignment checks.
102  */
103 #define MHP_MEMMAP_ON_MEMORY   ((__force mhp_t)BIT(1))
104 /*
105  * The nid field specifies a memory group id (mgid) instead. The memory group
106  * implies the node id (nid).
107  */
108 #define MHP_NID_IS_MGID		((__force mhp_t)BIT(2))
109 /*
110  * The hotplugged memory is completely inaccessible while the memory is
111  * offline. The memory provider will handle MEM_PREPARE_ONLINE /
112  * MEM_FINISH_OFFLINE notifications and make the memory accessible.
113  *
114  * This flag is only relevant when used along with MHP_MEMMAP_ON_MEMORY,
115  * because the altmap cannot be written (e.g., poisoned) when adding
116  * memory -- before it is set online.
117  *
118  * This allows for adding memory with an altmap that is not currently
119  * made available by a hypervisor. When onlining that memory, the
120  * hypervisor can be instructed to make that memory available, and
121  * the onlining phase will not require any memory allocations, which is
122  * helpful in low-memory situations.
123  */
124 #define MHP_OFFLINE_INACCESSIBLE	((__force mhp_t)BIT(3))
125 
126 /*
127  * Extended parameters for memory hotplug:
128  * altmap: alternative allocator for memmap array (optional)
129  * pgprot: page protection flags to apply to newly created page tables
130  *	(required)
131  */
132 struct mhp_params {
133 	struct vmem_altmap *altmap;
134 	pgprot_t pgprot;
135 	struct dev_pagemap *pgmap;
136 };
137 
138 bool mhp_range_allowed(u64 start, u64 size, bool need_mapping);
139 struct range mhp_get_pluggable_range(bool need_mapping);
140 
141 /*
142  * Zone resizing functions
143  *
144  * Note: any attempt to resize a zone should has pgdat_resize_lock()
145  * zone_span_writelock() both held. This ensure the size of a zone
146  * can't be changed while pgdat_resize_lock() held.
147  */
148 static inline unsigned zone_span_seqbegin(struct zone *zone)
149 {
150 	return read_seqbegin(&zone->span_seqlock);
151 }
152 static inline int zone_span_seqretry(struct zone *zone, unsigned iv)
153 {
154 	return read_seqretry(&zone->span_seqlock, iv);
155 }
156 static inline void zone_span_writelock(struct zone *zone)
157 {
158 	write_seqlock(&zone->span_seqlock);
159 }
160 static inline void zone_span_writeunlock(struct zone *zone)
161 {
162 	write_sequnlock(&zone->span_seqlock);
163 }
164 static inline void zone_seqlock_init(struct zone *zone)
165 {
166 	seqlock_init(&zone->span_seqlock);
167 }
void adjust_present_page_count(struct page *page, struct memory_group *group,
			       long nr_pages);

/* VM interface that may be used by firmware interface */
int mhp_init_memmap_on_memory(unsigned long pfn, unsigned long nr_pages,
			      struct zone *zone, bool mhp_off_inaccessible);
void mhp_deinit_memmap_on_memory(unsigned long pfn, unsigned long nr_pages);
int online_pages(unsigned long pfn, unsigned long nr_pages,
		 struct zone *zone, struct memory_group *group);
void __offline_isolated_pages(unsigned long start_pfn, unsigned long end_pfn);
179 
/* Signature of a callback invoked with a page and its order. */
typedef void (*online_page_callback_t)(struct page *page, unsigned int order);

void generic_online_page(struct page *page, unsigned int order);
int set_online_page_callback(online_page_callback_t callback);
int restore_online_page_callback(online_page_callback_t callback);
185 
186 extern int try_online_node(int nid);
187 
188 extern int arch_add_memory(int nid, u64 start, u64 size,
189 			   struct mhp_params *params);
190 extern u64 max_mem_size;
191 
192 extern int mhp_online_type_from_str(const char *str);
193 
194 /* Default online_type (MMOP_*) when new memory blocks are added. */
195 extern int mhp_default_online_type;
/* Set if the movable_node boot option was specified. */
extern bool movable_node_enabled;

/* Accessor for movable_node_enabled. */
static inline bool movable_node_is_enabled(void)
{
	return movable_node_enabled;
}
202 
203 extern void arch_remove_memory(u64 start, u64 size, struct vmem_altmap *altmap);
204 extern void __remove_pages(unsigned long start_pfn, unsigned long nr_pages,
205 			   struct vmem_altmap *altmap);
206 
207 /* reasonably generic interface to expand the physical pages */
208 extern int __add_pages(int nid, unsigned long start_pfn, unsigned long nr_pages,
209 		       struct mhp_params *params);
210 
211 #ifndef CONFIG_ARCH_HAS_ADD_PAGES
/*
 * No arch-specific add_pages() (CONFIG_ARCH_HAS_ADD_PAGES is not set):
 * hand all arguments to __add_pages() unchanged and return its result.
 */
static inline int add_pages(int nid, unsigned long start_pfn,
			    unsigned long nr_pages, struct mhp_params *params)
{
	return __add_pages(nid, start_pfn, nr_pages, params);
}
217 #else /* ARCH_HAS_ADD_PAGES */
218 int add_pages(int nid, unsigned long start_pfn, unsigned long nr_pages,
219 	      struct mhp_params *params);
220 #endif /* ARCH_HAS_ADD_PAGES */
221 
222 void get_online_mems(void);
223 void put_online_mems(void);
224 
225 void mem_hotplug_begin(void);
226 void mem_hotplug_done(void);
227 
228 /* See kswapd_is_running() */
229 static inline void pgdat_kswapd_lock(pg_data_t *pgdat)
230 {
231 	mutex_lock(&pgdat->kswapd_lock);
232 }
233 
234 static inline void pgdat_kswapd_unlock(pg_data_t *pgdat)
235 {
236 	mutex_unlock(&pgdat->kswapd_lock);
237 }
238 
239 static inline void pgdat_kswapd_lock_init(pg_data_t *pgdat)
240 {
241 	mutex_init(&pgdat->kswapd_lock);
242 }
243 
244 #else /* ! CONFIG_MEMORY_HOTPLUG */
/*
 * !CONFIG_MEMORY_HOTPLUG variant: evaluates to the struct page for @pfn when
 * pfn_valid() accepts it, and to NULL otherwise.
 *
 * @pfn is copied into a local first so that an argument with side effects
 * (e.g. "pfn++") is evaluated exactly once, matching what callers get from
 * the function of the same name in CONFIG_MEMORY_HOTPLUG builds.
 */
#define pfn_to_online_page(pfn)				\
({							\
	unsigned long ___pfn = (pfn);			\
	struct page *___page = NULL;			\
	if (pfn_valid(___pfn))				\
		___page = pfn_to_page(___pfn);		\
	___page;					\
})
252 
/*
 * !CONFIG_MEMORY_HOTPLUG: the zone span helpers are no-ops; the two
 * read-side helpers always return 0.
 */
static inline unsigned int zone_span_seqbegin(struct zone *zone)
{
	return 0;
}

static inline int zone_span_seqretry(struct zone *zone, unsigned int iv)
{
	return 0;
}

static inline void zone_span_writelock(struct zone *zone)
{
}

static inline void zone_span_writeunlock(struct zone *zone)
{
}

static inline void zone_seqlock_init(struct zone *zone)
{
}
264 
/* !CONFIG_MEMORY_HOTPLUG: nothing to online; always returns 0. */
static inline int try_online_node(int nid)
{
	return 0;
}
269 
/* !CONFIG_MEMORY_HOTPLUG: these four helpers are empty stubs. */
static inline void get_online_mems(void)
{
}

static inline void put_online_mems(void)
{
}

static inline void mem_hotplug_begin(void)
{
}

static inline void mem_hotplug_done(void)
{
}
275 
/* !CONFIG_MEMORY_HOTPLUG: always reports false. */
static inline bool movable_node_is_enabled(void)
{
	return false;
}
280 
281 static inline void pgdat_kswapd_lock(pg_data_t *pgdat) {}
282 static inline void pgdat_kswapd_unlock(pg_data_t *pgdat) {}
283 static inline void pgdat_kswapd_lock_init(pg_data_t *pgdat) {}
284 #endif /* ! CONFIG_MEMORY_HOTPLUG */
285 
286 /*
287  * Keep this declaration outside CONFIG_MEMORY_HOTPLUG as some
288  * platforms might override and use arch_get_mappable_range()
289  * for internal non memory hotplug purposes.
290  */
291 struct range arch_get_mappable_range(void);
292 
293 #if defined(CONFIG_MEMORY_HOTPLUG) || defined(CONFIG_DEFERRED_STRUCT_PAGE_INIT)
294 /*
295  * pgdat resizing functions
296  */
297 static inline
298 void pgdat_resize_lock(struct pglist_data *pgdat, unsigned long *flags)
299 {
300 	spin_lock_irqsave(&pgdat->node_size_lock, *flags);
301 }
302 static inline
303 void pgdat_resize_unlock(struct pglist_data *pgdat, unsigned long *flags)
304 {
305 	spin_unlock_irqrestore(&pgdat->node_size_lock, *flags);
306 }
307 static inline
308 void pgdat_resize_init(struct pglist_data *pgdat)
309 {
310 	spin_lock_init(&pgdat->node_size_lock);
311 }
312 #else /* !(CONFIG_MEMORY_HOTPLUG || CONFIG_DEFERRED_STRUCT_PAGE_INIT) */
/*
 * Stub functions for when hotplug is off: all three do nothing.
 */
static inline void pgdat_resize_lock(struct pglist_data *p, unsigned long *f)
{
}

static inline void pgdat_resize_unlock(struct pglist_data *p, unsigned long *f)
{
}

static inline void pgdat_resize_init(struct pglist_data *pgdat)
{
}
319 #endif /* !(CONFIG_MEMORY_HOTPLUG || CONFIG_DEFERRED_STRUCT_PAGE_INIT) */
320 
321 #ifdef CONFIG_MEMORY_HOTREMOVE
322 
323 extern void try_offline_node(int nid);
324 extern int offline_pages(unsigned long start_pfn, unsigned long nr_pages,
325 			 struct zone *zone, struct memory_group *group);
326 extern int remove_memory(u64 start, u64 size);
327 extern void __remove_memory(u64 start, u64 size);
328 extern int offline_and_remove_memory(u64 start, u64 size);
329 
330 #else
/* !CONFIG_MEMORY_HOTREMOVE: nothing to do. */
static inline void try_offline_node(int nid)
{
}

/* !CONFIG_MEMORY_HOTREMOVE: offlining is unavailable; always -EINVAL. */
static inline int offline_pages(unsigned long start_pfn,
				unsigned long nr_pages,
				struct zone *zone,
				struct memory_group *group)
{
	return -EINVAL;
}
338 
339 static inline int remove_memory(u64 start, u64 size)
340 {
341 	return -EBUSY;
342 }
343 
344 static inline void __remove_memory(u64 start, u64 size) {}
345 #endif /* CONFIG_MEMORY_HOTREMOVE */
346 
347 #ifdef CONFIG_MEMORY_HOTPLUG
348 extern void __ref free_area_init_core_hotplug(struct pglist_data *pgdat);
349 extern int __add_memory(int nid, u64 start, u64 size, mhp_t mhp_flags);
350 extern int add_memory(int nid, u64 start, u64 size, mhp_t mhp_flags);
351 extern int add_memory_resource(int nid, struct resource *resource,
352 			       mhp_t mhp_flags);
353 extern int add_memory_driver_managed(int nid, u64 start, u64 size,
354 				     const char *resource_name,
355 				     mhp_t mhp_flags);
356 extern void move_pfn_range_to_zone(struct zone *zone, unsigned long start_pfn,
357 				   unsigned long nr_pages,
358 				   struct vmem_altmap *altmap, int migratetype);
359 extern void remove_pfn_range_from_zone(struct zone *zone,
360 				       unsigned long start_pfn,
361 				       unsigned long nr_pages);
362 extern int sparse_add_section(int nid, unsigned long pfn,
363 		unsigned long nr_pages, struct vmem_altmap *altmap,
364 		struct dev_pagemap *pgmap);
365 extern void sparse_remove_section(unsigned long pfn, unsigned long nr_pages,
366 				  struct vmem_altmap *altmap);
367 extern struct page *sparse_decode_mem_map(unsigned long coded_mem_map,
368 					  unsigned long pnum);
369 extern struct zone *zone_for_pfn_range(int online_type, int nid,
370 		struct memory_group *group, unsigned long start_pfn,
371 		unsigned long nr_pages);
372 extern int arch_create_linear_mapping(int nid, u64 start, u64 size,
373 				      struct mhp_params *params);
374 void arch_remove_linear_mapping(u64 start, u64 size);
375 #endif /* CONFIG_MEMORY_HOTPLUG */
376 
377 #endif /* __LINUX_MEMORY_HOTPLUG_H */
378