/* SPDX-License-Identifier: GPL-2.0 */
#ifndef __LINUX_MEMORY_HOTPLUG_H
#define __LINUX_MEMORY_HOTPLUG_H

#include <linux/mmzone.h>
#include <linux/spinlock.h>
#include <linux/notifier.h>
#include <linux/bug.h>

struct page;
struct zone;
struct pglist_data;
struct mem_section;
struct memory_group;
struct resource;
struct vmem_altmap;
struct dev_pagemap;

#ifdef CONFIG_HAVE_ARCH_NODEDATA_EXTENSION
/*
 * To support node hot-add, we have to allocate a new pgdat.
 *
 * If an arch uses the generic style NODE_DATA(),
 * node_data[nid] = kzalloc() works well, but it depends on the architecture.
 *
 * In general, generic_alloc_nodedata() is used.
 */
extern pg_data_t *arch_alloc_nodedata(int nid);
extern void arch_refresh_nodedata(int nid, pg_data_t *pgdat);

#else /* CONFIG_HAVE_ARCH_NODEDATA_EXTENSION */

#define arch_alloc_nodedata(nid)	generic_alloc_nodedata(nid)

#ifdef CONFIG_NUMA
/*
 * XXX: node-aware allocation can't be used to pick the new node's own
 * memory at this point, because the pgdat for the new node has not been
 * allocated/initialized yet. Using the new node's memory will require
 * more consideration.
 */
#define generic_alloc_nodedata(nid)				\
({								\
	memblock_alloc(sizeof(pg_data_t), SMP_CACHE_BYTES);	\
})

extern pg_data_t *node_data[];
static inline void arch_refresh_nodedata(int nid, pg_data_t *pgdat)
{
	node_data[nid] = pgdat;
}

#else /* !CONFIG_NUMA */

/* Never called: without NUMA there is no node to hot-add. */
static inline pg_data_t *generic_alloc_nodedata(int nid)
{
	BUG();
	return NULL;
}
static inline void arch_refresh_nodedata(int nid, pg_data_t *pgdat)
{
}
#endif /* CONFIG_NUMA */
#endif /* CONFIG_HAVE_ARCH_NODEDATA_EXTENSION */

#ifdef CONFIG_MEMORY_HOTPLUG
struct page *pfn_to_online_page(unsigned long pfn);

/* Types for controlling the zone of onlined and offlined memory */
enum {
	/* Offline the memory. */
	MMOP_OFFLINE = 0,
	/* Online the memory. Zone depends, see default_zone_for_pfn(). */
	MMOP_ONLINE,
	/* Online the memory to ZONE_NORMAL. */
	MMOP_ONLINE_KERNEL,
	/* Online the memory to ZONE_MOVABLE. */
	MMOP_ONLINE_MOVABLE,
};

/* Flags for add_memory() and friends to specify memory hotplug details. */
typedef int __bitwise mhp_t;

/* No special request */
#define MHP_NONE		((__force mhp_t)0)
/*
 * Allow merging of the added System RAM resource with adjacent,
 * mergeable resources. After a successful call to add_memory_resource()
 * with this flag set, the resource pointer must no longer be used as it
 * might be stale, or the resource might have changed.
 */
#define MHP_MERGE_RESOURCE	((__force mhp_t)BIT(0))

/*
 * We want the memmap (struct page array) to be self-contained.
 * To do so, we will use the beginning of the hot-added range to build
 * the page tables for the memmap array that describes the entire range.
 * Only selected architectures support it with SPARSE_VMEMMAP.
 * This is only a hint, the core kernel can decide to not do this based on
 * different alignment checks.
 */
#define MHP_MEMMAP_ON_MEMORY	((__force mhp_t)BIT(1))
/*
 * The nid field specifies a memory group id (mgid) instead. The memory group
 * implies the node id (nid).
 */
#define MHP_NID_IS_MGID		((__force mhp_t)BIT(2))
/*
 * The hotplugged memory is completely inaccessible while the memory is
 * offline. The memory provider will handle MEM_PREPARE_ONLINE /
 * MEM_FINISH_OFFLINE notifications and make the memory accessible.
 *
 * This flag is only relevant when used along with MHP_MEMMAP_ON_MEMORY,
 * because the altmap cannot be written (e.g., poisoned) when adding
 * memory -- before it is set online.
 *
 * This allows for adding memory with an altmap that is not currently
 * made available by a hypervisor. When onlining that memory, the
 * hypervisor can be instructed to make that memory available, and
 * the onlining phase will not require any memory allocations, which is
 * helpful in low-memory situations.
 */
#define MHP_OFFLINE_INACCESSIBLE	((__force mhp_t)BIT(3))

/*
 * Extended parameters for memory hotplug:
 * altmap: alternative allocator for memmap array (optional)
 * pgprot: page protection flags to apply to newly created page tables
 *	(required)
 * pgmap: struct dev_pagemap attached to this hotplug (optional)
 */
struct mhp_params {
	struct vmem_altmap *altmap;
	pgprot_t pgprot;
	struct dev_pagemap *pgmap;
};
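/*
 * Example: a minimal sketch of how a caller might fill in struct
 * mhp_params before handing a range to arch_add_memory(). The choice of
 * PAGE_KERNEL and the absence of an altmap are illustrative assumptions,
 * not requirements; real callers pick them based on the hotplug request:
 *
 *	struct mhp_params params = {
 *		.pgprot = PAGE_KERNEL,	// required
 *		.altmap = NULL,		// optional memmap allocator
 *	};
 *	int rc = arch_add_memory(nid, start, size, &params);
 */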
bool mhp_range_allowed(u64 start, u64 size, bool need_mapping);
struct range mhp_get_pluggable_range(bool need_mapping);

/*
 * Zone resizing functions
 *
 * Note: any attempt to resize a zone must hold both pgdat_resize_lock()
 * and zone_span_writelock(). This ensures that the size of a zone can't
 * be changed while pgdat_resize_lock() is held.
 */
static inline unsigned zone_span_seqbegin(struct zone *zone)
{
	return read_seqbegin(&zone->span_seqlock);
}
static inline int zone_span_seqretry(struct zone *zone, unsigned iv)
{
	return read_seqretry(&zone->span_seqlock, iv);
}
static inline void zone_span_writelock(struct zone *zone)
{
	write_seqlock(&zone->span_seqlock);
}
static inline void zone_span_writeunlock(struct zone *zone)
{
	write_sequnlock(&zone->span_seqlock);
}
static inline void zone_seqlock_init(struct zone *zone)
{
	seqlock_init(&zone->span_seqlock);
}
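/*
 * Example: the intended read-side pattern for the zone span seqlock
 * above. A reader retries until it observes a consistent span; the
 * local variables are illustrative:
 *
 *	unsigned long start_pfn, nr_pages;
 *	unsigned seq;
 *
 *	do {
 *		seq = zone_span_seqbegin(zone);
 *		start_pfn = zone->zone_start_pfn;
 *		nr_pages = zone->spanned_pages;
 *	} while (zone_span_seqretry(zone, seq));
 */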
extern void adjust_present_page_count(struct page *page,
				      struct memory_group *group,
				      long nr_pages);
/* VM interface that may be used by firmware interfaces */
extern int mhp_init_memmap_on_memory(unsigned long pfn, unsigned long nr_pages,
				     struct zone *zone, bool mhp_off_inaccessible);
extern void mhp_deinit_memmap_on_memory(unsigned long pfn, unsigned long nr_pages);
extern int online_pages(unsigned long pfn, unsigned long nr_pages,
			struct zone *zone, struct memory_group *group);
extern void __offline_isolated_pages(unsigned long start_pfn,
				     unsigned long end_pfn);

typedef void (*online_page_callback_t)(struct page *page, unsigned int order);

extern void generic_online_page(struct page *page, unsigned int order);
extern int set_online_page_callback(online_page_callback_t callback);
extern int restore_online_page_callback(online_page_callback_t callback);

extern int try_online_node(int nid);

extern int arch_add_memory(int nid, u64 start, u64 size,
			   struct mhp_params *params);
extern u64 max_mem_size;

extern int mhp_online_type_from_str(const char *str);

/* Default online_type (MMOP_*) when new memory blocks are added. */
extern int mhp_default_online_type;
/* If the movable_node boot option was specified */
extern bool movable_node_enabled;
static inline bool movable_node_is_enabled(void)
{
	return movable_node_enabled;
}

extern void arch_remove_memory(u64 start, u64 size, struct vmem_altmap *altmap);
extern void __remove_pages(unsigned long start_pfn, unsigned long nr_pages,
			   struct vmem_altmap *altmap);

/* reasonably generic interface to expand the physical pages */
extern int __add_pages(int nid, unsigned long start_pfn, unsigned long nr_pages,
		       struct mhp_params *params);

#ifndef CONFIG_ARCH_HAS_ADD_PAGES
static inline int add_pages(int nid, unsigned long start_pfn,
			    unsigned long nr_pages, struct mhp_params *params)
{
	return __add_pages(nid, start_pfn, nr_pages, params);
}
#else /* CONFIG_ARCH_HAS_ADD_PAGES */
int add_pages(int nid, unsigned long start_pfn, unsigned long nr_pages,
	      struct mhp_params *params);
#endif /* CONFIG_ARCH_HAS_ADD_PAGES */

void get_online_mems(void);
void put_online_mems(void);

void mem_hotplug_begin(void);
void mem_hotplug_done(void);
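/*
 * Example: a minimal sketch of pinning memory hotplug state from a
 * reader. get_online_mems() blocks concurrent memory hot(un)plug, so
 * walking online pages between the calls is safe; the loop body is an
 * illustrative assumption:
 *
 *	get_online_mems();
 *	for (pfn = start_pfn; pfn < end_pfn; pfn++) {
 *		struct page *page = pfn_to_online_page(pfn);
 *
 *		if (page)
 *			inspect_page(page);	// hypothetical helper
 *	}
 *	put_online_mems();
 *
 * Writers use mem_hotplug_begin()/mem_hotplug_done() instead.
 */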
/* See kswapd_is_running() */
static inline void pgdat_kswapd_lock(pg_data_t *pgdat)
{
	mutex_lock(&pgdat->kswapd_lock);
}

static inline void pgdat_kswapd_unlock(pg_data_t *pgdat)
{
	mutex_unlock(&pgdat->kswapd_lock);
}

static inline void pgdat_kswapd_lock_init(pg_data_t *pgdat)
{
	mutex_init(&pgdat->kswapd_lock);
}

#else /* ! CONFIG_MEMORY_HOTPLUG */
#define pfn_to_online_page(pfn)			\
({						\
	struct page *___page = NULL;		\
	if (pfn_valid(pfn))			\
		___page = pfn_to_page(pfn);	\
	___page;				\
})

static inline unsigned zone_span_seqbegin(struct zone *zone)
{
	return 0;
}
static inline int zone_span_seqretry(struct zone *zone, unsigned iv)
{
	return 0;
}
static inline void zone_span_writelock(struct zone *zone) {}
static inline void zone_span_writeunlock(struct zone *zone) {}
static inline void zone_seqlock_init(struct zone *zone) {}

static inline int try_online_node(int nid)
{
	return 0;
}

static inline void get_online_mems(void) {}
static inline void put_online_mems(void) {}

static inline void mem_hotplug_begin(void) {}
static inline void mem_hotplug_done(void) {}

static inline bool movable_node_is_enabled(void)
{
	return false;
}

static inline void pgdat_kswapd_lock(pg_data_t *pgdat) {}
static inline void pgdat_kswapd_unlock(pg_data_t *pgdat) {}
static inline void pgdat_kswapd_lock_init(pg_data_t *pgdat) {}
#endif /* ! CONFIG_MEMORY_HOTPLUG */

/*
 * Keep this declaration outside CONFIG_MEMORY_HOTPLUG as some
 * platforms might override and use arch_get_mappable_range()
 * for internal, non-memory-hotplug purposes.
 */
struct range arch_get_mappable_range(void);

#if defined(CONFIG_MEMORY_HOTPLUG) || defined(CONFIG_DEFERRED_STRUCT_PAGE_INIT)
/*
 * pgdat resizing functions
 */
static inline
void pgdat_resize_lock(struct pglist_data *pgdat, unsigned long *flags)
{
	spin_lock_irqsave(&pgdat->node_size_lock, *flags);
}
static inline
void pgdat_resize_unlock(struct pglist_data *pgdat, unsigned long *flags)
{
	spin_unlock_irqrestore(&pgdat->node_size_lock, *flags);
}
static inline
void pgdat_resize_init(struct pglist_data *pgdat)
{
	spin_lock_init(&pgdat->node_size_lock);
}
#else /* !(CONFIG_MEMORY_HOTPLUG || CONFIG_DEFERRED_STRUCT_PAGE_INIT) */
/*
 * Stub functions for when hotplug is off
 */
static inline void pgdat_resize_lock(struct pglist_data *p, unsigned long *f) {}
static inline void pgdat_resize_unlock(struct pglist_data *p, unsigned long *f) {}
static inline void pgdat_resize_init(struct pglist_data *pgdat) {}
#endif /* !(CONFIG_MEMORY_HOTPLUG || CONFIG_DEFERRED_STRUCT_PAGE_INIT) */

#ifdef CONFIG_MEMORY_HOTREMOVE

extern void try_offline_node(int nid);
extern int offline_pages(unsigned long start_pfn, unsigned long nr_pages,
			 struct zone *zone, struct memory_group *group);
extern int remove_memory(u64 start, u64 size);
extern void __remove_memory(u64 start, u64 size);
extern int offline_and_remove_memory(u64 start, u64 size);

#else
static inline void try_offline_node(int nid) {}

static inline int offline_pages(unsigned long start_pfn, unsigned long nr_pages,
				struct zone *zone, struct memory_group *group)
{
	return -EINVAL;
}

static inline int remove_memory(u64 start, u64 size)
{
	return -EBUSY;
}

static inline void __remove_memory(u64 start, u64 size) {}
#endif /* CONFIG_MEMORY_HOTREMOVE */

#ifdef CONFIG_MEMORY_HOTPLUG
extern void __ref free_area_init_core_hotplug(struct pglist_data *pgdat);
extern int __add_memory(int nid, u64 start, u64 size, mhp_t mhp_flags);
extern int add_memory(int nid, u64 start, u64 size, mhp_t mhp_flags);
extern int add_memory_resource(int nid, struct resource *resource,
			       mhp_t mhp_flags);
extern int add_memory_driver_managed(int nid, u64 start, u64 size,
				     const char *resource_name,
				     mhp_t mhp_flags);
extern void move_pfn_range_to_zone(struct zone *zone, unsigned long start_pfn,
				   unsigned long nr_pages,
				   struct vmem_altmap *altmap, int migratetype);
extern void remove_pfn_range_from_zone(struct zone *zone,
				       unsigned long start_pfn,
				       unsigned long nr_pages);
extern int sparse_add_section(int nid, unsigned long pfn,
			      unsigned long nr_pages, struct vmem_altmap *altmap,
			      struct dev_pagemap *pgmap);
extern void sparse_remove_section(unsigned long pfn, unsigned long nr_pages,
				  struct vmem_altmap *altmap);
extern struct page *sparse_decode_mem_map(unsigned long coded_mem_map,
					  unsigned long pnum);
extern struct zone *zone_for_pfn_range(int online_type, int nid,
				       struct memory_group *group,
				       unsigned long start_pfn,
				       unsigned long nr_pages);
extern int arch_create_linear_mapping(int nid, u64 start, u64 size,
				      struct mhp_params *params);
void arch_remove_linear_mapping(u64 start, u64 size);
#endif /* CONFIG_MEMORY_HOTPLUG */

#endif /* __LINUX_MEMORY_HOTPLUG_H */
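/*
 * Example: a hedged end-to-end sketch of driver-managed hotplug using the
 * interfaces declared above. The nid, start, size, and resource name are
 * illustrative, error handling is elided, and offline_and_remove_memory()
 * requires CONFIG_MEMORY_HOTREMOVE:
 *
 *	rc = add_memory_driver_managed(nid, start, size,
 *				       "System RAM (example)", MHP_NONE);
 *	// ... memory blocks are onlined via sysfs/udev or the
 *	// mhp_default_online_type policy ...
 *	rc = offline_and_remove_memory(start, size);
 */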