/* SPDX-License-Identifier: GPL-2.0 */
#ifndef __LINUX_MEMORY_HOTPLUG_H
#define __LINUX_MEMORY_HOTPLUG_H

#include <linux/mmzone.h>
#include <linux/spinlock.h>
#include <linux/notifier.h>
#include <linux/bug.h>

struct page;
struct zone;
struct pglist_data;
struct mem_section;
struct memory_group;
struct resource;
struct vmem_altmap;
struct dev_pagemap;

#ifdef CONFIG_HAVE_ARCH_NODEDATA_EXTENSION
/*
 * To support node hot-add, we have to allocate a new pgdat.
 *
 * If an architecture uses the generic NODE_DATA() style,
 * node_data[nid] = kzalloc() works, but whether that is appropriate
 * depends on the architecture.
 *
 * In general, generic_alloc_nodedata() is used.
 */
extern pg_data_t *arch_alloc_nodedata(int nid);
extern void arch_refresh_nodedata(int nid, pg_data_t *pgdat);
#else /* CONFIG_HAVE_ARCH_NODEDATA_EXTENSION */

#define arch_alloc_nodedata(nid)	generic_alloc_nodedata(nid)

#ifdef CONFIG_NUMA
/*
 * XXX: node-aware allocation cannot be used to get the new node's memory
 * at this point, because the pgdat for the new node has not been
 * allocated/initialized yet. Using the new node's own memory will require
 * further work.
 */
#define generic_alloc_nodedata(nid)					\
({									\
	memblock_alloc(sizeof(pg_data_t), SMP_CACHE_BYTES);		\
})

extern pg_data_t *node_data[];
static inline void arch_refresh_nodedata(int nid, pg_data_t *pgdat)
{
	node_data[nid] = pgdat;
}
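
/*
 * Illustrative sketch (not part of this header's API surface): a node
 * hot-add path is expected to allocate the pgdat and then publish it,
 * roughly:
 *
 *	pg_data_t *pgdat = arch_alloc_nodedata(nid);
 *
 *	if (!pgdat)
 *		return -ENOMEM;
 *	arch_refresh_nodedata(nid, pgdat);
 */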

#else /* !CONFIG_NUMA */

/* never called */
static inline pg_data_t *generic_alloc_nodedata(int nid)
{
	BUG();
	return NULL;
}
static inline void arch_refresh_nodedata(int nid, pg_data_t *pgdat)
{
}
#endif /* CONFIG_NUMA */
#endif /* CONFIG_HAVE_ARCH_NODEDATA_EXTENSION */

#ifdef CONFIG_MEMORY_HOTPLUG
struct page *pfn_to_online_page(unsigned long pfn);
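
/*
 * Typical (illustrative) use of pfn_to_online_page() when walking a pfn
 * range: only online pages have a "struct page" that is fully initialized
 * and safe to dereference, so everything else is skipped:
 *
 *	for (pfn = start_pfn; pfn < end_pfn; pfn++) {
 *		struct page *page = pfn_to_online_page(pfn);
 *
 *		if (!page)
 *			continue;
 *		inspect_page(page);	// hypothetical helper
 *	}
 */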

/* Modes controlling the zone type of onlined and offlined memory */
enum {
	/* Offline the memory. */
	MMOP_OFFLINE = 0,
	/* Online the memory. Zone depends, see default_zone_for_pfn(). */
	MMOP_ONLINE,
	/* Online the memory to ZONE_NORMAL. */
	MMOP_ONLINE_KERNEL,
	/* Online the memory to ZONE_MOVABLE. */
	MMOP_ONLINE_MOVABLE,
};
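
/*
 * For reference (illustrative), these modes correspond to the strings
 * accepted by the memory block "state" sysfs attribute: "offline",
 * "online", "online_kernel" and "online_movable". For example:
 *
 *	if (mhp_online_type_from_str("online_movable") == MMOP_ONLINE_MOVABLE)
 *		// the caller requested ZONE_MOVABLE onlining
 *
 * See mhp_online_type_from_str() below.
 */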

/* Flags for add_memory() and friends to specify memory hotplug details. */
typedef int __bitwise mhp_t;

/* No special request */
#define MHP_NONE		((__force mhp_t)0)
/*
 * Allow merging of the added System RAM resource with adjacent,
 * mergeable resources. After a successful call to add_memory_resource()
 * with this flag set, the resource pointer must no longer be used as it
 * might be stale, or the resource might have changed.
 */
#define MHP_MERGE_RESOURCE	((__force mhp_t)BIT(0))

/*
 * We want the memmap (struct page array) to be self-contained.
 * To do so, we will use the beginning of the hot-added range to build
 * the page tables for the memmap array that describes the entire range.
 * Only selected architectures support it with SPARSE_VMEMMAP.
 * This is only a hint; the core kernel may still decide against it,
 * e.g. when the range fails its alignment checks.
 */
#define MHP_MEMMAP_ON_MEMORY	((__force mhp_t)BIT(1))
/*
 * The nid field specifies a memory group id (mgid) instead. The memory group
 * implies the node id (nid).
 */
#define MHP_NID_IS_MGID		((__force mhp_t)BIT(2))
/*
 * The hotplugged memory is completely inaccessible while the memory is
 * offline. The memory provider will handle MEM_PREPARE_ONLINE /
 * MEM_FINISH_OFFLINE notifications and make the memory accessible.
 *
 * This flag is only relevant when used along with MHP_MEMMAP_ON_MEMORY,
 * because the altmap cannot be written (e.g., poisoned) when adding
 * memory -- before it is set online.
 *
 * This allows for adding memory with an altmap that is not currently
 * made available by a hypervisor. When onlining that memory, the
 * hypervisor can be instructed to make that memory available, and
 * the onlining phase will not require any memory allocations, which is
 * helpful in low-memory situations.
 */
#define MHP_OFFLINE_INACCESSIBLE	((__force mhp_t)BIT(3))
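
/*
 * Illustrative sketch: a driver hot-adding memory with a self-hosted
 * memmap might combine the flags above, assuming the range passes the
 * kernel's size/alignment checks and mhp_supports_memmap_on_memory()
 * returns true:
 *
 *	mhp_t flags = MHP_MEMMAP_ON_MEMORY | MHP_MERGE_RESOURCE;
 *	int rc = add_memory(nid, start, size, flags);
 */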

/*
 * Extended parameters for memory hotplug:
 * altmap: alternative allocator for memmap array (optional)
 * pgprot: page protection flags to apply to newly created page tables
 *	(required)
 * pgmap: device page map backing ZONE_DEVICE memory, if any (optional)
 */
struct mhp_params {
	struct vmem_altmap *altmap;
	pgprot_t pgprot;
	struct dev_pagemap *pgmap;
};
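
/*
 * Minimal (illustrative) initialization: only pgprot is required, so a
 * caller adding ordinary System RAM with no altmap might use:
 *
 *	struct mhp_params params = { .pgprot = PAGE_KERNEL };
 *
 *	rc = arch_add_memory(nid, start, size, &params);
 */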

bool mhp_range_allowed(u64 start, u64 size, bool need_mapping);
struct range mhp_get_pluggable_range(bool need_mapping);
bool mhp_supports_memmap_on_memory(void);
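
/*
 * Illustrative sketch: validating a candidate range before adding it.
 * "need_mapping" is true when the memory must be covered by the kernel's
 * linear mapping:
 *
 *	struct range r = mhp_get_pluggable_range(true);
 *
 *	if (!mhp_range_allowed(start, size, true))
 *		pr_err("range outside [%#llx..%#llx]\n", r.start, r.end);
 */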

/*
 * Zone resizing functions
 *
 * Note: any attempt to resize a zone must hold both pgdat_resize_lock()
 * and zone_span_writelock(). This ensures the size of a zone cannot
 * change while pgdat_resize_lock() is held.
 */
static inline unsigned zone_span_seqbegin(struct zone *zone)
{
	return read_seqbegin(&zone->span_seqlock);
}
static inline int zone_span_seqretry(struct zone *zone, unsigned iv)
{
	return read_seqretry(&zone->span_seqlock, iv);
}
static inline void zone_span_writelock(struct zone *zone)
{
	write_seqlock(&zone->span_seqlock);
}
static inline void zone_span_writeunlock(struct zone *zone)
{
	write_sequnlock(&zone->span_seqlock);
}
static inline void zone_seqlock_init(struct zone *zone)
{
	seqlock_init(&zone->span_seqlock);
}
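
/*
 * Illustrative reader-side pattern: sample a zone's span consistently
 * against a concurrent resize, mirroring how the page allocator's zone
 * boundary checks use these helpers:
 *
 *	unsigned int seq;
 *	unsigned long start_pfn, spanned;
 *
 *	do {
 *		seq = zone_span_seqbegin(zone);
 *		start_pfn = zone->zone_start_pfn;
 *		spanned = zone->spanned_pages;
 *	} while (zone_span_seqretry(zone, seq));
 */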
extern void adjust_present_page_count(struct page *page,
				      struct memory_group *group,
				      long nr_pages);
/* VM interface that may be used by firmware interface */
extern int mhp_init_memmap_on_memory(unsigned long pfn, unsigned long nr_pages,
				     struct zone *zone, bool mhp_off_inaccessible);
extern void mhp_deinit_memmap_on_memory(unsigned long pfn, unsigned long nr_pages);
extern int online_pages(unsigned long pfn, unsigned long nr_pages,
			struct zone *zone, struct memory_group *group);
extern void __offline_isolated_pages(unsigned long start_pfn,
				     unsigned long end_pfn);

typedef void (*online_page_callback_t)(struct page *page, unsigned int order);

extern void generic_online_page(struct page *page, unsigned int order);
extern int set_online_page_callback(online_page_callback_t callback);
extern int restore_online_page_callback(online_page_callback_t callback);
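
/*
 * Illustrative sketch: a ballooning driver can intercept onlining of
 * pages by installing its own callback (and must restore it on teardown).
 * "my_online_page" is a hypothetical name; pages the driver does not want
 * to hold back are handed to generic_online_page():
 *
 *	static void my_online_page(struct page *page, unsigned int order)
 *	{
 *		generic_online_page(page, order);
 *	}
 *
 *	rc = set_online_page_callback(&my_online_page);
 *	...
 *	restore_online_page_callback(&my_online_page);
 */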

extern int try_online_node(int nid);

extern int arch_add_memory(int nid, u64 start, u64 size,
			   struct mhp_params *params);
extern u64 max_mem_size;

extern int mhp_online_type_from_str(const char *str);

/* Default online_type (MMOP_*) when new memory blocks are added. */
extern int mhp_default_online_type;
/* If the movable_node boot option was specified */
extern bool movable_node_enabled;
static inline bool movable_node_is_enabled(void)
{
	return movable_node_enabled;
}

extern void arch_remove_memory(u64 start, u64 size, struct vmem_altmap *altmap);
extern void __remove_pages(unsigned long start_pfn, unsigned long nr_pages,
			   struct vmem_altmap *altmap);

/* reasonably generic interface to expand the physical pages */
extern int __add_pages(int nid, unsigned long start_pfn, unsigned long nr_pages,
		       struct mhp_params *params);

#ifndef CONFIG_ARCH_HAS_ADD_PAGES
static inline int add_pages(int nid, unsigned long start_pfn,
			    unsigned long nr_pages, struct mhp_params *params)
{
	return __add_pages(nid, start_pfn, nr_pages, params);
}
#else /* ARCH_HAS_ADD_PAGES */
int add_pages(int nid, unsigned long start_pfn, unsigned long nr_pages,
	      struct mhp_params *params);
#endif /* ARCH_HAS_ADD_PAGES */

void get_online_mems(void);
void put_online_mems(void);

void mem_hotplug_begin(void);
void mem_hotplug_done(void);
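
/*
 * Illustrative usage: readers that need the set of online memory to stay
 * stable bracket their work with get_online_mems()/put_online_mems();
 * the hotplug paths themselves run under mem_hotplug_begin()/
 * mem_hotplug_done():
 *
 *	get_online_mems();
 *	scan_online_sections();	// hypothetical reader-side work
 *	put_online_mems();
 */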

/* See kswapd_is_running() */
static inline void pgdat_kswapd_lock(pg_data_t *pgdat)
{
	mutex_lock(&pgdat->kswapd_lock);
}

static inline void pgdat_kswapd_unlock(pg_data_t *pgdat)
{
	mutex_unlock(&pgdat->kswapd_lock);
}

static inline void pgdat_kswapd_lock_init(pg_data_t *pgdat)
{
	mutex_init(&pgdat->kswapd_lock);
}

#else /* ! CONFIG_MEMORY_HOTPLUG */
#define pfn_to_online_page(pfn)			\
({						\
	struct page *___page = NULL;		\
	if (pfn_valid(pfn))			\
		___page = pfn_to_page(pfn);	\
	___page;				\
})

static inline unsigned zone_span_seqbegin(struct zone *zone)
{
	return 0;
}
static inline int zone_span_seqretry(struct zone *zone, unsigned iv)
{
	return 0;
}
static inline void zone_span_writelock(struct zone *zone) {}
static inline void zone_span_writeunlock(struct zone *zone) {}
static inline void zone_seqlock_init(struct zone *zone) {}

static inline int try_online_node(int nid)
{
	return 0;
}

static inline void get_online_mems(void) {}
static inline void put_online_mems(void) {}

static inline void mem_hotplug_begin(void) {}
static inline void mem_hotplug_done(void) {}

static inline bool movable_node_is_enabled(void)
{
	return false;
}

static inline bool mhp_supports_memmap_on_memory(void)
{
	return false;
}

static inline void pgdat_kswapd_lock(pg_data_t *pgdat) {}
static inline void pgdat_kswapd_unlock(pg_data_t *pgdat) {}
static inline void pgdat_kswapd_lock_init(pg_data_t *pgdat) {}
#endif /* ! CONFIG_MEMORY_HOTPLUG */

/*
 * Keep this declaration outside CONFIG_MEMORY_HOTPLUG, as some
 * platforms might override and use arch_get_mappable_range()
 * for internal, non-memory-hotplug purposes.
 */
struct range arch_get_mappable_range(void);

#if defined(CONFIG_MEMORY_HOTPLUG) || defined(CONFIG_DEFERRED_STRUCT_PAGE_INIT)
/*
 * pgdat resizing functions
 */
static inline
void pgdat_resize_lock(struct pglist_data *pgdat, unsigned long *flags)
{
	spin_lock_irqsave(&pgdat->node_size_lock, *flags);
}
static inline
void pgdat_resize_unlock(struct pglist_data *pgdat, unsigned long *flags)
{
	spin_unlock_irqrestore(&pgdat->node_size_lock, *flags);
}
static inline
void pgdat_resize_init(struct pglist_data *pgdat)
{
	spin_lock_init(&pgdat->node_size_lock);
}
#else /* !(CONFIG_MEMORY_HOTPLUG || CONFIG_DEFERRED_STRUCT_PAGE_INIT) */
/*
 * Stub functions for when hotplug is off
 */
static inline void pgdat_resize_lock(struct pglist_data *p, unsigned long *f) {}
static inline void pgdat_resize_unlock(struct pglist_data *p, unsigned long *f) {}
static inline void pgdat_resize_init(struct pglist_data *pgdat) {}
#endif /* !(CONFIG_MEMORY_HOTPLUG || CONFIG_DEFERRED_STRUCT_PAGE_INIT) */

#ifdef CONFIG_MEMORY_HOTREMOVE

extern void try_offline_node(int nid);
extern int offline_pages(unsigned long start_pfn, unsigned long nr_pages,
			 struct zone *zone, struct memory_group *group);
extern int remove_memory(u64 start, u64 size);
extern void __remove_memory(u64 start, u64 size);
extern int offline_and_remove_memory(u64 start, u64 size);
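
/*
 * Illustrative teardown sketch: a driver that hot-added a range earlier
 * can try to offline and remove it in one step; a failure (e.g. -EBUSY)
 * typically means some pages could not be isolated or migrated:
 *
 *	rc = offline_and_remove_memory(start, size);
 *	if (rc)
 *		pr_warn("failed to offline and remove memory: %d\n", rc);
 */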

#else
static inline void try_offline_node(int nid) {}

static inline int offline_pages(unsigned long start_pfn, unsigned long nr_pages,
				struct zone *zone, struct memory_group *group)
{
	return -EINVAL;
}

static inline int remove_memory(u64 start, u64 size)
{
	return -EBUSY;
}

static inline void __remove_memory(u64 start, u64 size) {}
#endif /* CONFIG_MEMORY_HOTREMOVE */

#ifdef CONFIG_MEMORY_HOTPLUG
extern void __ref free_area_init_core_hotplug(struct pglist_data *pgdat);
extern int __add_memory(int nid, u64 start, u64 size, mhp_t mhp_flags);
extern int add_memory(int nid, u64 start, u64 size, mhp_t mhp_flags);
extern int add_memory_resource(int nid, struct resource *resource,
			       mhp_t mhp_flags);
extern int add_memory_driver_managed(int nid, u64 start, u64 size,
				     const char *resource_name,
				     mhp_t mhp_flags);
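
/*
 * Illustrative sketch: drivers exposing driver-managed memory (dax/kmem
 * style) use add_memory_driver_managed() so the range appears in
 * /proc/iomem under a driver-specific name instead of plain "System RAM":
 *
 *	rc = add_memory_driver_managed(nid, start, size,
 *				       "System RAM (example)", MHP_NONE);
 */
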
extern void move_pfn_range_to_zone(struct zone *zone, unsigned long start_pfn,
				   unsigned long nr_pages,
				   struct vmem_altmap *altmap, int migratetype);
extern void remove_pfn_range_from_zone(struct zone *zone,
				       unsigned long start_pfn,
				       unsigned long nr_pages);
extern int sparse_add_section(int nid, unsigned long pfn,
			      unsigned long nr_pages, struct vmem_altmap *altmap,
			      struct dev_pagemap *pgmap);
extern void sparse_remove_section(unsigned long pfn, unsigned long nr_pages,
				  struct vmem_altmap *altmap);
extern struct page *sparse_decode_mem_map(unsigned long coded_mem_map,
					  unsigned long pnum);
extern struct zone *zone_for_pfn_range(int online_type, int nid,
				       struct memory_group *group,
				       unsigned long start_pfn,
				       unsigned long nr_pages);
extern int arch_create_linear_mapping(int nid, u64 start, u64 size,
				      struct mhp_params *params);
void arch_remove_linear_mapping(u64 start, u64 size);
#endif /* CONFIG_MEMORY_HOTPLUG */

#endif /* __LINUX_MEMORY_HOTPLUG_H */