xref: /linux-6.15/include/linux/vmstat.h (revision 3ac44a34)
1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef _LINUX_VMSTAT_H
3 #define _LINUX_VMSTAT_H
4 
5 #include <linux/types.h>
6 #include <linux/percpu.h>
7 #include <linux/mmzone.h>
8 #include <linux/vm_event_item.h>
9 #include <linux/atomic.h>
10 #include <linux/static_key.h>
11 #include <linux/mmdebug.h>
12 
/* Declared here only; the variable is defined outside this header. */
extern int sysctl_stat_interval;

#ifdef CONFIG_NUMA
/*
 * Symbolic names for 1 and 0.
 * NOTE(review): presumably the values stored in sysctl_vm_numa_stat -
 * confirm against the handler's definition.
 */
#define ENABLE_NUMA_STAT   1
#define DISABLE_NUMA_STAT   0
extern int sysctl_vm_numa_stat;
/* Static branch key, declared with the "true" default. */
DECLARE_STATIC_KEY_TRUE(vm_numa_stat_key);
/*
 * Read/write handler (table, write flag, user buffer, length, position);
 * the implementation is not part of this header.
 */
int sysctl_vm_numa_stat_handler(struct ctl_table *table, int write,
		void *buffer, size_t *length, loff_t *ppos);
#endif
23 
24 struct reclaim_stat {
25 	unsigned nr_dirty;
26 	unsigned nr_unqueued_dirty;
27 	unsigned nr_congested;
28 	unsigned nr_writeback;
29 	unsigned nr_immediate;
30 	unsigned nr_pageout;
31 	unsigned nr_activate[ANON_AND_FILE];
32 	unsigned nr_ref_keep;
33 	unsigned nr_unmap_fail;
34 	unsigned nr_lazyfree_fail;
35 };
36 
/*
 * Indices of the writeback threshold entries.  writeback_stat_name() uses
 * these as an offset into vmstat_text[]; the final enumerator is the
 * number of entries and is used by vm_event_name() to skip past them.
 */
enum writeback_stat_item {
	NR_DIRTY_THRESHOLD,
	NR_DIRTY_BG_THRESHOLD,
	NR_VM_WRITEBACK_STAT_ITEMS,
};
42 
43 #ifdef CONFIG_VM_EVENT_COUNTERS
44 /*
45  * Light weight per cpu counter implementation.
46  *
47  * Counters should only be incremented and no critical kernel component
48  * should rely on the counter values.
49  *
50  * Counters are handled completely inline. On many platforms the code
51  * generated will simply be the increment of a global address.
52  */
53 
/* One unsigned long counter per vm_event_item value. */
struct vm_event_state {
	unsigned long event[NR_VM_EVENT_ITEMS];
};

/* Per-cpu instance of the counters; the count_vm_event*() helpers update it. */
DECLARE_PER_CPU(struct vm_event_state, vm_event_states);
59 
/*
 * vm counters are allowed to be racy. Use raw_cpu_ops to avoid the
 * local_irq_disable overhead.
 *
 * __count_vm_event() adds one to the per-cpu counter for @item using
 * raw_cpu_inc().
 */
static inline void __count_vm_event(enum vm_event_item item)
{
	raw_cpu_inc(vm_event_states.event[item]);
}
68 
/*
 * Add one to the per-cpu counter for @item.  Same update as
 * __count_vm_event(), but issued with this_cpu_inc() instead of
 * raw_cpu_inc().
 */
static inline void count_vm_event(enum vm_event_item item)
{
	this_cpu_inc(vm_event_states.event[item]);
}
73 
/* Add @delta to the per-cpu counter for @item using raw_cpu_add(). */
static inline void __count_vm_events(enum vm_event_item item, long delta)
{
	raw_cpu_add(vm_event_states.event[item], delta);
}
78 
/*
 * Add @delta to the per-cpu counter for @item.  Same update as
 * __count_vm_events(), but issued with this_cpu_add() instead of
 * raw_cpu_add().
 */
static inline void count_vm_events(enum vm_event_item item, long delta)
{
	this_cpu_add(vm_event_states.event[item], delta);
}
83 
/*
 * Out-of-line helpers, implemented outside this header.
 * NOTE(review): @ret presumably points at an array with one slot per
 * vm_event_item - confirm against the definition.
 */
void all_vm_events(unsigned long *ret);

void vm_events_fold_cpu(int cpu);
87 
88 #else
89 
90 /* Disable counters */
91 static inline void count_vm_event(enum vm_event_item item)
92 {
93 }
94 static inline void count_vm_events(enum vm_event_item item, long delta)
95 {
96 }
97 static inline void __count_vm_event(enum vm_event_item item)
98 {
99 }
100 static inline void __count_vm_events(enum vm_event_item item, long delta)
101 {
102 }
103 static inline void all_vm_events(unsigned long *ret)
104 {
105 }
106 static inline void vm_events_fold_cpu(int cpu)
107 {
108 }
109 
110 #endif /* CONFIG_VM_EVENT_COUNTERS */
111 
/*
 * NUMA-balancing event wrappers: forwarded to count_vm_event(s)() when
 * CONFIG_NUMA_BALANCING is set, otherwise empty statements.  The empty
 * count_vm_numa_events() still evaluates @y through a (void) cast.
 */
#ifdef CONFIG_NUMA_BALANCING
#define count_vm_numa_event(x)     count_vm_event(x)
#define count_vm_numa_events(x, y) count_vm_events(x, y)
#else
#define count_vm_numa_event(x) do {} while (0)
#define count_vm_numa_events(x, y) do { (void)(y); } while (0)
#endif /* CONFIG_NUMA_BALANCING */
119 
/*
 * TLB event wrappers: forwarded to count_vm_event(s)() when
 * CONFIG_DEBUG_TLBFLUSH is set, otherwise empty statements.  The empty
 * count_vm_tlb_events() still evaluates @y through a (void) cast.
 */
#ifdef CONFIG_DEBUG_TLBFLUSH
#define count_vm_tlb_event(x)	   count_vm_event(x)
#define count_vm_tlb_events(x, y)  count_vm_events(x, y)
#else
#define count_vm_tlb_event(x)     do {} while (0)
#define count_vm_tlb_events(x, y) do { (void)(y); } while (0)
#endif
127 
/*
 * vmacache event wrapper: forwarded to count_vm_event() when
 * CONFIG_DEBUG_VM_VMACACHE is set, otherwise an empty statement.
 */
#ifdef CONFIG_DEBUG_VM_VMACACHE
#define count_vm_vmacache_event(x) count_vm_event(x)
#else
#define count_vm_vmacache_event(x) do {} while (0)
#endif
133 
/*
 * Add @delta to the per-zone flavour of event family @item for zone index
 * @zid.  The event index is item##_NORMAL - ZONE_NORMAL + zid, i.e. it is
 * computed relative to the family's _NORMAL enumerator.
 *
 * @zid is parenthesised so that an expression argument (for example a
 * conditional) is not re-associated with the surrounding arithmetic.
 */
#define __count_zid_vm_events(item, zid, delta) \
	__count_vm_events(item##_NORMAL - ZONE_NORMAL + (zid), delta)
136 
/*
 * Zone and node-based page accounting with per cpu differentials.
 *
 * These are the global totals, one atomic_long_t per item; they are
 * defined outside this header.
 */
extern atomic_long_t vm_zone_stat[NR_VM_ZONE_STAT_ITEMS];
extern atomic_long_t vm_node_stat[NR_VM_NODE_STAT_ITEMS];
extern atomic_long_t vm_numa_event[NR_VM_NUMA_EVENT_ITEMS];
143 
144 #ifdef CONFIG_NUMA
/*
 * Add @x to NUMA event @item in both @zone's own counter and the global
 * vm_numa_event[] counter.
 */
static inline void zone_numa_event_add(long x, struct zone *zone,
				enum numa_stat_item item)
{
	atomic_long_add(x, &zone->vm_numa_event[item]);
	atomic_long_add(x, &vm_numa_event[item]);
}
151 
/* Return the current value of @zone's counter for NUMA event @item. */
static inline unsigned long zone_numa_event_state(struct zone *zone,
					enum numa_stat_item item)
{
	return atomic_long_read(&zone->vm_numa_event[item]);
}
157 
/* Return the current value of the global counter for NUMA event @item. */
static inline unsigned long
global_numa_event_state(enum numa_stat_item item)
{
	return atomic_long_read(&vm_numa_event[item]);
}
163 #endif /* CONFIG_NUMA */
164 
/*
 * Add @x to zone counter @item in both @zone's own vm_stat[] and the
 * global vm_zone_stat[] array.
 */
static inline void zone_page_state_add(long x, struct zone *zone,
				 enum zone_stat_item item)
{
	atomic_long_add(x, &zone->vm_stat[item]);
	atomic_long_add(x, &vm_zone_stat[item]);
}
171 
/*
 * Add @x to node counter @item in both @pgdat's own vm_stat[] and the
 * global vm_node_stat[] array.
 */
static inline void node_page_state_add(long x, struct pglist_data *pgdat,
				 enum node_stat_item item)
{
	atomic_long_add(x, &pgdat->vm_stat[item]);
	atomic_long_add(x, &vm_node_stat[item]);
}
178 
179 static inline unsigned long global_zone_page_state(enum zone_stat_item item)
180 {
181 	long x = atomic_long_read(&vm_zone_stat[item]);
182 #ifdef CONFIG_SMP
183 	if (x < 0)
184 		x = 0;
185 #endif
186 	return x;
187 }
188 
189 static inline
190 unsigned long global_node_page_state_pages(enum node_stat_item item)
191 {
192 	long x = atomic_long_read(&vm_node_stat[item]);
193 #ifdef CONFIG_SMP
194 	if (x < 0)
195 		x = 0;
196 #endif
197 	return x;
198 }
199 
/*
 * Read the global total for node counter @item via
 * global_node_page_state_pages().  Triggers VM_WARN_ON_ONCE() when
 * vmstat_item_in_bytes(@item) is true.
 */
static inline unsigned long global_node_page_state(enum node_stat_item item)
{
	VM_WARN_ON_ONCE(vmstat_item_in_bytes(item));

	return global_node_page_state_pages(item);
}
206 
207 static inline unsigned long zone_page_state(struct zone *zone,
208 					enum zone_stat_item item)
209 {
210 	long x = atomic_long_read(&zone->vm_stat[item]);
211 #ifdef CONFIG_SMP
212 	if (x < 0)
213 		x = 0;
214 #endif
215 	return x;
216 }
217 
218 /*
219  * More accurate version that also considers the currently pending
220  * deltas. For that we need to loop over all cpus to find the current
221  * deltas. There is no synchronization so the result cannot be
222  * exactly accurate either.
223  */
224 static inline unsigned long zone_page_state_snapshot(struct zone *zone,
225 					enum zone_stat_item item)
226 {
227 	long x = atomic_long_read(&zone->vm_stat[item]);
228 
229 #ifdef CONFIG_SMP
230 	int cpu;
231 	for_each_online_cpu(cpu)
232 		x += per_cpu_ptr(zone->per_cpu_zonestats, cpu)->vm_stat_diff[item];
233 
234 	if (x < 0)
235 		x = 0;
236 #endif
237 	return x;
238 }
239 
240 #ifdef CONFIG_NUMA
241 /* See __count_vm_event comment on why raw_cpu_inc is used. */
242 static inline void
243 __count_numa_event(struct zone *zone, enum numa_stat_item item)
244 {
245 	struct per_cpu_zonestat __percpu *pzstats = zone->per_cpu_zonestats;
246 
247 	raw_cpu_inc(pzstats->vm_numa_event[item]);
248 }
249 
/*
 * CONFIG_NUMA: per-node accessors, implemented outside this header.  The
 * !CONFIG_NUMA branch provides same-named replacements.
 */
unsigned long sum_zone_node_page_state(int node, enum zone_stat_item item);
unsigned long sum_zone_numa_event_state(int node, enum numa_stat_item item);
unsigned long node_page_state(struct pglist_data *pgdat,
			      enum node_stat_item item);
unsigned long node_page_state_pages(struct pglist_data *pgdat,
				    enum node_stat_item item);
void fold_vm_numa_events(void);
258 #else
/*
 * !CONFIG_NUMA: the node argument is dropped and each per-node accessor
 * expands to the corresponding global accessor; fold_vm_numa_events() is
 * an empty inline.
 */
#define sum_zone_node_page_state(node, item) global_zone_page_state(item)
#define node_page_state(node, item) global_node_page_state(item)
#define node_page_state_pages(node, item) global_node_page_state_pages(item)
static inline void fold_vm_numa_events(void)
{
}
265 #endif /* CONFIG_NUMA */
266 
267 #ifdef CONFIG_SMP
/*
 * CONFIG_SMP: the counter update entry points are real functions
 * implemented outside this header.  The plain and the __-prefixed names
 * are distinct functions here; the !CONFIG_SMP branch of this header maps
 * the plain names onto the __ versions instead.
 */
void __mod_zone_page_state(struct zone *zone, enum zone_stat_item item,
			   long delta);
void __inc_zone_page_state(struct page *page, enum zone_stat_item item);
void __dec_zone_page_state(struct page *page, enum zone_stat_item item);

void __mod_node_page_state(struct pglist_data *pgdat,
			   enum node_stat_item item, long delta);
void __inc_node_page_state(struct page *page, enum node_stat_item item);
void __dec_node_page_state(struct page *page, enum node_stat_item item);

void mod_zone_page_state(struct zone *zone, enum zone_stat_item item,
			 long delta);
void inc_zone_page_state(struct page *page, enum zone_stat_item item);
void dec_zone_page_state(struct page *page, enum zone_stat_item item);

void mod_node_page_state(struct pglist_data *pgdat,
			 enum node_stat_item item, long delta);
void inc_node_page_state(struct page *page, enum node_stat_item item);
void dec_node_page_state(struct page *page, enum node_stat_item item);
283 
/* CONFIG_SMP: increment/decrement helpers that take the zone or node directly. */
void inc_node_state(struct pglist_data *pgdat, enum node_stat_item item);
void __inc_zone_state(struct zone *zone, enum zone_stat_item item);
void __inc_node_state(struct pglist_data *pgdat, enum node_stat_item item);
void dec_zone_state(struct zone *zone, enum zone_stat_item item);
void __dec_zone_state(struct zone *zone, enum zone_stat_item item);
void __dec_node_state(struct pglist_data *pgdat, enum node_stat_item item);
290 
291 void quiet_vmstat(void);
292 void cpu_vm_stats_fold(int cpu);
293 void refresh_zone_stat_thresholds(void);
294 
295 struct ctl_table;
296 int vmstat_refresh(struct ctl_table *, int write, void *buffer, size_t *lenp,
297 		loff_t *ppos);
298 
299 void drain_zonestat(struct zone *zone, struct per_cpu_zonestat *);
300 
301 int calculate_pressure_threshold(struct zone *zone);
302 int calculate_normal_threshold(struct zone *zone);
303 void set_pgdat_percpu_threshold(pg_data_t *pgdat,
304 				int (*calculate_pressure)(struct zone *));
305 #else /* CONFIG_SMP */
306 
307 /*
308  * We do not maintain differentials in a single processor configuration.
309  * The functions directly modify the zone and global counters.
310  */
/*
 * Uniprocessor version: add @delta to zone counter @item directly via
 * zone_page_state_add().
 */
static inline void __mod_zone_page_state(struct zone *zone,
			enum zone_stat_item item, long delta)
{
	zone_page_state_add(delta, zone, item);
}
316 
317 static inline void __mod_node_page_state(struct pglist_data *pgdat,
318 			enum node_stat_item item, int delta)
319 {
320 	if (vmstat_item_in_bytes(item)) {
321 		/*
322 		 * Only cgroups use subpage accounting right now; at
323 		 * the global level, these items still change in
324 		 * multiples of whole pages. Store them as pages
325 		 * internally to keep the per-cpu counters compact.
326 		 */
327 		VM_WARN_ON_ONCE(delta & (PAGE_SIZE - 1));
328 		delta >>= PAGE_SHIFT;
329 	}
330 
331 	node_page_state_add(delta, pgdat, item);
332 }
333 
/* Uniprocessor version: increment @item in @zone's counter and in the global one. */
static inline void __inc_zone_state(struct zone *zone, enum zone_stat_item item)
{
	atomic_long_inc(&zone->vm_stat[item]);
	atomic_long_inc(&vm_zone_stat[item]);
}
339 
/* Uniprocessor version: increment @item in @pgdat's counter and in the global one. */
static inline void __inc_node_state(struct pglist_data *pgdat, enum node_stat_item item)
{
	atomic_long_inc(&pgdat->vm_stat[item]);
	atomic_long_inc(&vm_node_stat[item]);
}
345 
/* Uniprocessor version: decrement @item in @zone's counter and in the global one. */
static inline void __dec_zone_state(struct zone *zone, enum zone_stat_item item)
{
	atomic_long_dec(&zone->vm_stat[item]);
	atomic_long_dec(&vm_zone_stat[item]);
}
351 
/* Uniprocessor version: decrement @item in @pgdat's counter and in the global one. */
static inline void __dec_node_state(struct pglist_data *pgdat, enum node_stat_item item)
{
	atomic_long_dec(&pgdat->vm_stat[item]);
	atomic_long_dec(&vm_node_stat[item]);
}
357 
/* Increment zone counter @item for the zone that page_zone(@page) returns. */
static inline void __inc_zone_page_state(struct page *page,
			enum zone_stat_item item)
{
	__inc_zone_state(page_zone(page), item);
}
363 
/* Increment node counter @item for the node that page_pgdat(@page) returns. */
static inline void __inc_node_page_state(struct page *page,
			enum node_stat_item item)
{
	__inc_node_state(page_pgdat(page), item);
}
369 
370 
/* Decrement zone counter @item for the zone that page_zone(@page) returns. */
static inline void __dec_zone_page_state(struct page *page,
			enum zone_stat_item item)
{
	__dec_zone_state(page_zone(page), item);
}
376 
/* Decrement node counter @item for the node that page_pgdat(@page) returns. */
static inline void __dec_node_page_state(struct page *page,
			enum node_stat_item item)
{
	__dec_node_state(page_pgdat(page), item);
}
382 
383 
/*
 * We only use atomic operations to update counters. So there is no need to
 * disable interrupts.
 *
 * The plain names are therefore simple aliases of the __-prefixed inline
 * versions in this configuration.
 */
#define inc_zone_page_state __inc_zone_page_state
#define dec_zone_page_state __dec_zone_page_state
#define mod_zone_page_state __mod_zone_page_state

#define inc_node_page_state __inc_node_page_state
#define dec_node_page_state __dec_node_page_state
#define mod_node_page_state __mod_node_page_state

#define inc_zone_state __inc_zone_state
#define inc_node_state __inc_node_state
#define dec_zone_state __dec_zone_state
399 
/*
 * Uniprocessor stand-in: expands to an empty statement and evaluates
 * neither argument.  do { } while (0) is used instead of a bare "{ }" so
 * that "set_pgdat_percpu_threshold(...);" stays a single statement and can
 * be the body of an unbraced if that is followed by an else.
 */
#define set_pgdat_percpu_threshold(pgdat, callback) do { } while (0)
401 
/* Uniprocessor stand-ins for the CONFIG_SMP maintenance functions: all empty. */
static inline void refresh_zone_stat_thresholds(void) { }
static inline void cpu_vm_stats_fold(int cpu) { }
static inline void quiet_vmstat(void) { }

static inline void drain_zonestat(struct zone *zone,
			struct per_cpu_zonestat *pzstats) { }
408 #endif		/* CONFIG_SMP */
409 
410 static inline void __mod_zone_freepage_state(struct zone *zone, int nr_pages,
411 					     int migratetype)
412 {
413 	__mod_zone_page_state(zone, NR_FREE_PAGES, nr_pages);
414 	if (is_migrate_cma(migratetype))
415 		__mod_zone_page_state(zone, NR_FREE_CMA_PAGES, nr_pages);
416 }
417 
/*
 * Table of counter names, defined outside this header.  The *_name()
 * helpers in this header index it with a fixed offset per counter class.
 */
extern const char * const vmstat_text[];

/* Zone stat names are indexed by @item directly, with no offset. */
static inline const char *zone_stat_name(enum zone_stat_item item)
{
	return vmstat_text[item];
}
424 
425 #ifdef CONFIG_NUMA
426 static inline const char *numa_stat_name(enum numa_stat_item item)
427 {
428 	return vmstat_text[NR_VM_ZONE_STAT_ITEMS +
429 			   item];
430 }
431 #endif /* CONFIG_NUMA */
432 
433 static inline const char *node_stat_name(enum node_stat_item item)
434 {
435 	return vmstat_text[NR_VM_ZONE_STAT_ITEMS +
436 			   NR_VM_NUMA_EVENT_ITEMS +
437 			   item];
438 }
439 
440 static inline const char *lru_list_name(enum lru_list lru)
441 {
442 	return node_stat_name(NR_LRU_BASE + lru) + 3; // skip "nr_"
443 }
444 
445 static inline const char *writeback_stat_name(enum writeback_stat_item item)
446 {
447 	return vmstat_text[NR_VM_ZONE_STAT_ITEMS +
448 			   NR_VM_NUMA_EVENT_ITEMS +
449 			   NR_VM_NODE_STAT_ITEMS +
450 			   item];
451 }
452 
453 #if defined(CONFIG_VM_EVENT_COUNTERS) || defined(CONFIG_MEMCG)
454 static inline const char *vm_event_name(enum vm_event_item item)
455 {
456 	return vmstat_text[NR_VM_ZONE_STAT_ITEMS +
457 			   NR_VM_NUMA_EVENT_ITEMS +
458 			   NR_VM_NODE_STAT_ITEMS +
459 			   NR_VM_WRITEBACK_STAT_ITEMS +
460 			   item];
461 }
462 #endif /* CONFIG_VM_EVENT_COUNTERS || CONFIG_MEMCG */
463 
464 #ifdef CONFIG_MEMCG
465 
466 void __mod_lruvec_state(struct lruvec *lruvec, enum node_stat_item idx,
467 			int val);
468 
469 static inline void mod_lruvec_state(struct lruvec *lruvec,
470 				    enum node_stat_item idx, int val)
471 {
472 	unsigned long flags;
473 
474 	local_irq_save(flags);
475 	__mod_lruvec_state(lruvec, idx, val);
476 	local_irq_restore(flags);
477 }
478 
479 void __mod_lruvec_page_state(struct page *page,
480 			     enum node_stat_item idx, int val);
481 
482 static inline void mod_lruvec_page_state(struct page *page,
483 					 enum node_stat_item idx, int val)
484 {
485 	unsigned long flags;
486 
487 	local_irq_save(flags);
488 	__mod_lruvec_page_state(page, idx, val);
489 	local_irq_restore(flags);
490 }
491 
492 #else
493 
/*
 * !CONFIG_MEMCG: apply @val to node counter @idx of the node returned by
 * lruvec_pgdat(@lruvec), using __mod_node_page_state().
 */
static inline void __mod_lruvec_state(struct lruvec *lruvec,
				      enum node_stat_item idx, int val)
{
	__mod_node_page_state(lruvec_pgdat(lruvec), idx, val);
}
499 
/*
 * !CONFIG_MEMCG: apply @val to node counter @idx of the node returned by
 * lruvec_pgdat(@lruvec), using mod_node_page_state().
 */
static inline void mod_lruvec_state(struct lruvec *lruvec,
				    enum node_stat_item idx, int val)
{
	mod_node_page_state(lruvec_pgdat(lruvec), idx, val);
}
505 
/*
 * !CONFIG_MEMCG: apply @val to node counter @idx of the node returned by
 * page_pgdat(@page), using __mod_node_page_state().
 */
static inline void __mod_lruvec_page_state(struct page *page,
					   enum node_stat_item idx, int val)
{
	__mod_node_page_state(page_pgdat(page), idx, val);
}
511 
/*
 * !CONFIG_MEMCG: apply @val to node counter @idx of the node returned by
 * page_pgdat(@page), using mod_node_page_state().
 */
static inline void mod_lruvec_page_state(struct page *page,
					 enum node_stat_item idx, int val)
{
	mod_node_page_state(page_pgdat(page), idx, val);
}
517 
518 #endif /* CONFIG_MEMCG */
519 
/* Add 1 to counter @idx of @lruvec via mod_lruvec_state(). */
static inline void inc_lruvec_state(struct lruvec *lruvec,
				    enum node_stat_item idx)
{
	mod_lruvec_state(lruvec, idx, 1);
}
525 
/* Add 1 to counter @idx for @page via __mod_lruvec_page_state(). */
static inline void __inc_lruvec_page_state(struct page *page,
					   enum node_stat_item idx)
{
	__mod_lruvec_page_state(page, idx, 1);
}
531 
/* Subtract 1 from counter @idx for @page via __mod_lruvec_page_state(). */
static inline void __dec_lruvec_page_state(struct page *page,
					   enum node_stat_item idx)
{
	__mod_lruvec_page_state(page, idx, -1);
}
537 
/* Add 1 to counter @idx for @page via mod_lruvec_page_state(). */
static inline void inc_lruvec_page_state(struct page *page,
					 enum node_stat_item idx)
{
	mod_lruvec_page_state(page, idx, 1);
}
543 
/* Subtract 1 from counter @idx for @page via mod_lruvec_page_state(). */
static inline void dec_lruvec_page_state(struct page *page,
					 enum node_stat_item idx)
{
	mod_lruvec_page_state(page, idx, -1);
}
549 
550 #endif /* _LINUX_VMSTAT_H */
551