1 /* SPDX-License-Identifier: GPL-2.0 */ 2 #ifndef _LINUX_VMSTAT_H 3 #define _LINUX_VMSTAT_H 4 5 #include <linux/types.h> 6 #include <linux/percpu.h> 7 #include <linux/mmzone.h> 8 #include <linux/vm_event_item.h> 9 #include <linux/atomic.h> 10 #include <linux/static_key.h> 11 #include <linux/mmdebug.h> 12 13 extern int sysctl_stat_interval; 14 15 #ifdef CONFIG_NUMA 16 #define ENABLE_NUMA_STAT 1 17 #define DISABLE_NUMA_STAT 0 18 extern int sysctl_vm_numa_stat; 19 DECLARE_STATIC_KEY_TRUE(vm_numa_stat_key); 20 int sysctl_vm_numa_stat_handler(struct ctl_table *table, int write, 21 void *buffer, size_t *length, loff_t *ppos); 22 #endif 23 24 struct reclaim_stat { 25 unsigned nr_dirty; 26 unsigned nr_unqueued_dirty; 27 unsigned nr_congested; 28 unsigned nr_writeback; 29 unsigned nr_immediate; 30 unsigned nr_pageout; 31 unsigned nr_activate[ANON_AND_FILE]; 32 unsigned nr_ref_keep; 33 unsigned nr_unmap_fail; 34 unsigned nr_lazyfree_fail; 35 }; 36 37 enum writeback_stat_item { 38 NR_DIRTY_THRESHOLD, 39 NR_DIRTY_BG_THRESHOLD, 40 NR_VM_WRITEBACK_STAT_ITEMS, 41 }; 42 43 #ifdef CONFIG_VM_EVENT_COUNTERS 44 /* 45 * Light weight per cpu counter implementation. 46 * 47 * Counters should only be incremented and no critical kernel component 48 * should rely on the counter values. 49 * 50 * Counters are handled completely inline. On many platforms the code 51 * generated will simply be the increment of a global address. 52 */ 53 54 struct vm_event_state { 55 unsigned long event[NR_VM_EVENT_ITEMS]; 56 }; 57 58 DECLARE_PER_CPU(struct vm_event_state, vm_event_states); 59 60 /* 61 * vm counters are allowed to be racy. Use raw_cpu_ops to avoid the 62 * local_irq_disable overhead. 63 */ 64 static inline void __count_vm_event(enum vm_event_item item) 65 { 66 raw_cpu_inc(vm_event_states.event[item]); 67 } 68 69 static inline void count_vm_event(enum vm_event_item item) 70 { 71 this_cpu_inc(vm_event_states.event[item]); 72 } 73 74 static inline void __count_vm_events(enum vm_event_item item, long delta) 75 { 76 raw_cpu_add(vm_event_states.event[item], delta); 77 } 78 79 static inline void count_vm_events(enum vm_event_item item, long delta) 80 { 81 this_cpu_add(vm_event_states.event[item], delta); 82 } 83 84 extern void all_vm_events(unsigned long *); 85 86 extern void vm_events_fold_cpu(int cpu); 87 88 #else 89 90 /* Disable counters */ 91 static inline void count_vm_event(enum vm_event_item item) 92 { 93 } 94 static inline void count_vm_events(enum vm_event_item item, long delta) 95 { 96 } 97 static inline void __count_vm_event(enum vm_event_item item) 98 { 99 } 100 static inline void __count_vm_events(enum vm_event_item item, long delta) 101 { 102 } 103 static inline void all_vm_events(unsigned long *ret) 104 { 105 } 106 static inline void vm_events_fold_cpu(int cpu) 107 { 108 } 109 110 #endif /* CONFIG_VM_EVENT_COUNTERS */ 111 112 #ifdef CONFIG_NUMA_BALANCING 113 #define count_vm_numa_event(x) count_vm_event(x) 114 #define count_vm_numa_events(x, y) count_vm_events(x, y) 115 #else 116 #define count_vm_numa_event(x) do {} while (0) 117 #define count_vm_numa_events(x, y) do { (void)(y); } while (0) 118 #endif /* CONFIG_NUMA_BALANCING */ 119 120 #ifdef CONFIG_DEBUG_TLBFLUSH 121 #define count_vm_tlb_event(x) count_vm_event(x) 122 #define count_vm_tlb_events(x, y) count_vm_events(x, y) 123 #else 124 #define count_vm_tlb_event(x) do {} while (0) 125 #define count_vm_tlb_events(x, y) do { (void)(y); } while (0) 126 #endif 127 128 #ifdef CONFIG_DEBUG_VM_VMACACHE 129 #define count_vm_vmacache_event(x) count_vm_event(x) 130 #else 131 #define count_vm_vmacache_event(x) do {} while (0) 132 #endif 133 134 #define __count_zid_vm_events(item, zid, delta) \ 135 __count_vm_events(item##_NORMAL - ZONE_NORMAL + zid, delta) 136 137 /* 138 * Zone and node-based page accounting with per cpu differentials. 139 */ 140 extern atomic_long_t vm_zone_stat[NR_VM_ZONE_STAT_ITEMS]; 141 extern atomic_long_t vm_node_stat[NR_VM_NODE_STAT_ITEMS]; 142 extern atomic_long_t vm_numa_event[NR_VM_NUMA_EVENT_ITEMS]; 143 144 #ifdef CONFIG_NUMA 145 static inline void zone_numa_event_add(long x, struct zone *zone, 146 enum numa_stat_item item) 147 { 148 atomic_long_add(x, &zone->vm_numa_event[item]); 149 atomic_long_add(x, &vm_numa_event[item]); 150 } 151 152 static inline unsigned long zone_numa_event_state(struct zone *zone, 153 enum numa_stat_item item) 154 { 155 return atomic_long_read(&zone->vm_numa_event[item]); 156 } 157 158 static inline unsigned long 159 global_numa_event_state(enum numa_stat_item item) 160 { 161 return atomic_long_read(&vm_numa_event[item]); 162 } 163 #endif /* CONFIG_NUMA */ 164 165 static inline void zone_page_state_add(long x, struct zone *zone, 166 enum zone_stat_item item) 167 { 168 atomic_long_add(x, &zone->vm_stat[item]); 169 atomic_long_add(x, &vm_zone_stat[item]); 170 } 171 172 static inline void node_page_state_add(long x, struct pglist_data *pgdat, 173 enum node_stat_item item) 174 { 175 atomic_long_add(x, &pgdat->vm_stat[item]); 176 atomic_long_add(x, &vm_node_stat[item]); 177 } 178 179 static inline unsigned long global_zone_page_state(enum zone_stat_item item) 180 { 181 long x = atomic_long_read(&vm_zone_stat[item]); 182 #ifdef CONFIG_SMP 183 if (x < 0) 184 x = 0; 185 #endif 186 return x; 187 } 188 189 static inline 190 unsigned long global_node_page_state_pages(enum node_stat_item item) 191 { 192 long x = atomic_long_read(&vm_node_stat[item]); 193 #ifdef CONFIG_SMP 194 if (x < 0) 195 x = 0; 196 #endif 197 return x; 198 } 199 200 static inline unsigned long global_node_page_state(enum node_stat_item item) 201 { 202 VM_WARN_ON_ONCE(vmstat_item_in_bytes(item)); 203 204 return global_node_page_state_pages(item); 205 } 206 207 static inline unsigned long zone_page_state(struct zone *zone, 208 enum zone_stat_item item) 209 { 210 long x = atomic_long_read(&zone->vm_stat[item]); 211 #ifdef CONFIG_SMP 212 if (x < 0) 213 x = 0; 214 #endif 215 return x; 216 } 217 218 /* 219 * More accurate version that also considers the currently pending 220 * deltas. For that we need to loop over all cpus to find the current 221 * deltas. There is no synchronization so the result cannot be 222 * exactly accurate either. 223 */ 224 static inline unsigned long zone_page_state_snapshot(struct zone *zone, 225 enum zone_stat_item item) 226 { 227 long x = atomic_long_read(&zone->vm_stat[item]); 228 229 #ifdef CONFIG_SMP 230 int cpu; 231 for_each_online_cpu(cpu) 232 x += per_cpu_ptr(zone->per_cpu_zonestats, cpu)->vm_stat_diff[item]; 233 234 if (x < 0) 235 x = 0; 236 #endif 237 return x; 238 } 239 240 #ifdef CONFIG_NUMA 241 /* See __count_vm_event comment on why raw_cpu_inc is used. */ 242 static inline void 243 __count_numa_event(struct zone *zone, enum numa_stat_item item) 244 { 245 struct per_cpu_zonestat __percpu *pzstats = zone->per_cpu_zonestats; 246 247 raw_cpu_inc(pzstats->vm_numa_event[item]); 248 } 249 250 extern unsigned long sum_zone_node_page_state(int node, 251 enum zone_stat_item item); 252 extern unsigned long sum_zone_numa_event_state(int node, enum numa_stat_item item); 253 extern unsigned long node_page_state(struct pglist_data *pgdat, 254 enum node_stat_item item); 255 extern unsigned long node_page_state_pages(struct pglist_data *pgdat, 256 enum node_stat_item item); 257 extern void fold_vm_numa_events(void); 258 #else 259 #define sum_zone_node_page_state(node, item) global_zone_page_state(item) 260 #define node_page_state(node, item) global_node_page_state(item) 261 #define node_page_state_pages(node, item) global_node_page_state_pages(item) 262 static inline void fold_vm_numa_events(void) 263 { 264 } 265 #endif /* CONFIG_NUMA */ 266 267 #ifdef CONFIG_SMP 268 void __mod_zone_page_state(struct zone *, enum zone_stat_item item, long); 269 void __inc_zone_page_state(struct page *, enum zone_stat_item); 270 void __dec_zone_page_state(struct page *, enum zone_stat_item); 271 272 void __mod_node_page_state(struct pglist_data *, enum node_stat_item item, long); 273 void __inc_node_page_state(struct page *, enum node_stat_item); 274 void __dec_node_page_state(struct page *, enum node_stat_item); 275 276 void mod_zone_page_state(struct zone *, enum zone_stat_item, long); 277 void inc_zone_page_state(struct page *, enum zone_stat_item); 278 void dec_zone_page_state(struct page *, enum zone_stat_item); 279 280 void mod_node_page_state(struct pglist_data *, enum node_stat_item, long); 281 void inc_node_page_state(struct page *, enum node_stat_item); 282 void dec_node_page_state(struct page *, enum node_stat_item); 283 284 extern void inc_node_state(struct pglist_data *, enum node_stat_item); 285 extern void __inc_zone_state(struct zone *, enum zone_stat_item); 286 extern void __inc_node_state(struct pglist_data *, enum node_stat_item); 287 extern void dec_zone_state(struct zone *, enum zone_stat_item); 288 extern void __dec_zone_state(struct zone *, enum zone_stat_item); 289 extern void __dec_node_state(struct pglist_data *, enum node_stat_item); 290 291 void quiet_vmstat(void); 292 void cpu_vm_stats_fold(int cpu); 293 void refresh_zone_stat_thresholds(void); 294 295 struct ctl_table; 296 int vmstat_refresh(struct ctl_table *, int write, void *buffer, size_t *lenp, 297 loff_t *ppos); 298 299 void drain_zonestat(struct zone *zone, struct per_cpu_zonestat *); 300 301 int calculate_pressure_threshold(struct zone *zone); 302 int calculate_normal_threshold(struct zone *zone); 303 void set_pgdat_percpu_threshold(pg_data_t *pgdat, 304 int (*calculate_pressure)(struct zone *)); 305 #else /* CONFIG_SMP */ 306 307 /* 308 * We do not maintain differentials in a single processor configuration. 309 * The functions directly modify the zone and global counters. 310 */ 311 static inline void __mod_zone_page_state(struct zone *zone, 312 enum zone_stat_item item, long delta) 313 { 314 zone_page_state_add(delta, zone, item); 315 } 316 317 static inline void __mod_node_page_state(struct pglist_data *pgdat, 318 enum node_stat_item item, int delta) 319 { 320 if (vmstat_item_in_bytes(item)) { 321 /* 322 * Only cgroups use subpage accounting right now; at 323 * the global level, these items still change in 324 * multiples of whole pages. Store them as pages 325 * internally to keep the per-cpu counters compact. 326 */ 327 VM_WARN_ON_ONCE(delta & (PAGE_SIZE - 1)); 328 delta >>= PAGE_SHIFT; 329 } 330 331 node_page_state_add(delta, pgdat, item); 332 } 333 334 static inline void __inc_zone_state(struct zone *zone, enum zone_stat_item item) 335 { 336 atomic_long_inc(&zone->vm_stat[item]); 337 atomic_long_inc(&vm_zone_stat[item]); 338 } 339 340 static inline void __inc_node_state(struct pglist_data *pgdat, enum node_stat_item item) 341 { 342 atomic_long_inc(&pgdat->vm_stat[item]); 343 atomic_long_inc(&vm_node_stat[item]); 344 } 345 346 static inline void __dec_zone_state(struct zone *zone, enum zone_stat_item item) 347 { 348 atomic_long_dec(&zone->vm_stat[item]); 349 atomic_long_dec(&vm_zone_stat[item]); 350 } 351 352 static inline void __dec_node_state(struct pglist_data *pgdat, enum node_stat_item item) 353 { 354 atomic_long_dec(&pgdat->vm_stat[item]); 355 atomic_long_dec(&vm_node_stat[item]); 356 } 357 358 static inline void __inc_zone_page_state(struct page *page, 359 enum zone_stat_item item) 360 { 361 __inc_zone_state(page_zone(page), item); 362 } 363 364 static inline void __inc_node_page_state(struct page *page, 365 enum node_stat_item item) 366 { 367 __inc_node_state(page_pgdat(page), item); 368 } 369 370 371 static inline void __dec_zone_page_state(struct page *page, 372 enum zone_stat_item item) 373 { 374 __dec_zone_state(page_zone(page), item); 375 } 376 377 static inline void __dec_node_page_state(struct page *page, 378 enum node_stat_item item) 379 { 380 __dec_node_state(page_pgdat(page), item); 381 } 382 383 384 /* 385 * We only use atomic operations to update counters. So there is no need to 386 * disable interrupts. 387 */ 388 #define inc_zone_page_state __inc_zone_page_state 389 #define dec_zone_page_state __dec_zone_page_state 390 #define mod_zone_page_state __mod_zone_page_state 391 392 #define inc_node_page_state __inc_node_page_state 393 #define dec_node_page_state __dec_node_page_state 394 #define mod_node_page_state __mod_node_page_state 395 396 #define inc_zone_state __inc_zone_state 397 #define inc_node_state __inc_node_state 398 #define dec_zone_state __dec_zone_state 399 400 #define set_pgdat_percpu_threshold(pgdat, callback) { } 401 402 static inline void refresh_zone_stat_thresholds(void) { } 403 static inline void cpu_vm_stats_fold(int cpu) { } 404 static inline void quiet_vmstat(void) { } 405 406 static inline void drain_zonestat(struct zone *zone, 407 struct per_cpu_zonestat *pzstats) { } 408 #endif /* CONFIG_SMP */ 409 410 static inline void __mod_zone_freepage_state(struct zone *zone, int nr_pages, 411 int migratetype) 412 { 413 __mod_zone_page_state(zone, NR_FREE_PAGES, nr_pages); 414 if (is_migrate_cma(migratetype)) 415 __mod_zone_page_state(zone, NR_FREE_CMA_PAGES, nr_pages); 416 } 417 418 extern const char * const vmstat_text[]; 419 420 static inline const char *zone_stat_name(enum zone_stat_item item) 421 { 422 return vmstat_text[item]; 423 } 424 425 #ifdef CONFIG_NUMA 426 static inline const char *numa_stat_name(enum numa_stat_item item) 427 { 428 return vmstat_text[NR_VM_ZONE_STAT_ITEMS + 429 item]; 430 } 431 #endif /* CONFIG_NUMA */ 432 433 static inline const char *node_stat_name(enum node_stat_item item) 434 { 435 return vmstat_text[NR_VM_ZONE_STAT_ITEMS + 436 NR_VM_NUMA_EVENT_ITEMS + 437 item]; 438 } 439 440 static inline const char *lru_list_name(enum lru_list lru) 441 { 442 return node_stat_name(NR_LRU_BASE + lru) + 3; // skip "nr_" 443 } 444 445 static inline const char *writeback_stat_name(enum writeback_stat_item item) 446 { 447 return vmstat_text[NR_VM_ZONE_STAT_ITEMS + 448 NR_VM_NUMA_EVENT_ITEMS + 449 NR_VM_NODE_STAT_ITEMS + 450 item]; 451 } 452 453 #if defined(CONFIG_VM_EVENT_COUNTERS) || defined(CONFIG_MEMCG) 454 static inline const char *vm_event_name(enum vm_event_item item) 455 { 456 return vmstat_text[NR_VM_ZONE_STAT_ITEMS + 457 NR_VM_NUMA_EVENT_ITEMS + 458 NR_VM_NODE_STAT_ITEMS + 459 NR_VM_WRITEBACK_STAT_ITEMS + 460 item]; 461 } 462 #endif /* CONFIG_VM_EVENT_COUNTERS || CONFIG_MEMCG */ 463 464 #ifdef CONFIG_MEMCG 465 466 void __mod_lruvec_state(struct lruvec *lruvec, enum node_stat_item idx, 467 int val); 468 469 static inline void mod_lruvec_state(struct lruvec *lruvec, 470 enum node_stat_item idx, int val) 471 { 472 unsigned long flags; 473 474 local_irq_save(flags); 475 __mod_lruvec_state(lruvec, idx, val); 476 local_irq_restore(flags); 477 } 478 479 void __mod_lruvec_page_state(struct page *page, 480 enum node_stat_item idx, int val); 481 482 static inline void mod_lruvec_page_state(struct page *page, 483 enum node_stat_item idx, int val) 484 { 485 unsigned long flags; 486 487 local_irq_save(flags); 488 __mod_lruvec_page_state(page, idx, val); 489 local_irq_restore(flags); 490 } 491 492 #else 493 494 static inline void __mod_lruvec_state(struct lruvec *lruvec, 495 enum node_stat_item idx, int val) 496 { 497 __mod_node_page_state(lruvec_pgdat(lruvec), idx, val); 498 } 499 500 static inline void mod_lruvec_state(struct lruvec *lruvec, 501 enum node_stat_item idx, int val) 502 { 503 mod_node_page_state(lruvec_pgdat(lruvec), idx, val); 504 } 505 506 static inline void __mod_lruvec_page_state(struct page *page, 507 enum node_stat_item idx, int val) 508 { 509 __mod_node_page_state(page_pgdat(page), idx, val); 510 } 511 512 static inline void mod_lruvec_page_state(struct page *page, 513 enum node_stat_item idx, int val) 514 { 515 mod_node_page_state(page_pgdat(page), idx, val); 516 } 517 518 #endif /* CONFIG_MEMCG */ 519 520 static inline void inc_lruvec_state(struct lruvec *lruvec, 521 enum node_stat_item idx) 522 { 523 mod_lruvec_state(lruvec, idx, 1); 524 } 525 526 static inline void __inc_lruvec_page_state(struct page *page, 527 enum node_stat_item idx) 528 { 529 __mod_lruvec_page_state(page, idx, 1); 530 } 531 532 static inline void __dec_lruvec_page_state(struct page *page, 533 enum node_stat_item idx) 534 { 535 __mod_lruvec_page_state(page, idx, -1); 536 } 537 538 static inline void inc_lruvec_page_state(struct page *page, 539 enum node_stat_item idx) 540 { 541 mod_lruvec_page_state(page, idx, 1); 542 } 543 544 static inline void dec_lruvec_page_state(struct page *page, 545 enum node_stat_item idx) 546 { 547 mod_lruvec_page_state(page, idx, -1); 548 } 549 550 #endif /* _LINUX_VMSTAT_H */ 551