11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * include/linux/backing-dev.h 31da177e4SLinus Torvalds * 41da177e4SLinus Torvalds * low-level device information and state which is propagated up through 51da177e4SLinus Torvalds * to high-level code. 61da177e4SLinus Torvalds */ 71da177e4SLinus Torvalds 81da177e4SLinus Torvalds #ifndef _LINUX_BACKING_DEV_H 91da177e4SLinus Torvalds #define _LINUX_BACKING_DEV_H 101da177e4SLinus Torvalds 11b2e8fb6eSPeter Zijlstra #include <linux/percpu_counter.h> 12b2e8fb6eSPeter Zijlstra #include <linux/log2.h> 1304fbfdc1SPeter Zijlstra #include <linux/proportions.h> 14cf0ca9feSPeter Zijlstra #include <linux/kernel.h> 15e4ad08feSMiklos Szeredi #include <linux/fs.h> 1603ba3782SJens Axboe #include <linux/sched.h> 1703ba3782SJens Axboe #include <linux/writeback.h> 181da177e4SLinus Torvalds #include <asm/atomic.h> 191da177e4SLinus Torvalds 203fcfab16SAndrew Morton struct page; 21cf0ca9feSPeter Zijlstra struct device; 2276f1418bSMiklos Szeredi struct dentry; 233fcfab16SAndrew Morton 241da177e4SLinus Torvalds /* 251da177e4SLinus Torvalds * Bits in backing_dev_info.state 261da177e4SLinus Torvalds */ 271da177e4SLinus Torvalds enum bdi_state { 2803ba3782SJens Axboe BDI_pending, /* On its way to being activated */ 2903ba3782SJens Axboe BDI_wb_alloc, /* Default embedded wb allocated */ 301faa16d2SJens Axboe BDI_async_congested, /* The async (write) queue is getting full */ 311faa16d2SJens Axboe BDI_sync_congested, /* The sync queue is getting full */ 32500b067cSJens Axboe BDI_registered, /* bdi_register() was done */ 331da177e4SLinus Torvalds BDI_unused, /* Available bits start here */ 341da177e4SLinus Torvalds }; 351da177e4SLinus Torvalds 361da177e4SLinus Torvalds typedef int (congested_fn)(void *, int); 371da177e4SLinus Torvalds 38b2e8fb6eSPeter Zijlstra enum bdi_stat_item { 39c9e51e41SPeter Zijlstra BDI_RECLAIMABLE, 4069cb51d1SPeter Zijlstra BDI_WRITEBACK, 41b2e8fb6eSPeter Zijlstra NR_BDI_STAT_ITEMS 42b2e8fb6eSPeter Zijlstra }; 43b2e8fb6eSPeter Zijlstra 44b2e8fb6eSPeter Zijlstra #define BDI_STAT_BATCH (8*(1+ilog2(nr_cpu_ids))) 45b2e8fb6eSPeter Zijlstra 4603ba3782SJens Axboe struct bdi_writeback { 4703ba3782SJens Axboe struct list_head list; /* hangs off the bdi */ 4803ba3782SJens Axboe 4903ba3782SJens Axboe struct backing_dev_info *bdi; /* our parent bdi */ 5003ba3782SJens Axboe unsigned int nr; 5103ba3782SJens Axboe 5203ba3782SJens Axboe unsigned long last_old_flush; /* last old data flush */ 5303ba3782SJens Axboe 5403ba3782SJens Axboe struct task_struct *task; /* writeback task */ 5503ba3782SJens Axboe struct list_head b_dirty; /* dirty inodes */ 5603ba3782SJens Axboe struct list_head b_io; /* parked for writeback */ 5703ba3782SJens Axboe struct list_head b_more_io; /* parked for more writeback */ 5803ba3782SJens Axboe }; 5903ba3782SJens Axboe 601da177e4SLinus Torvalds struct backing_dev_info { 6166f3b8e2SJens Axboe struct list_head bdi_list; 62cfc4ba53SJens Axboe struct rcu_head rcu_head; 631da177e4SLinus Torvalds unsigned long ra_pages; /* max readahead in PAGE_CACHE_SIZE units */ 641da177e4SLinus Torvalds unsigned long state; /* Always use atomic bitops on this */ 651da177e4SLinus Torvalds unsigned int capabilities; /* Device capabilities */ 661da177e4SLinus Torvalds congested_fn *congested_fn; /* Function pointer if device is md/dm */ 671da177e4SLinus Torvalds void *congested_data; /* Pointer to aux data for congested func */ 681da177e4SLinus Torvalds void (*unplug_io_fn)(struct backing_dev_info *, struct page *); 691da177e4SLinus Torvalds void *unplug_io_data; 70b2e8fb6eSPeter Zijlstra 71d993831fSJens Axboe char *name; 72d993831fSJens Axboe 73b2e8fb6eSPeter Zijlstra struct percpu_counter bdi_stat[NR_BDI_STAT_ITEMS]; 7404fbfdc1SPeter Zijlstra 7504fbfdc1SPeter Zijlstra struct prop_local_percpu completions; 7604fbfdc1SPeter Zijlstra int dirty_exceeded; 77cf0ca9feSPeter Zijlstra 78189d3c4aSPeter Zijlstra unsigned int min_ratio; 79a42dde04SPeter Zijlstra unsigned int max_ratio, max_prop_frac; 80189d3c4aSPeter Zijlstra 8103ba3782SJens Axboe struct bdi_writeback wb; /* default writeback info for this bdi */ 8203ba3782SJens Axboe spinlock_t wb_lock; /* protects update side of wb_list */ 8303ba3782SJens Axboe struct list_head wb_list; /* the flusher threads hanging off this bdi */ 8403ba3782SJens Axboe unsigned long wb_mask; /* bitmask of registered tasks */ 8503ba3782SJens Axboe unsigned int wb_cnt; /* number of registered tasks */ 8676f1418bSMiklos Szeredi 8703ba3782SJens Axboe struct list_head work_list; 8803ba3782SJens Axboe 8903ba3782SJens Axboe struct device *dev; 9066f3b8e2SJens Axboe 9176f1418bSMiklos Szeredi #ifdef CONFIG_DEBUG_FS 9276f1418bSMiklos Szeredi struct dentry *debug_dir; 9376f1418bSMiklos Szeredi struct dentry *debug_stats; 9476f1418bSMiklos Szeredi #endif 951da177e4SLinus Torvalds }; 961da177e4SLinus Torvalds 97b2e8fb6eSPeter Zijlstra int bdi_init(struct backing_dev_info *bdi); 98b2e8fb6eSPeter Zijlstra void bdi_destroy(struct backing_dev_info *bdi); 99b2e8fb6eSPeter Zijlstra 100cf0ca9feSPeter Zijlstra int bdi_register(struct backing_dev_info *bdi, struct device *parent, 101cf0ca9feSPeter Zijlstra const char *fmt, ...); 102cf0ca9feSPeter Zijlstra int bdi_register_dev(struct backing_dev_info *bdi, dev_t dev); 103cf0ca9feSPeter Zijlstra void bdi_unregister(struct backing_dev_info *bdi); 104*a72bfd4dSJens Axboe void bdi_start_writeback(struct backing_dev_info *bdi, struct super_block *sb, 105*a72bfd4dSJens Axboe long nr_pages); 10603ba3782SJens Axboe int bdi_writeback_task(struct bdi_writeback *wb); 10703ba3782SJens Axboe int bdi_has_dirty_io(struct backing_dev_info *bdi); 108cf0ca9feSPeter Zijlstra 10903ba3782SJens Axboe extern spinlock_t bdi_lock; 11066f3b8e2SJens Axboe extern struct list_head bdi_list; 11166f3b8e2SJens Axboe 11203ba3782SJens Axboe static inline int wb_has_dirty_io(struct bdi_writeback *wb) 11303ba3782SJens Axboe { 11403ba3782SJens Axboe return !list_empty(&wb->b_dirty) || 11503ba3782SJens Axboe !list_empty(&wb->b_io) || 11603ba3782SJens Axboe !list_empty(&wb->b_more_io); 11703ba3782SJens Axboe } 11803ba3782SJens Axboe 119b2e8fb6eSPeter Zijlstra static inline void __add_bdi_stat(struct backing_dev_info *bdi, 120b2e8fb6eSPeter Zijlstra enum bdi_stat_item item, s64 amount) 121e0bf68ddSPeter Zijlstra { 122b2e8fb6eSPeter Zijlstra __percpu_counter_add(&bdi->bdi_stat[item], amount, BDI_STAT_BATCH); 123e0bf68ddSPeter Zijlstra } 124e0bf68ddSPeter Zijlstra 125b2e8fb6eSPeter Zijlstra static inline void __inc_bdi_stat(struct backing_dev_info *bdi, 126b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 127e0bf68ddSPeter Zijlstra { 128b2e8fb6eSPeter Zijlstra __add_bdi_stat(bdi, item, 1); 129b2e8fb6eSPeter Zijlstra } 130b2e8fb6eSPeter Zijlstra 131b2e8fb6eSPeter Zijlstra static inline void inc_bdi_stat(struct backing_dev_info *bdi, 132b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 133b2e8fb6eSPeter Zijlstra { 134b2e8fb6eSPeter Zijlstra unsigned long flags; 135b2e8fb6eSPeter Zijlstra 136b2e8fb6eSPeter Zijlstra local_irq_save(flags); 137b2e8fb6eSPeter Zijlstra __inc_bdi_stat(bdi, item); 138b2e8fb6eSPeter Zijlstra local_irq_restore(flags); 139b2e8fb6eSPeter Zijlstra } 140b2e8fb6eSPeter Zijlstra 141b2e8fb6eSPeter Zijlstra static inline void __dec_bdi_stat(struct backing_dev_info *bdi, 142b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 143b2e8fb6eSPeter Zijlstra { 144b2e8fb6eSPeter Zijlstra __add_bdi_stat(bdi, item, -1); 145b2e8fb6eSPeter Zijlstra } 146b2e8fb6eSPeter Zijlstra 147b2e8fb6eSPeter Zijlstra static inline void dec_bdi_stat(struct backing_dev_info *bdi, 148b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 149b2e8fb6eSPeter Zijlstra { 150b2e8fb6eSPeter Zijlstra unsigned long flags; 151b2e8fb6eSPeter Zijlstra 152b2e8fb6eSPeter Zijlstra local_irq_save(flags); 153b2e8fb6eSPeter Zijlstra __dec_bdi_stat(bdi, item); 154b2e8fb6eSPeter Zijlstra local_irq_restore(flags); 155b2e8fb6eSPeter Zijlstra } 156b2e8fb6eSPeter Zijlstra 157b2e8fb6eSPeter Zijlstra static inline s64 bdi_stat(struct backing_dev_info *bdi, 158b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 159b2e8fb6eSPeter Zijlstra { 160b2e8fb6eSPeter Zijlstra return percpu_counter_read_positive(&bdi->bdi_stat[item]); 161b2e8fb6eSPeter Zijlstra } 162b2e8fb6eSPeter Zijlstra 163b2e8fb6eSPeter Zijlstra static inline s64 __bdi_stat_sum(struct backing_dev_info *bdi, 164b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 165b2e8fb6eSPeter Zijlstra { 166b2e8fb6eSPeter Zijlstra return percpu_counter_sum_positive(&bdi->bdi_stat[item]); 167b2e8fb6eSPeter Zijlstra } 168b2e8fb6eSPeter Zijlstra 169b2e8fb6eSPeter Zijlstra static inline s64 bdi_stat_sum(struct backing_dev_info *bdi, 170b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 171b2e8fb6eSPeter Zijlstra { 172b2e8fb6eSPeter Zijlstra s64 sum; 173b2e8fb6eSPeter Zijlstra unsigned long flags; 174b2e8fb6eSPeter Zijlstra 175b2e8fb6eSPeter Zijlstra local_irq_save(flags); 176b2e8fb6eSPeter Zijlstra sum = __bdi_stat_sum(bdi, item); 177b2e8fb6eSPeter Zijlstra local_irq_restore(flags); 178b2e8fb6eSPeter Zijlstra 179b2e8fb6eSPeter Zijlstra return sum; 180b2e8fb6eSPeter Zijlstra } 181b2e8fb6eSPeter Zijlstra 182dd5656e5SMiklos Szeredi extern void bdi_writeout_inc(struct backing_dev_info *bdi); 183dd5656e5SMiklos Szeredi 184b2e8fb6eSPeter Zijlstra /* 185b2e8fb6eSPeter Zijlstra * maximal error of a stat counter. 186b2e8fb6eSPeter Zijlstra */ 187b2e8fb6eSPeter Zijlstra static inline unsigned long bdi_stat_error(struct backing_dev_info *bdi) 188b2e8fb6eSPeter Zijlstra { 189b2e8fb6eSPeter Zijlstra #ifdef CONFIG_SMP 190b2e8fb6eSPeter Zijlstra return nr_cpu_ids * BDI_STAT_BATCH; 191b2e8fb6eSPeter Zijlstra #else 192b2e8fb6eSPeter Zijlstra return 1; 193b2e8fb6eSPeter Zijlstra #endif 194e0bf68ddSPeter Zijlstra } 1951da177e4SLinus Torvalds 196189d3c4aSPeter Zijlstra int bdi_set_min_ratio(struct backing_dev_info *bdi, unsigned int min_ratio); 197a42dde04SPeter Zijlstra int bdi_set_max_ratio(struct backing_dev_info *bdi, unsigned int max_ratio); 198189d3c4aSPeter Zijlstra 1991da177e4SLinus Torvalds /* 2001da177e4SLinus Torvalds * Flags in backing_dev_info::capability 201e4ad08feSMiklos Szeredi * 202e4ad08feSMiklos Szeredi * The first three flags control whether dirty pages will contribute to the 2031da177e4SLinus Torvalds * VM's accounting and whether writepages() should be called for dirty pages 2041da177e4SLinus Torvalds * (something that would not, for example, be appropriate for ramfs) 205e4ad08feSMiklos Szeredi * 206e4ad08feSMiklos Szeredi * WARNING: these flags are closely related and should not normally be 207e4ad08feSMiklos Szeredi * used separately. The BDI_CAP_NO_ACCT_AND_WRITEBACK combines these 208e4ad08feSMiklos Szeredi * three flags into a single convenience macro. 209e4ad08feSMiklos Szeredi * 210e4ad08feSMiklos Szeredi * BDI_CAP_NO_ACCT_DIRTY: Dirty pages shouldn't contribute to accounting 211e4ad08feSMiklos Szeredi * BDI_CAP_NO_WRITEBACK: Don't write pages back 212e4ad08feSMiklos Szeredi * BDI_CAP_NO_ACCT_WB: Don't automatically account writeback pages 213e4ad08feSMiklos Szeredi * 214e4ad08feSMiklos Szeredi * These flags let !MMU mmap() govern direct device mapping vs immediate 215e4ad08feSMiklos Szeredi * copying more easily for MAP_PRIVATE, especially for ROM filesystems. 216e4ad08feSMiklos Szeredi * 217e4ad08feSMiklos Szeredi * BDI_CAP_MAP_COPY: Copy can be mapped (MAP_PRIVATE) 218e4ad08feSMiklos Szeredi * BDI_CAP_MAP_DIRECT: Can be mapped directly (MAP_SHARED) 219e4ad08feSMiklos Szeredi * BDI_CAP_READ_MAP: Can be mapped for reading 220e4ad08feSMiklos Szeredi * BDI_CAP_WRITE_MAP: Can be mapped for writing 221e4ad08feSMiklos Szeredi * BDI_CAP_EXEC_MAP: Can be mapped for execution 2224f98a2feSRik van Riel * 2234f98a2feSRik van Riel * BDI_CAP_SWAP_BACKED: Count shmem/tmpfs objects as swap-backed. 2241da177e4SLinus Torvalds */ 225e4ad08feSMiklos Szeredi #define BDI_CAP_NO_ACCT_DIRTY 0x00000001 226e4ad08feSMiklos Szeredi #define BDI_CAP_NO_WRITEBACK 0x00000002 227e4ad08feSMiklos Szeredi #define BDI_CAP_MAP_COPY 0x00000004 228e4ad08feSMiklos Szeredi #define BDI_CAP_MAP_DIRECT 0x00000008 229e4ad08feSMiklos Szeredi #define BDI_CAP_READ_MAP 0x00000010 230e4ad08feSMiklos Szeredi #define BDI_CAP_WRITE_MAP 0x00000020 231e4ad08feSMiklos Szeredi #define BDI_CAP_EXEC_MAP 0x00000040 232e4ad08feSMiklos Szeredi #define BDI_CAP_NO_ACCT_WB 0x00000080 2334f98a2feSRik van Riel #define BDI_CAP_SWAP_BACKED 0x00000100 234e4ad08feSMiklos Szeredi 2351da177e4SLinus Torvalds #define BDI_CAP_VMFLAGS \ 2361da177e4SLinus Torvalds (BDI_CAP_READ_MAP | BDI_CAP_WRITE_MAP | BDI_CAP_EXEC_MAP) 2371da177e4SLinus Torvalds 238e4ad08feSMiklos Szeredi #define BDI_CAP_NO_ACCT_AND_WRITEBACK \ 239e4ad08feSMiklos Szeredi (BDI_CAP_NO_WRITEBACK | BDI_CAP_NO_ACCT_DIRTY | BDI_CAP_NO_ACCT_WB) 240e4ad08feSMiklos Szeredi 2411da177e4SLinus Torvalds #if defined(VM_MAYREAD) && \ 2421da177e4SLinus Torvalds (BDI_CAP_READ_MAP != VM_MAYREAD || \ 2431da177e4SLinus Torvalds BDI_CAP_WRITE_MAP != VM_MAYWRITE || \ 2441da177e4SLinus Torvalds BDI_CAP_EXEC_MAP != VM_MAYEXEC) 2451da177e4SLinus Torvalds #error please change backing_dev_info::capabilities flags 2461da177e4SLinus Torvalds #endif 2471da177e4SLinus Torvalds 2481da177e4SLinus Torvalds extern struct backing_dev_info default_backing_dev_info; 2491da177e4SLinus Torvalds void default_unplug_io_fn(struct backing_dev_info *bdi, struct page *page); 2501da177e4SLinus Torvalds 2511da177e4SLinus Torvalds int writeback_in_progress(struct backing_dev_info *bdi); 2521da177e4SLinus Torvalds 2531da177e4SLinus Torvalds static inline int bdi_congested(struct backing_dev_info *bdi, int bdi_bits) 2541da177e4SLinus Torvalds { 2551da177e4SLinus Torvalds if (bdi->congested_fn) 2561da177e4SLinus Torvalds return bdi->congested_fn(bdi->congested_data, bdi_bits); 2571da177e4SLinus Torvalds return (bdi->state & bdi_bits); 2581da177e4SLinus Torvalds } 2591da177e4SLinus Torvalds 2601da177e4SLinus Torvalds static inline int bdi_read_congested(struct backing_dev_info *bdi) 2611da177e4SLinus Torvalds { 2621faa16d2SJens Axboe return bdi_congested(bdi, 1 << BDI_sync_congested); 2631da177e4SLinus Torvalds } 2641da177e4SLinus Torvalds 2651da177e4SLinus Torvalds static inline int bdi_write_congested(struct backing_dev_info *bdi) 2661da177e4SLinus Torvalds { 2671faa16d2SJens Axboe return bdi_congested(bdi, 1 << BDI_async_congested); 2681da177e4SLinus Torvalds } 2691da177e4SLinus Torvalds 2701da177e4SLinus Torvalds static inline int bdi_rw_congested(struct backing_dev_info *bdi) 2711da177e4SLinus Torvalds { 2721faa16d2SJens Axboe return bdi_congested(bdi, (1 << BDI_sync_congested) | 2731faa16d2SJens Axboe (1 << BDI_async_congested)); 2741da177e4SLinus Torvalds } 2751da177e4SLinus Torvalds 276373c0a7eSTrond Myklebust enum { 277373c0a7eSTrond Myklebust BLK_RW_ASYNC = 0, 278373c0a7eSTrond Myklebust BLK_RW_SYNC = 1, 279373c0a7eSTrond Myklebust }; 280373c0a7eSTrond Myklebust 2818aa7e847SJens Axboe void clear_bdi_congested(struct backing_dev_info *bdi, int sync); 2828aa7e847SJens Axboe void set_bdi_congested(struct backing_dev_info *bdi, int sync); 2838aa7e847SJens Axboe long congestion_wait(int sync, long timeout); 2843fcfab16SAndrew Morton 2851da177e4SLinus Torvalds 286e4ad08feSMiklos Szeredi static inline bool bdi_cap_writeback_dirty(struct backing_dev_info *bdi) 287e4ad08feSMiklos Szeredi { 288e4ad08feSMiklos Szeredi return !(bdi->capabilities & BDI_CAP_NO_WRITEBACK); 289e4ad08feSMiklos Szeredi } 2901da177e4SLinus Torvalds 291e4ad08feSMiklos Szeredi static inline bool bdi_cap_account_dirty(struct backing_dev_info *bdi) 292e4ad08feSMiklos Szeredi { 293e4ad08feSMiklos Szeredi return !(bdi->capabilities & BDI_CAP_NO_ACCT_DIRTY); 294e4ad08feSMiklos Szeredi } 2951da177e4SLinus Torvalds 296e4ad08feSMiklos Szeredi static inline bool bdi_cap_account_writeback(struct backing_dev_info *bdi) 297e4ad08feSMiklos Szeredi { 298e4ad08feSMiklos Szeredi /* Paranoia: BDI_CAP_NO_WRITEBACK implies BDI_CAP_NO_ACCT_WB */ 299e4ad08feSMiklos Szeredi return !(bdi->capabilities & (BDI_CAP_NO_ACCT_WB | 300e4ad08feSMiklos Szeredi BDI_CAP_NO_WRITEBACK)); 301e4ad08feSMiklos Szeredi } 3021da177e4SLinus Torvalds 3034f98a2feSRik van Riel static inline bool bdi_cap_swap_backed(struct backing_dev_info *bdi) 3044f98a2feSRik van Riel { 3054f98a2feSRik van Riel return bdi->capabilities & BDI_CAP_SWAP_BACKED; 3064f98a2feSRik van Riel } 3074f98a2feSRik van Riel 30803ba3782SJens Axboe static inline bool bdi_cap_flush_forker(struct backing_dev_info *bdi) 30903ba3782SJens Axboe { 31003ba3782SJens Axboe return bdi == &default_backing_dev_info; 31103ba3782SJens Axboe } 31203ba3782SJens Axboe 313e4ad08feSMiklos Szeredi static inline bool mapping_cap_writeback_dirty(struct address_space *mapping) 314e4ad08feSMiklos Szeredi { 315e4ad08feSMiklos Szeredi return bdi_cap_writeback_dirty(mapping->backing_dev_info); 316e4ad08feSMiklos Szeredi } 317e4ad08feSMiklos Szeredi 318e4ad08feSMiklos Szeredi static inline bool mapping_cap_account_dirty(struct address_space *mapping) 319e4ad08feSMiklos Szeredi { 320e4ad08feSMiklos Szeredi return bdi_cap_account_dirty(mapping->backing_dev_info); 321e4ad08feSMiklos Szeredi } 3221da177e4SLinus Torvalds 3234f98a2feSRik van Riel static inline bool mapping_cap_swap_backed(struct address_space *mapping) 3244f98a2feSRik van Riel { 3254f98a2feSRik van Riel return bdi_cap_swap_backed(mapping->backing_dev_info); 3264f98a2feSRik van Riel } 3274f98a2feSRik van Riel 32803ba3782SJens Axboe static inline int bdi_sched_wait(void *word) 32903ba3782SJens Axboe { 33003ba3782SJens Axboe schedule(); 33103ba3782SJens Axboe return 0; 33203ba3782SJens Axboe } 33303ba3782SJens Axboe 3341da177e4SLinus Torvalds #endif /* _LINUX_BACKING_DEV_H */ 335