11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * include/linux/backing-dev.h 31da177e4SLinus Torvalds * 41da177e4SLinus Torvalds * low-level device information and state which is propagated up through 51da177e4SLinus Torvalds * to high-level code. 61da177e4SLinus Torvalds */ 71da177e4SLinus Torvalds 81da177e4SLinus Torvalds #ifndef _LINUX_BACKING_DEV_H 91da177e4SLinus Torvalds #define _LINUX_BACKING_DEV_H 101da177e4SLinus Torvalds 11b2e8fb6eSPeter Zijlstra #include <linux/percpu_counter.h> 12b2e8fb6eSPeter Zijlstra #include <linux/log2.h> 1304fbfdc1SPeter Zijlstra #include <linux/proportions.h> 14cf0ca9feSPeter Zijlstra #include <linux/kernel.h> 15e4ad08feSMiklos Szeredi #include <linux/fs.h> 1603ba3782SJens Axboe #include <linux/sched.h> 1703ba3782SJens Axboe #include <linux/writeback.h> 181da177e4SLinus Torvalds #include <asm/atomic.h> 191da177e4SLinus Torvalds 203fcfab16SAndrew Morton struct page; 21cf0ca9feSPeter Zijlstra struct device; 2276f1418bSMiklos Szeredi struct dentry; 233fcfab16SAndrew Morton 241da177e4SLinus Torvalds /* 251da177e4SLinus Torvalds * Bits in backing_dev_info.state 261da177e4SLinus Torvalds */ 271da177e4SLinus Torvalds enum bdi_state { 2803ba3782SJens Axboe BDI_pending, /* On its way to being activated */ 2903ba3782SJens Axboe BDI_wb_alloc, /* Default embedded wb allocated */ 301faa16d2SJens Axboe BDI_async_congested, /* The async (write) queue is getting full */ 311faa16d2SJens Axboe BDI_sync_congested, /* The sync queue is getting full */ 32500b067cSJens Axboe BDI_registered, /* bdi_register() was done */ 331da177e4SLinus Torvalds BDI_unused, /* Available bits start here */ 341da177e4SLinus Torvalds }; 351da177e4SLinus Torvalds 361da177e4SLinus Torvalds typedef int (congested_fn)(void *, int); 371da177e4SLinus Torvalds 38b2e8fb6eSPeter Zijlstra enum bdi_stat_item { 39c9e51e41SPeter Zijlstra BDI_RECLAIMABLE, 4069cb51d1SPeter Zijlstra BDI_WRITEBACK, 41b2e8fb6eSPeter Zijlstra NR_BDI_STAT_ITEMS 42b2e8fb6eSPeter Zijlstra }; 43b2e8fb6eSPeter Zijlstra 44b2e8fb6eSPeter Zijlstra #define BDI_STAT_BATCH (8*(1+ilog2(nr_cpu_ids))) 45b2e8fb6eSPeter Zijlstra 4603ba3782SJens Axboe struct bdi_writeback { 4703ba3782SJens Axboe struct list_head list; /* hangs off the bdi */ 4803ba3782SJens Axboe 4903ba3782SJens Axboe struct backing_dev_info *bdi; /* our parent bdi */ 5003ba3782SJens Axboe unsigned int nr; 5103ba3782SJens Axboe 5203ba3782SJens Axboe unsigned long last_old_flush; /* last old data flush */ 5303ba3782SJens Axboe 5403ba3782SJens Axboe struct task_struct *task; /* writeback task */ 5503ba3782SJens Axboe struct list_head b_dirty; /* dirty inodes */ 5603ba3782SJens Axboe struct list_head b_io; /* parked for writeback */ 5703ba3782SJens Axboe struct list_head b_more_io; /* parked for more writeback */ 5803ba3782SJens Axboe }; 5903ba3782SJens Axboe 601da177e4SLinus Torvalds struct backing_dev_info { 6166f3b8e2SJens Axboe struct list_head bdi_list; 62*cfc4ba53SJens Axboe struct rcu_head rcu_head; 631da177e4SLinus Torvalds unsigned long ra_pages; /* max readahead in PAGE_CACHE_SIZE units */ 641da177e4SLinus Torvalds unsigned long state; /* Always use atomic bitops on this */ 651da177e4SLinus Torvalds unsigned int capabilities; /* Device capabilities */ 661da177e4SLinus Torvalds congested_fn *congested_fn; /* Function pointer if device is md/dm */ 671da177e4SLinus Torvalds void *congested_data; /* Pointer to aux data for congested func */ 681da177e4SLinus Torvalds void (*unplug_io_fn)(struct backing_dev_info *, struct page *); 691da177e4SLinus Torvalds void *unplug_io_data; 70b2e8fb6eSPeter Zijlstra 71d993831fSJens Axboe char *name; 72d993831fSJens Axboe 73b2e8fb6eSPeter Zijlstra struct percpu_counter bdi_stat[NR_BDI_STAT_ITEMS]; 7404fbfdc1SPeter Zijlstra 7504fbfdc1SPeter Zijlstra struct prop_local_percpu completions; 7604fbfdc1SPeter Zijlstra int dirty_exceeded; 77cf0ca9feSPeter Zijlstra 78189d3c4aSPeter Zijlstra unsigned int min_ratio; 79a42dde04SPeter Zijlstra unsigned int max_ratio, max_prop_frac; 80189d3c4aSPeter Zijlstra 8103ba3782SJens Axboe struct bdi_writeback wb; /* default writeback info for this bdi */ 8203ba3782SJens Axboe spinlock_t wb_lock; /* protects update side of wb_list */ 8303ba3782SJens Axboe struct list_head wb_list; /* the flusher threads hanging off this bdi */ 8403ba3782SJens Axboe unsigned long wb_mask; /* bitmask of registered tasks */ 8503ba3782SJens Axboe unsigned int wb_cnt; /* number of registered tasks */ 8676f1418bSMiklos Szeredi 8703ba3782SJens Axboe struct list_head work_list; 8803ba3782SJens Axboe 8903ba3782SJens Axboe struct device *dev; 9066f3b8e2SJens Axboe 9176f1418bSMiklos Szeredi #ifdef CONFIG_DEBUG_FS 9276f1418bSMiklos Szeredi struct dentry *debug_dir; 9376f1418bSMiklos Szeredi struct dentry *debug_stats; 9476f1418bSMiklos Szeredi #endif 951da177e4SLinus Torvalds }; 961da177e4SLinus Torvalds 97b2e8fb6eSPeter Zijlstra int bdi_init(struct backing_dev_info *bdi); 98b2e8fb6eSPeter Zijlstra void bdi_destroy(struct backing_dev_info *bdi); 99b2e8fb6eSPeter Zijlstra 100cf0ca9feSPeter Zijlstra int bdi_register(struct backing_dev_info *bdi, struct device *parent, 101cf0ca9feSPeter Zijlstra const char *fmt, ...); 102cf0ca9feSPeter Zijlstra int bdi_register_dev(struct backing_dev_info *bdi, dev_t dev); 103cf0ca9feSPeter Zijlstra void bdi_unregister(struct backing_dev_info *bdi); 10403ba3782SJens Axboe void bdi_start_writeback(struct writeback_control *wbc); 10503ba3782SJens Axboe int bdi_writeback_task(struct bdi_writeback *wb); 10603ba3782SJens Axboe int bdi_has_dirty_io(struct backing_dev_info *bdi); 107cf0ca9feSPeter Zijlstra 10803ba3782SJens Axboe extern spinlock_t bdi_lock; 10966f3b8e2SJens Axboe extern struct list_head bdi_list; 11066f3b8e2SJens Axboe 11103ba3782SJens Axboe static inline int wb_has_dirty_io(struct bdi_writeback *wb) 11203ba3782SJens Axboe { 11303ba3782SJens Axboe return !list_empty(&wb->b_dirty) || 11403ba3782SJens Axboe !list_empty(&wb->b_io) || 11503ba3782SJens Axboe !list_empty(&wb->b_more_io); 11603ba3782SJens Axboe } 11703ba3782SJens Axboe 118b2e8fb6eSPeter Zijlstra static inline void __add_bdi_stat(struct backing_dev_info *bdi, 119b2e8fb6eSPeter Zijlstra enum bdi_stat_item item, s64 amount) 120e0bf68ddSPeter Zijlstra { 121b2e8fb6eSPeter Zijlstra __percpu_counter_add(&bdi->bdi_stat[item], amount, BDI_STAT_BATCH); 122e0bf68ddSPeter Zijlstra } 123e0bf68ddSPeter Zijlstra 124b2e8fb6eSPeter Zijlstra static inline void __inc_bdi_stat(struct backing_dev_info *bdi, 125b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 126e0bf68ddSPeter Zijlstra { 127b2e8fb6eSPeter Zijlstra __add_bdi_stat(bdi, item, 1); 128b2e8fb6eSPeter Zijlstra } 129b2e8fb6eSPeter Zijlstra 130b2e8fb6eSPeter Zijlstra static inline void inc_bdi_stat(struct backing_dev_info *bdi, 131b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 132b2e8fb6eSPeter Zijlstra { 133b2e8fb6eSPeter Zijlstra unsigned long flags; 134b2e8fb6eSPeter Zijlstra 135b2e8fb6eSPeter Zijlstra local_irq_save(flags); 136b2e8fb6eSPeter Zijlstra __inc_bdi_stat(bdi, item); 137b2e8fb6eSPeter Zijlstra local_irq_restore(flags); 138b2e8fb6eSPeter Zijlstra } 139b2e8fb6eSPeter Zijlstra 140b2e8fb6eSPeter Zijlstra static inline void __dec_bdi_stat(struct backing_dev_info *bdi, 141b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 142b2e8fb6eSPeter Zijlstra { 143b2e8fb6eSPeter Zijlstra __add_bdi_stat(bdi, item, -1); 144b2e8fb6eSPeter Zijlstra } 145b2e8fb6eSPeter Zijlstra 146b2e8fb6eSPeter Zijlstra static inline void dec_bdi_stat(struct backing_dev_info *bdi, 147b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 148b2e8fb6eSPeter Zijlstra { 149b2e8fb6eSPeter Zijlstra unsigned long flags; 150b2e8fb6eSPeter Zijlstra 151b2e8fb6eSPeter Zijlstra local_irq_save(flags); 152b2e8fb6eSPeter Zijlstra __dec_bdi_stat(bdi, item); 153b2e8fb6eSPeter Zijlstra local_irq_restore(flags); 154b2e8fb6eSPeter Zijlstra } 155b2e8fb6eSPeter Zijlstra 156b2e8fb6eSPeter Zijlstra static inline s64 bdi_stat(struct backing_dev_info *bdi, 157b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 158b2e8fb6eSPeter Zijlstra { 159b2e8fb6eSPeter Zijlstra return percpu_counter_read_positive(&bdi->bdi_stat[item]); 160b2e8fb6eSPeter Zijlstra } 161b2e8fb6eSPeter Zijlstra 162b2e8fb6eSPeter Zijlstra static inline s64 __bdi_stat_sum(struct backing_dev_info *bdi, 163b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 164b2e8fb6eSPeter Zijlstra { 165b2e8fb6eSPeter Zijlstra return percpu_counter_sum_positive(&bdi->bdi_stat[item]); 166b2e8fb6eSPeter Zijlstra } 167b2e8fb6eSPeter Zijlstra 168b2e8fb6eSPeter Zijlstra static inline s64 bdi_stat_sum(struct backing_dev_info *bdi, 169b2e8fb6eSPeter Zijlstra enum bdi_stat_item item) 170b2e8fb6eSPeter Zijlstra { 171b2e8fb6eSPeter Zijlstra s64 sum; 172b2e8fb6eSPeter Zijlstra unsigned long flags; 173b2e8fb6eSPeter Zijlstra 174b2e8fb6eSPeter Zijlstra local_irq_save(flags); 175b2e8fb6eSPeter Zijlstra sum = __bdi_stat_sum(bdi, item); 176b2e8fb6eSPeter Zijlstra local_irq_restore(flags); 177b2e8fb6eSPeter Zijlstra 178b2e8fb6eSPeter Zijlstra return sum; 179b2e8fb6eSPeter Zijlstra } 180b2e8fb6eSPeter Zijlstra 181dd5656e5SMiklos Szeredi extern void bdi_writeout_inc(struct backing_dev_info *bdi); 182dd5656e5SMiklos Szeredi 183b2e8fb6eSPeter Zijlstra /* 184b2e8fb6eSPeter Zijlstra * maximal error of a stat counter. 185b2e8fb6eSPeter Zijlstra */ 186b2e8fb6eSPeter Zijlstra static inline unsigned long bdi_stat_error(struct backing_dev_info *bdi) 187b2e8fb6eSPeter Zijlstra { 188b2e8fb6eSPeter Zijlstra #ifdef CONFIG_SMP 189b2e8fb6eSPeter Zijlstra return nr_cpu_ids * BDI_STAT_BATCH; 190b2e8fb6eSPeter Zijlstra #else 191b2e8fb6eSPeter Zijlstra return 1; 192b2e8fb6eSPeter Zijlstra #endif 193e0bf68ddSPeter Zijlstra } 1941da177e4SLinus Torvalds 195189d3c4aSPeter Zijlstra int bdi_set_min_ratio(struct backing_dev_info *bdi, unsigned int min_ratio); 196a42dde04SPeter Zijlstra int bdi_set_max_ratio(struct backing_dev_info *bdi, unsigned int max_ratio); 197189d3c4aSPeter Zijlstra 1981da177e4SLinus Torvalds /* 1991da177e4SLinus Torvalds * Flags in backing_dev_info::capability 200e4ad08feSMiklos Szeredi * 201e4ad08feSMiklos Szeredi * The first three flags control whether dirty pages will contribute to the 2021da177e4SLinus Torvalds * VM's accounting and whether writepages() should be called for dirty pages 2031da177e4SLinus Torvalds * (something that would not, for example, be appropriate for ramfs) 204e4ad08feSMiklos Szeredi * 205e4ad08feSMiklos Szeredi * WARNING: these flags are closely related and should not normally be 206e4ad08feSMiklos Szeredi * used separately. The BDI_CAP_NO_ACCT_AND_WRITEBACK combines these 207e4ad08feSMiklos Szeredi * three flags into a single convenience macro. 208e4ad08feSMiklos Szeredi * 209e4ad08feSMiklos Szeredi * BDI_CAP_NO_ACCT_DIRTY: Dirty pages shouldn't contribute to accounting 210e4ad08feSMiklos Szeredi * BDI_CAP_NO_WRITEBACK: Don't write pages back 211e4ad08feSMiklos Szeredi * BDI_CAP_NO_ACCT_WB: Don't automatically account writeback pages 212e4ad08feSMiklos Szeredi * 213e4ad08feSMiklos Szeredi * These flags let !MMU mmap() govern direct device mapping vs immediate 214e4ad08feSMiklos Szeredi * copying more easily for MAP_PRIVATE, especially for ROM filesystems. 215e4ad08feSMiklos Szeredi * 216e4ad08feSMiklos Szeredi * BDI_CAP_MAP_COPY: Copy can be mapped (MAP_PRIVATE) 217e4ad08feSMiklos Szeredi * BDI_CAP_MAP_DIRECT: Can be mapped directly (MAP_SHARED) 218e4ad08feSMiklos Szeredi * BDI_CAP_READ_MAP: Can be mapped for reading 219e4ad08feSMiklos Szeredi * BDI_CAP_WRITE_MAP: Can be mapped for writing 220e4ad08feSMiklos Szeredi * BDI_CAP_EXEC_MAP: Can be mapped for execution 2214f98a2feSRik van Riel * 2224f98a2feSRik van Riel * BDI_CAP_SWAP_BACKED: Count shmem/tmpfs objects as swap-backed. 2231da177e4SLinus Torvalds */ 224e4ad08feSMiklos Szeredi #define BDI_CAP_NO_ACCT_DIRTY 0x00000001 225e4ad08feSMiklos Szeredi #define BDI_CAP_NO_WRITEBACK 0x00000002 226e4ad08feSMiklos Szeredi #define BDI_CAP_MAP_COPY 0x00000004 227e4ad08feSMiklos Szeredi #define BDI_CAP_MAP_DIRECT 0x00000008 228e4ad08feSMiklos Szeredi #define BDI_CAP_READ_MAP 0x00000010 229e4ad08feSMiklos Szeredi #define BDI_CAP_WRITE_MAP 0x00000020 230e4ad08feSMiklos Szeredi #define BDI_CAP_EXEC_MAP 0x00000040 231e4ad08feSMiklos Szeredi #define BDI_CAP_NO_ACCT_WB 0x00000080 2324f98a2feSRik van Riel #define BDI_CAP_SWAP_BACKED 0x00000100 233e4ad08feSMiklos Szeredi 2341da177e4SLinus Torvalds #define BDI_CAP_VMFLAGS \ 2351da177e4SLinus Torvalds (BDI_CAP_READ_MAP | BDI_CAP_WRITE_MAP | BDI_CAP_EXEC_MAP) 2361da177e4SLinus Torvalds 237e4ad08feSMiklos Szeredi #define BDI_CAP_NO_ACCT_AND_WRITEBACK \ 238e4ad08feSMiklos Szeredi (BDI_CAP_NO_WRITEBACK | BDI_CAP_NO_ACCT_DIRTY | BDI_CAP_NO_ACCT_WB) 239e4ad08feSMiklos Szeredi 2401da177e4SLinus Torvalds #if defined(VM_MAYREAD) && \ 2411da177e4SLinus Torvalds (BDI_CAP_READ_MAP != VM_MAYREAD || \ 2421da177e4SLinus Torvalds BDI_CAP_WRITE_MAP != VM_MAYWRITE || \ 2431da177e4SLinus Torvalds BDI_CAP_EXEC_MAP != VM_MAYEXEC) 2441da177e4SLinus Torvalds #error please change backing_dev_info::capabilities flags 2451da177e4SLinus Torvalds #endif 2461da177e4SLinus Torvalds 2471da177e4SLinus Torvalds extern struct backing_dev_info default_backing_dev_info; 2481da177e4SLinus Torvalds void default_unplug_io_fn(struct backing_dev_info *bdi, struct page *page); 2491da177e4SLinus Torvalds 2501da177e4SLinus Torvalds int writeback_in_progress(struct backing_dev_info *bdi); 2511da177e4SLinus Torvalds 2521da177e4SLinus Torvalds static inline int bdi_congested(struct backing_dev_info *bdi, int bdi_bits) 2531da177e4SLinus Torvalds { 2541da177e4SLinus Torvalds if (bdi->congested_fn) 2551da177e4SLinus Torvalds return bdi->congested_fn(bdi->congested_data, bdi_bits); 2561da177e4SLinus Torvalds return (bdi->state & bdi_bits); 2571da177e4SLinus Torvalds } 2581da177e4SLinus Torvalds 2591da177e4SLinus Torvalds static inline int bdi_read_congested(struct backing_dev_info *bdi) 2601da177e4SLinus Torvalds { 2611faa16d2SJens Axboe return bdi_congested(bdi, 1 << BDI_sync_congested); 2621da177e4SLinus Torvalds } 2631da177e4SLinus Torvalds 2641da177e4SLinus Torvalds static inline int bdi_write_congested(struct backing_dev_info *bdi) 2651da177e4SLinus Torvalds { 2661faa16d2SJens Axboe return bdi_congested(bdi, 1 << BDI_async_congested); 2671da177e4SLinus Torvalds } 2681da177e4SLinus Torvalds 2691da177e4SLinus Torvalds static inline int bdi_rw_congested(struct backing_dev_info *bdi) 2701da177e4SLinus Torvalds { 2711faa16d2SJens Axboe return bdi_congested(bdi, (1 << BDI_sync_congested) | 2721faa16d2SJens Axboe (1 << BDI_async_congested)); 2731da177e4SLinus Torvalds } 2741da177e4SLinus Torvalds 275373c0a7eSTrond Myklebust enum { 276373c0a7eSTrond Myklebust BLK_RW_ASYNC = 0, 277373c0a7eSTrond Myklebust BLK_RW_SYNC = 1, 278373c0a7eSTrond Myklebust }; 279373c0a7eSTrond Myklebust 2808aa7e847SJens Axboe void clear_bdi_congested(struct backing_dev_info *bdi, int sync); 2818aa7e847SJens Axboe void set_bdi_congested(struct backing_dev_info *bdi, int sync); 2828aa7e847SJens Axboe long congestion_wait(int sync, long timeout); 2833fcfab16SAndrew Morton 2841da177e4SLinus Torvalds 285e4ad08feSMiklos Szeredi static inline bool bdi_cap_writeback_dirty(struct backing_dev_info *bdi) 286e4ad08feSMiklos Szeredi { 287e4ad08feSMiklos Szeredi return !(bdi->capabilities & BDI_CAP_NO_WRITEBACK); 288e4ad08feSMiklos Szeredi } 2891da177e4SLinus Torvalds 290e4ad08feSMiklos Szeredi static inline bool bdi_cap_account_dirty(struct backing_dev_info *bdi) 291e4ad08feSMiklos Szeredi { 292e4ad08feSMiklos Szeredi return !(bdi->capabilities & BDI_CAP_NO_ACCT_DIRTY); 293e4ad08feSMiklos Szeredi } 2941da177e4SLinus Torvalds 295e4ad08feSMiklos Szeredi static inline bool bdi_cap_account_writeback(struct backing_dev_info *bdi) 296e4ad08feSMiklos Szeredi { 297e4ad08feSMiklos Szeredi /* Paranoia: BDI_CAP_NO_WRITEBACK implies BDI_CAP_NO_ACCT_WB */ 298e4ad08feSMiklos Szeredi return !(bdi->capabilities & (BDI_CAP_NO_ACCT_WB | 299e4ad08feSMiklos Szeredi BDI_CAP_NO_WRITEBACK)); 300e4ad08feSMiklos Szeredi } 3011da177e4SLinus Torvalds 3024f98a2feSRik van Riel static inline bool bdi_cap_swap_backed(struct backing_dev_info *bdi) 3034f98a2feSRik van Riel { 3044f98a2feSRik van Riel return bdi->capabilities & BDI_CAP_SWAP_BACKED; 3054f98a2feSRik van Riel } 3064f98a2feSRik van Riel 30703ba3782SJens Axboe static inline bool bdi_cap_flush_forker(struct backing_dev_info *bdi) 30803ba3782SJens Axboe { 30903ba3782SJens Axboe return bdi == &default_backing_dev_info; 31003ba3782SJens Axboe } 31103ba3782SJens Axboe 312e4ad08feSMiklos Szeredi static inline bool mapping_cap_writeback_dirty(struct address_space *mapping) 313e4ad08feSMiklos Szeredi { 314e4ad08feSMiklos Szeredi return bdi_cap_writeback_dirty(mapping->backing_dev_info); 315e4ad08feSMiklos Szeredi } 316e4ad08feSMiklos Szeredi 317e4ad08feSMiklos Szeredi static inline bool mapping_cap_account_dirty(struct address_space *mapping) 318e4ad08feSMiklos Szeredi { 319e4ad08feSMiklos Szeredi return bdi_cap_account_dirty(mapping->backing_dev_info); 320e4ad08feSMiklos Szeredi } 3211da177e4SLinus Torvalds 3224f98a2feSRik van Riel static inline bool mapping_cap_swap_backed(struct address_space *mapping) 3234f98a2feSRik van Riel { 3244f98a2feSRik van Riel return bdi_cap_swap_backed(mapping->backing_dev_info); 3254f98a2feSRik van Riel } 3264f98a2feSRik van Riel 32703ba3782SJens Axboe static inline int bdi_sched_wait(void *word) 32803ba3782SJens Axboe { 32903ba3782SJens Axboe schedule(); 33003ba3782SJens Axboe return 0; 33103ba3782SJens Axboe } 33203ba3782SJens Axboe 3331da177e4SLinus Torvalds #endif /* _LINUX_BACKING_DEV_H */ 334