1 /* 2 * NUMA memory policies for Linux. 3 * Copyright 2003,2004 Andi Kleen SuSE Labs 4 */ 5 #ifndef _LINUX_MEMPOLICY_H 6 #define _LINUX_MEMPOLICY_H 1 7 8 9 #include <linux/mmzone.h> 10 #include <linux/dax.h> 11 #include <linux/slab.h> 12 #include <linux/rbtree.h> 13 #include <linux/spinlock.h> 14 #include <linux/nodemask.h> 15 #include <linux/pagemap.h> 16 #include <uapi/linux/mempolicy.h> 17 18 struct mm_struct; 19 20 #ifdef CONFIG_NUMA 21 22 /* 23 * Describe a memory policy. 24 * 25 * A mempolicy can be either associated with a process or with a VMA. 26 * For VMA related allocations the VMA policy is preferred, otherwise 27 * the process policy is used. Interrupts ignore the memory policy 28 * of the current process. 29 * 30 * Locking policy for interlave: 31 * In process context there is no locking because only the process accesses 32 * its own state. All vma manipulation is somewhat protected by a down_read on 33 * mmap_sem. 34 * 35 * Freeing policy: 36 * Mempolicy objects are reference counted. A mempolicy will be freed when 37 * mpol_put() decrements the reference count to zero. 38 * 39 * Duplicating policy objects: 40 * mpol_dup() allocates a new mempolicy and copies the specified mempolicy 41 * to the new storage. The reference count of the new object is initialized 42 * to 1, representing the caller of mpol_dup(). 43 */ 44 struct mempolicy { 45 atomic_t refcnt; 46 unsigned short mode; /* See MPOL_* above */ 47 unsigned short flags; /* See set_mempolicy() MPOL_F_* above */ 48 union { 49 short preferred_node; /* preferred */ 50 nodemask_t nodes; /* interleave/bind */ 51 /* undefined for default */ 52 } v; 53 union { 54 nodemask_t cpuset_mems_allowed; /* relative to these nodes */ 55 nodemask_t user_nodemask; /* nodemask passed by user */ 56 } w; 57 }; 58 59 /* 60 * Support for managing mempolicy data objects (clone, copy, destroy) 61 * The default fast path of a NULL MPOL_DEFAULT policy is always inlined. 62 */ 63 64 extern void __mpol_put(struct mempolicy *pol); 65 static inline void mpol_put(struct mempolicy *pol) 66 { 67 if (pol) 68 __mpol_put(pol); 69 } 70 71 /* 72 * Does mempolicy pol need explicit unref after use? 73 * Currently only needed for shared policies. 74 */ 75 static inline int mpol_needs_cond_ref(struct mempolicy *pol) 76 { 77 return (pol && (pol->flags & MPOL_F_SHARED)); 78 } 79 80 static inline void mpol_cond_put(struct mempolicy *pol) 81 { 82 if (mpol_needs_cond_ref(pol)) 83 __mpol_put(pol); 84 } 85 86 extern struct mempolicy *__mpol_dup(struct mempolicy *pol); 87 static inline struct mempolicy *mpol_dup(struct mempolicy *pol) 88 { 89 if (pol) 90 pol = __mpol_dup(pol); 91 return pol; 92 } 93 94 #define vma_policy(vma) ((vma)->vm_policy) 95 96 static inline void mpol_get(struct mempolicy *pol) 97 { 98 if (pol) 99 atomic_inc(&pol->refcnt); 100 } 101 102 extern bool __mpol_equal(struct mempolicy *a, struct mempolicy *b); 103 static inline bool mpol_equal(struct mempolicy *a, struct mempolicy *b) 104 { 105 if (a == b) 106 return true; 107 return __mpol_equal(a, b); 108 } 109 110 /* 111 * Tree of shared policies for a shared memory region. 112 * Maintain the policies in a pseudo mm that contains vmas. The vmas 113 * carry the policy. As a special twist the pseudo mm is indexed in pages, not 114 * bytes, so that we can work with shared memory segments bigger than 115 * unsigned long. 116 */ 117 118 struct sp_node { 119 struct rb_node nd; 120 unsigned long start, end; 121 struct mempolicy *policy; 122 }; 123 124 struct shared_policy { 125 struct rb_root root; 126 rwlock_t lock; 127 }; 128 129 int vma_dup_policy(struct vm_area_struct *src, struct vm_area_struct *dst); 130 void mpol_shared_policy_init(struct shared_policy *sp, struct mempolicy *mpol); 131 int mpol_set_shared_policy(struct shared_policy *info, 132 struct vm_area_struct *vma, 133 struct mempolicy *new); 134 void mpol_free_shared_policy(struct shared_policy *p); 135 struct mempolicy *mpol_shared_policy_lookup(struct shared_policy *sp, 136 unsigned long idx); 137 138 struct mempolicy *get_task_policy(struct task_struct *p); 139 struct mempolicy *__get_vma_policy(struct vm_area_struct *vma, 140 unsigned long addr); 141 bool vma_policy_mof(struct vm_area_struct *vma); 142 143 extern void numa_default_policy(void); 144 extern void numa_policy_init(void); 145 extern void mpol_rebind_task(struct task_struct *tsk, const nodemask_t *new); 146 extern void mpol_rebind_mm(struct mm_struct *mm, nodemask_t *new); 147 148 extern int huge_node(struct vm_area_struct *vma, 149 unsigned long addr, gfp_t gfp_flags, 150 struct mempolicy **mpol, nodemask_t **nodemask); 151 extern bool init_nodemask_of_mempolicy(nodemask_t *mask); 152 extern bool mempolicy_nodemask_intersects(struct task_struct *tsk, 153 const nodemask_t *mask); 154 extern unsigned int mempolicy_slab_node(void); 155 156 extern enum zone_type policy_zone; 157 158 static inline void check_highest_zone(enum zone_type k) 159 { 160 if (k > policy_zone && k != ZONE_MOVABLE) 161 policy_zone = k; 162 } 163 164 int do_migrate_pages(struct mm_struct *mm, const nodemask_t *from, 165 const nodemask_t *to, int flags); 166 167 168 #ifdef CONFIG_TMPFS 169 extern int mpol_parse_str(char *str, struct mempolicy **mpol); 170 #endif 171 172 extern void mpol_to_str(char *buffer, int maxlen, struct mempolicy *pol); 173 174 /* Check if a vma is migratable */ 175 static inline bool vma_migratable(struct vm_area_struct *vma) 176 { 177 if (vma->vm_flags & (VM_IO | VM_PFNMAP)) 178 return false; 179 180 /* 181 * DAX device mappings require predictable access latency, so avoid 182 * incurring periodic faults. 183 */ 184 if (vma_is_dax(vma)) 185 return false; 186 187 #ifndef CONFIG_ARCH_ENABLE_HUGEPAGE_MIGRATION 188 if (vma->vm_flags & VM_HUGETLB) 189 return false; 190 #endif 191 192 /* 193 * Migration allocates pages in the highest zone. If we cannot 194 * do so then migration (at least from node to node) is not 195 * possible. 196 */ 197 if (vma->vm_file && 198 gfp_zone(mapping_gfp_mask(vma->vm_file->f_mapping)) 199 < policy_zone) 200 return false; 201 return true; 202 } 203 204 extern int mpol_misplaced(struct page *, struct vm_area_struct *, unsigned long); 205 extern void mpol_put_task_policy(struct task_struct *); 206 207 #else 208 209 struct mempolicy {}; 210 211 static inline bool mpol_equal(struct mempolicy *a, struct mempolicy *b) 212 { 213 return true; 214 } 215 216 static inline void mpol_put(struct mempolicy *p) 217 { 218 } 219 220 static inline void mpol_cond_put(struct mempolicy *pol) 221 { 222 } 223 224 static inline void mpol_get(struct mempolicy *pol) 225 { 226 } 227 228 struct shared_policy {}; 229 230 static inline void mpol_shared_policy_init(struct shared_policy *sp, 231 struct mempolicy *mpol) 232 { 233 } 234 235 static inline void mpol_free_shared_policy(struct shared_policy *p) 236 { 237 } 238 239 static inline struct mempolicy * 240 mpol_shared_policy_lookup(struct shared_policy *sp, unsigned long idx) 241 { 242 return NULL; 243 } 244 245 #define vma_policy(vma) NULL 246 247 static inline int 248 vma_dup_policy(struct vm_area_struct *src, struct vm_area_struct *dst) 249 { 250 return 0; 251 } 252 253 static inline void numa_policy_init(void) 254 { 255 } 256 257 static inline void numa_default_policy(void) 258 { 259 } 260 261 static inline void mpol_rebind_task(struct task_struct *tsk, 262 const nodemask_t *new) 263 { 264 } 265 266 static inline void mpol_rebind_mm(struct mm_struct *mm, nodemask_t *new) 267 { 268 } 269 270 static inline int huge_node(struct vm_area_struct *vma, 271 unsigned long addr, gfp_t gfp_flags, 272 struct mempolicy **mpol, nodemask_t **nodemask) 273 { 274 *mpol = NULL; 275 *nodemask = NULL; 276 return 0; 277 } 278 279 static inline bool init_nodemask_of_mempolicy(nodemask_t *m) 280 { 281 return false; 282 } 283 284 static inline int do_migrate_pages(struct mm_struct *mm, const nodemask_t *from, 285 const nodemask_t *to, int flags) 286 { 287 return 0; 288 } 289 290 static inline void check_highest_zone(int k) 291 { 292 } 293 294 #ifdef CONFIG_TMPFS 295 static inline int mpol_parse_str(char *str, struct mempolicy **mpol) 296 { 297 return 1; /* error */ 298 } 299 #endif 300 301 static inline int mpol_misplaced(struct page *page, struct vm_area_struct *vma, 302 unsigned long address) 303 { 304 return -1; /* no node preference */ 305 } 306 307 static inline void mpol_put_task_policy(struct task_struct *task) 308 { 309 } 310 #endif /* CONFIG_NUMA */ 311 #endif 312