/* Repository-viewer banner (not part of the header): at 4ff9083b8a9a80bdf4ebbbec22cda4cbfb60f7aa, 311 lines, 7.6 kB, view raw */
1/* 2 * NUMA memory policies for Linux. 3 * Copyright 2003,2004 Andi Kleen SuSE Labs 4 */ 5#ifndef _LINUX_MEMPOLICY_H 6#define _LINUX_MEMPOLICY_H 1 7 8 9#include <linux/mmzone.h> 10#include <linux/dax.h> 11#include <linux/slab.h> 12#include <linux/rbtree.h> 13#include <linux/spinlock.h> 14#include <linux/nodemask.h> 15#include <linux/pagemap.h> 16#include <uapi/linux/mempolicy.h> 17 18struct mm_struct; 19 20#ifdef CONFIG_NUMA 21 22/* 23 * Describe a memory policy. 24 * 25 * A mempolicy can be either associated with a process or with a VMA. 26 * For VMA related allocations the VMA policy is preferred, otherwise 27 * the process policy is used. Interrupts ignore the memory policy 28 * of the current process. 29 * 30 * Locking policy for interlave: 31 * In process context there is no locking because only the process accesses 32 * its own state. All vma manipulation is somewhat protected by a down_read on 33 * mmap_sem. 34 * 35 * Freeing policy: 36 * Mempolicy objects are reference counted. A mempolicy will be freed when 37 * mpol_put() decrements the reference count to zero. 38 * 39 * Duplicating policy objects: 40 * mpol_dup() allocates a new mempolicy and copies the specified mempolicy 41 * to the new storage. The reference count of the new object is initialized 42 * to 1, representing the caller of mpol_dup(). 43 */ 44struct mempolicy { 45 atomic_t refcnt; 46 unsigned short mode; /* See MPOL_* above */ 47 unsigned short flags; /* See set_mempolicy() MPOL_F_* above */ 48 union { 49 short preferred_node; /* preferred */ 50 nodemask_t nodes; /* interleave/bind */ 51 /* undefined for default */ 52 } v; 53 union { 54 nodemask_t cpuset_mems_allowed; /* relative to these nodes */ 55 nodemask_t user_nodemask; /* nodemask passed by user */ 56 } w; 57}; 58 59/* 60 * Support for managing mempolicy data objects (clone, copy, destroy) 61 * The default fast path of a NULL MPOL_DEFAULT policy is always inlined. 
62 */ 63 64extern void __mpol_put(struct mempolicy *pol); 65static inline void mpol_put(struct mempolicy *pol) 66{ 67 if (pol) 68 __mpol_put(pol); 69} 70 71/* 72 * Does mempolicy pol need explicit unref after use? 73 * Currently only needed for shared policies. 74 */ 75static inline int mpol_needs_cond_ref(struct mempolicy *pol) 76{ 77 return (pol && (pol->flags & MPOL_F_SHARED)); 78} 79 80static inline void mpol_cond_put(struct mempolicy *pol) 81{ 82 if (mpol_needs_cond_ref(pol)) 83 __mpol_put(pol); 84} 85 86extern struct mempolicy *__mpol_dup(struct mempolicy *pol); 87static inline struct mempolicy *mpol_dup(struct mempolicy *pol) 88{ 89 if (pol) 90 pol = __mpol_dup(pol); 91 return pol; 92} 93 94#define vma_policy(vma) ((vma)->vm_policy) 95 96static inline void mpol_get(struct mempolicy *pol) 97{ 98 if (pol) 99 atomic_inc(&pol->refcnt); 100} 101 102extern bool __mpol_equal(struct mempolicy *a, struct mempolicy *b); 103static inline bool mpol_equal(struct mempolicy *a, struct mempolicy *b) 104{ 105 if (a == b) 106 return true; 107 return __mpol_equal(a, b); 108} 109 110/* 111 * Tree of shared policies for a shared memory region. 112 * Maintain the policies in a pseudo mm that contains vmas. The vmas 113 * carry the policy. As a special twist the pseudo mm is indexed in pages, not 114 * bytes, so that we can work with shared memory segments bigger than 115 * unsigned long. 
116 */ 117 118struct sp_node { 119 struct rb_node nd; 120 unsigned long start, end; 121 struct mempolicy *policy; 122}; 123 124struct shared_policy { 125 struct rb_root root; 126 rwlock_t lock; 127}; 128 129int vma_dup_policy(struct vm_area_struct *src, struct vm_area_struct *dst); 130void mpol_shared_policy_init(struct shared_policy *sp, struct mempolicy *mpol); 131int mpol_set_shared_policy(struct shared_policy *info, 132 struct vm_area_struct *vma, 133 struct mempolicy *new); 134void mpol_free_shared_policy(struct shared_policy *p); 135struct mempolicy *mpol_shared_policy_lookup(struct shared_policy *sp, 136 unsigned long idx); 137 138struct mempolicy *get_task_policy(struct task_struct *p); 139struct mempolicy *__get_vma_policy(struct vm_area_struct *vma, 140 unsigned long addr); 141bool vma_policy_mof(struct vm_area_struct *vma); 142 143extern void numa_default_policy(void); 144extern void numa_policy_init(void); 145extern void mpol_rebind_task(struct task_struct *tsk, const nodemask_t *new); 146extern void mpol_rebind_mm(struct mm_struct *mm, nodemask_t *new); 147 148extern int huge_node(struct vm_area_struct *vma, 149 unsigned long addr, gfp_t gfp_flags, 150 struct mempolicy **mpol, nodemask_t **nodemask); 151extern bool init_nodemask_of_mempolicy(nodemask_t *mask); 152extern bool mempolicy_nodemask_intersects(struct task_struct *tsk, 153 const nodemask_t *mask); 154extern unsigned int mempolicy_slab_node(void); 155 156extern enum zone_type policy_zone; 157 158static inline void check_highest_zone(enum zone_type k) 159{ 160 if (k > policy_zone && k != ZONE_MOVABLE) 161 policy_zone = k; 162} 163 164int do_migrate_pages(struct mm_struct *mm, const nodemask_t *from, 165 const nodemask_t *to, int flags); 166 167 168#ifdef CONFIG_TMPFS 169extern int mpol_parse_str(char *str, struct mempolicy **mpol); 170#endif 171 172extern void mpol_to_str(char *buffer, int maxlen, struct mempolicy *pol); 173 174/* Check if a vma is migratable */ 175static inline bool 
vma_migratable(struct vm_area_struct *vma) 176{ 177 if (vma->vm_flags & (VM_IO | VM_PFNMAP)) 178 return false; 179 180 /* 181 * DAX device mappings require predictable access latency, so avoid 182 * incurring periodic faults. 183 */ 184 if (vma_is_dax(vma)) 185 return false; 186 187#ifndef CONFIG_ARCH_ENABLE_HUGEPAGE_MIGRATION 188 if (vma->vm_flags & VM_HUGETLB) 189 return false; 190#endif 191 192 /* 193 * Migration allocates pages in the highest zone. If we cannot 194 * do so then migration (at least from node to node) is not 195 * possible. 196 */ 197 if (vma->vm_file && 198 gfp_zone(mapping_gfp_mask(vma->vm_file->f_mapping)) 199 < policy_zone) 200 return false; 201 return true; 202} 203 204extern int mpol_misplaced(struct page *, struct vm_area_struct *, unsigned long); 205extern void mpol_put_task_policy(struct task_struct *); 206 207#else 208 209struct mempolicy {}; 210 211static inline bool mpol_equal(struct mempolicy *a, struct mempolicy *b) 212{ 213 return true; 214} 215 216static inline void mpol_put(struct mempolicy *p) 217{ 218} 219 220static inline void mpol_cond_put(struct mempolicy *pol) 221{ 222} 223 224static inline void mpol_get(struct mempolicy *pol) 225{ 226} 227 228struct shared_policy {}; 229 230static inline void mpol_shared_policy_init(struct shared_policy *sp, 231 struct mempolicy *mpol) 232{ 233} 234 235static inline void mpol_free_shared_policy(struct shared_policy *p) 236{ 237} 238 239static inline struct mempolicy * 240mpol_shared_policy_lookup(struct shared_policy *sp, unsigned long idx) 241{ 242 return NULL; 243} 244 245#define vma_policy(vma) NULL 246 247static inline int 248vma_dup_policy(struct vm_area_struct *src, struct vm_area_struct *dst) 249{ 250 return 0; 251} 252 253static inline void numa_policy_init(void) 254{ 255} 256 257static inline void numa_default_policy(void) 258{ 259} 260 261static inline void mpol_rebind_task(struct task_struct *tsk, 262 const nodemask_t *new) 263{ 264} 265 266static inline void 
mpol_rebind_mm(struct mm_struct *mm, nodemask_t *new) 267{ 268} 269 270static inline int huge_node(struct vm_area_struct *vma, 271 unsigned long addr, gfp_t gfp_flags, 272 struct mempolicy **mpol, nodemask_t **nodemask) 273{ 274 *mpol = NULL; 275 *nodemask = NULL; 276 return 0; 277} 278 279static inline bool init_nodemask_of_mempolicy(nodemask_t *m) 280{ 281 return false; 282} 283 284static inline int do_migrate_pages(struct mm_struct *mm, const nodemask_t *from, 285 const nodemask_t *to, int flags) 286{ 287 return 0; 288} 289 290static inline void check_highest_zone(int k) 291{ 292} 293 294#ifdef CONFIG_TMPFS 295static inline int mpol_parse_str(char *str, struct mempolicy **mpol) 296{ 297 return 1; /* error */ 298} 299#endif 300 301static inline int mpol_misplaced(struct page *page, struct vm_area_struct *vma, 302 unsigned long address) 303{ 304 return -1; /* no node preference */ 305} 306 307static inline void mpol_put_task_policy(struct task_struct *task) 308{ 309} 310#endif /* CONFIG_NUMA */ 311#endif