blob: c7ac77e873b3fa800e4c4d3a3db0bd43dcaf7192 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001#ifndef _LINUX_MEMPOLICY_H
2#define _LINUX_MEMPOLICY_H 1
3
4#include <linux/errno.h>
5
/*
 * NUMA memory policies for Linux.
 * Copyright 2003,2004 Andi Kleen SuSE Labs
 */
10
/*
 * Policies.
 * MPOL_MAX is an alias for the highest-numbered policy mode.
 */
#define MPOL_DEFAULT	0
#define MPOL_PREFERRED	1
#define MPOL_BIND	2
#define MPOL_INTERLEAVE	3

#define MPOL_MAX MPOL_INTERLEAVE
18
/* Flags for get_mempolicy */
#define MPOL_F_NODE	(1<<0)	/* return next IL node instead of node mask */
#define MPOL_F_ADDR	(1<<1)	/* look up vma using address */
22
/* Flags for mbind */
#define MPOL_MF_STRICT	(1<<0)	/* Verify existing pages in the mapping */
#define MPOL_MF_MOVE	(1<<1)	/* Move pages owned by this process to conform to mapping */
#define MPOL_MF_MOVE_ALL (1<<2)	/* Move every page to conform to mapping */
#define MPOL_MF_INTERNAL (1<<3)	/* Internal flags start here */
Linus Torvalds1da177e2005-04-16 15:20:36 -070028
29#ifdef __KERNEL__
30
31#include <linux/config.h>
32#include <linux/mmzone.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070033#include <linux/slab.h>
34#include <linux/rbtree.h>
35#include <linux/spinlock.h>
Andi Kleendfcd3c02005-10-29 18:15:48 -070036#include <linux/nodemask.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070037
/*
 * Forward declarations.  The prototypes in this header only pass pointers
 * to these structures, so their full definitions are not required here.
 * task_struct and mm_struct are declared at file scope so that they are not
 * first introduced inside a parameter list, where the type would only have
 * prototype scope.
 */
struct vm_area_struct;
struct task_struct;
struct mm_struct;
39
40#ifdef CONFIG_NUMA
41
42/*
43 * Describe a memory policy.
44 *
45 * A mempolicy can be either associated with a process or with a VMA.
46 * For VMA related allocations the VMA policy is preferred, otherwise
47 * the process policy is used. Interrupts ignore the memory policy
48 * of the current process.
49 *
50 * Locking policy for interlave:
51 * In process context there is no locking because only the process accesses
52 * its own state. All vma manipulation is somewhat protected by a down_read on
Hugh Dickinsb8072f02005-10-29 18:16:41 -070053 * mmap_sem.
Linus Torvalds1da177e2005-04-16 15:20:36 -070054 *
55 * Freeing policy:
56 * When policy is MPOL_BIND v.zonelist is kmalloc'ed and must be kfree'd.
57 * All other policies don't have any external state. mpol_free() handles this.
58 *
59 * Copying policy objects:
60 * For MPOL_BIND the zonelist must be always duplicated. mpol_clone() does this.
61 */
62struct mempolicy {
63 atomic_t refcnt;
64 short policy; /* See MPOL_* above */
65 union {
66 struct zonelist *zonelist; /* bind */
67 short preferred_node; /* preferred */
Andi Kleendfcd3c02005-10-29 18:15:48 -070068 nodemask_t nodes; /* interleave */
Linus Torvalds1da177e2005-04-16 15:20:36 -070069 /* undefined for default */
70 } v;
Paul Jackson74cb2152006-01-08 01:01:56 -080071 nodemask_t cpuset_mems_allowed; /* mempolicy relative to these nodes */
Linus Torvalds1da177e2005-04-16 15:20:36 -070072};
73
/*
 * Support for managing mempolicy data objects (clone, copy, destroy)
 * The default fast path of a NULL MPOL_DEFAULT policy is always inlined.
 */
78
extern void __mpol_free(struct mempolicy *pol);

/*
 * Hand a policy to __mpol_free().  A NULL pointer is filtered out inline,
 * so no out-of-line call is made for it.
 */
static inline void mpol_free(struct mempolicy *pol)
{
	if (!pol)
		return;
	__mpol_free(pol);
}
85
extern struct mempolicy *__mpol_copy(struct mempolicy *pol);

/*
 * Return the result of __mpol_copy() for a non-NULL policy.  A NULL policy
 * is returned as-is without calling out of line.
 */
static inline struct mempolicy *mpol_copy(struct mempolicy *pol)
{
	if (!pol)
		return pol;
	return __mpol_copy(pol);
}
93
/* Read and write the policy pointer kept in a vma's vm_policy field. */
#define vma_policy(vma) ((vma)->vm_policy)
#define vma_set_policy(vma, pol) ((vma)->vm_policy = (pol))
96
97static inline void mpol_get(struct mempolicy *pol)
98{
99 if (pol)
100 atomic_inc(&pol->refcnt);
101}
102
extern int __mpol_equal(struct mempolicy *a, struct mempolicy *b);

/*
 * Compare two policies.  Identical pointers (which includes two NULLs)
 * are reported equal inline; every other pair is decided by __mpol_equal().
 */
static inline int mpol_equal(struct mempolicy *a, struct mempolicy *b)
{
	return (a == b) ? 1 : __mpol_equal(a, b);
}
/* Compare the policies attached to two vmas. */
#define vma_mpol_equal(a,b) mpol_equal(vma_policy(a), vma_policy(b))
111
/* Could later add inheritance of the process policy here. */

/* Clear the vma's policy pointer. */
#define mpol_set_vma_default(vma) ((vma)->vm_policy = NULL)
115
/*
 * Tree of shared policies for a shared memory region.
 * Maintain the policies in a pseudo mm that contains vmas. The vmas
 * carry the policy. As a special twist the pseudo mm is indexed in pages, not
 * bytes, so that we can work with shared memory segments bigger than
 * unsigned long.
 */
123
124struct sp_node {
125 struct rb_node nd;
126 unsigned long start, end;
127 struct mempolicy *policy;
128};
129
130struct shared_policy {
131 struct rb_root root;
132 spinlock_t lock;
133};
134
135static inline void mpol_shared_policy_init(struct shared_policy *info)
136{
137 info->root = RB_ROOT;
138 spin_lock_init(&info->lock);
139}
140
/* Shared policy tree operations; the definitions live outside this header. */
int mpol_set_shared_policy(struct shared_policy *info,
			   struct vm_area_struct *vma,
			   struct mempolicy *new);
void mpol_free_shared_policy(struct shared_policy *p);
struct mempolicy *mpol_shared_policy_lookup(struct shared_policy *sp,
					    unsigned long idx);
147
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148extern void numa_default_policy(void);
149extern void numa_policy_init(void);
Paul Jackson74cb2152006-01-08 01:01:56 -0800150extern void mpol_rebind_policy(struct mempolicy *pol, const nodemask_t *new);
151extern void mpol_rebind_task(struct task_struct *tsk,
152 const nodemask_t *new);
Paul Jackson42253992006-01-08 01:01:59 -0800153extern void mpol_rebind_mm(struct mm_struct *mm, nodemask_t *new);
154#define set_cpuset_being_rebound(x) (cpuset_being_rebound = (x))
155
/*
 * Non-zero when cpuset_being_rebound is the current task's cpuset.
 *
 * The Kconfig symbol for cpuset support is CONFIG_CPUSETS (plural).
 * Testing the misspelt CONFIG_CPUSET never matches, which would make this
 * macro expand to 0 even on cpuset-enabled kernels.
 */
#ifdef CONFIG_CPUSETS
#define current_cpuset_is_being_rebound() \
				(cpuset_being_rebound == current->cpuset)
#else
#define current_cpuset_is_being_rebound() 0
#endif
162
extern struct mempolicy default_policy;
extern struct zonelist *huge_zonelist(struct vm_area_struct *vma,
		unsigned long addr);

extern int policy_zone;
168
169static inline void check_highest_zone(int k)
170{
171 if (k > policy_zone)
172 policy_zone = k;
173}
174
Christoph Lameter39743882006-01-08 01:00:51 -0800175int do_migrate_pages(struct mm_struct *mm,
176 const nodemask_t *from_nodes, const nodemask_t *to_nodes, int flags);
177
Paul Jackson42253992006-01-08 01:01:59 -0800178extern void *cpuset_being_rebound; /* Trigger mpol_copy vma rebind */
179
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180#else
181
/* Empty placeholder type used when CONFIG_NUMA is not set. */
struct mempolicy {};
183
/* Stub: every pair of policies is reported equal; both arguments are ignored. */
static inline int mpol_equal(struct mempolicy *a, struct mempolicy *b)
{
	return 1;
}
#define vma_mpol_equal(a,b) 1
189
/* Stub: expands to an empty statement; @vma is not evaluated. */
#define mpol_set_vma_default(vma) do {} while(0)
191
/* Stub: does nothing. */
static inline void mpol_free(struct mempolicy *p)
{
}
195
/* Stub: does nothing. */
static inline void mpol_get(struct mempolicy *pol)
{
}
199
/* Stub: always returns NULL, whatever @old is. */
static inline struct mempolicy *mpol_copy(struct mempolicy *old)
{
	return NULL;
}
204
/* Empty placeholder type used when CONFIG_NUMA is not set. */
struct shared_policy {};
206
/* Stub: always fails with -EINVAL; no argument is examined. */
static inline int mpol_set_shared_policy(struct shared_policy *info,
					 struct vm_area_struct *vma,
					 struct mempolicy *new)
{
	return -EINVAL;
}
213
/* Stub: does nothing. */
static inline void mpol_shared_policy_init(struct shared_policy *info)
{
}
217
/* Stub: does nothing. */
static inline void mpol_free_shared_policy(struct shared_policy *p)
{
}
221
/* Stub: always returns NULL; @sp and @idx are ignored. */
static inline struct mempolicy *
mpol_shared_policy_lookup(struct shared_policy *sp, unsigned long idx)
{
	return NULL;
}
227
/* Stubs: the policy of any vma reads as NULL and setting it is a no-op. */
#define vma_policy(vma) NULL
#define vma_set_policy(vma, pol) do {} while(0)
230
/* Stub: does nothing. */
static inline void numa_policy_init(void)
{
}
234
/* Stub: does nothing. */
static inline void numa_default_policy(void)
{
}
238
Paul Jackson74cb2152006-01-08 01:01:56 -0800239static inline void mpol_rebind_policy(struct mempolicy *pol,
240 const nodemask_t *new)
241{
242}
243
244static inline void mpol_rebind_task(struct task_struct *tsk,
Paul Jackson68860ec2005-10-30 15:02:36 -0800245 const nodemask_t *new)
246{
247}
248
Paul Jackson42253992006-01-08 01:01:59 -0800249static inline void mpol_rebind_mm(struct mm_struct *mm, nodemask_t *new)
250{
251}
252
/* Stub: expands to an empty statement; @x is not evaluated. */
#define set_cpuset_being_rebound(x) do {} while (0)
254
Christoph Lameter5da7ca82006-01-06 00:10:46 -0800255static inline struct zonelist *huge_zonelist(struct vm_area_struct *vma,
256 unsigned long addr)
257{
258 return NODE_DATA(0)->node_zonelists + gfp_zone(GFP_HIGHUSER);
259}
260
Paul Jackson45b07ef2006-01-08 01:00:56 -0800261static inline int do_migrate_pages(struct mm_struct *mm,
262 const nodemask_t *from_nodes,
263 const nodemask_t *to_nodes, int flags)
264{
265 return 0;
266}
267
/* Stub: does nothing; @k is ignored. */
static inline void check_highest_zone(int k)
{
}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271#endif /* CONFIG_NUMA */
272#endif /* __KERNEL__ */
273
274#endif