blob: 74357cb9bc7ca0caeec26bbf6196be7a767d1abf [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001#ifndef _LINUX_MEMPOLICY_H
2#define _LINUX_MEMPOLICY_H 1
3
4#include <linux/errno.h>
5
6/*
7 * NUMA memory policies for Linux.
8 * Copyright 2003,2004 Andi Kleen SuSE Labs
9 */
10
/* Memory policy values */
#define MPOL_DEFAULT	0
#define MPOL_PREFERRED	1
#define MPOL_BIND	2
#define MPOL_INTERLEAVE	3

/* Alias for the largest policy value defined above. */
#define MPOL_MAX	MPOL_INTERLEAVE
18
/* Flag bits for get_mem_policy */
#define MPOL_F_NODE	(1 << 0)	/* return next IL mode instead of node mask */
#define MPOL_F_ADDR	(1 << 1)	/* look up vma using address */
22
/* Flag bits for mbind */
#define MPOL_MF_STRICT		(1 << 0)	/* Verify existing pages in the mapping */
#define MPOL_MF_MOVE		(1 << 1)	/* Move pages owned by this process to conform to mapping */
#define MPOL_MF_MOVE_ALL	(1 << 2)	/* Move every page to conform to mapping */
#define MPOL_MF_INTERNAL	(1 << 3)	/* Internal flags start here */
Linus Torvalds1da177e2005-04-16 15:20:36 -070028
29#ifdef __KERNEL__
30
31#include <linux/config.h>
32#include <linux/mmzone.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070033#include <linux/slab.h>
34#include <linux/rbtree.h>
35#include <linux/spinlock.h>
Andi Kleendfcd3c02005-10-29 18:15:48 -070036#include <linux/nodemask.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070037
/*
 * Forward declarations for structures this header refers to only through
 * pointers.  Without a prior declaration, a struct tag that first appears
 * inside a parameter list is scoped to that one prototype, so the
 * prototypes taking mm_struct and task_struct pointers would otherwise
 * depend on which headers happened to be included earlier.
 */
struct vm_area_struct;
struct mm_struct;
struct task_struct;
39
40#ifdef CONFIG_NUMA
41
42/*
43 * Describe a memory policy.
44 *
45 * A mempolicy can be either associated with a process or with a VMA.
46 * For VMA related allocations the VMA policy is preferred, otherwise
47 * the process policy is used. Interrupts ignore the memory policy
48 * of the current process.
49 *
50 * Locking policy for interlave:
51 * In process context there is no locking because only the process accesses
52 * its own state. All vma manipulation is somewhat protected by a down_read on
Hugh Dickinsb8072f02005-10-29 18:16:41 -070053 * mmap_sem.
Linus Torvalds1da177e2005-04-16 15:20:36 -070054 *
55 * Freeing policy:
56 * When policy is MPOL_BIND v.zonelist is kmalloc'ed and must be kfree'd.
57 * All other policies don't have any external state. mpol_free() handles this.
58 *
59 * Copying policy objects:
60 * For MPOL_BIND the zonelist must be always duplicated. mpol_clone() does this.
61 */
62struct mempolicy {
63 atomic_t refcnt;
64 short policy; /* See MPOL_* above */
65 union {
66 struct zonelist *zonelist; /* bind */
67 short preferred_node; /* preferred */
Andi Kleendfcd3c02005-10-29 18:15:48 -070068 nodemask_t nodes; /* interleave */
Linus Torvalds1da177e2005-04-16 15:20:36 -070069 /* undefined for default */
70 } v;
Paul Jackson74cb2152006-01-08 01:01:56 -080071 nodemask_t cpuset_mems_allowed; /* mempolicy relative to these nodes */
Linus Torvalds1da177e2005-04-16 15:20:36 -070072};
73
74/*
75 * Support for managing mempolicy data objects (clone, copy, destroy)
76 * The default fast path of a NULL MPOL_DEFAULT policy is always inlined.
77 */
78
/* Out-of-line part of mpol_free(); the inline wrapper never passes NULL. */
extern void __mpol_free(struct mempolicy *pol);

/*
 * Release a policy.  A NULL pointer is filtered out inline, so only a
 * non-NULL policy is handed to __mpol_free().
 */
static inline void mpol_free(struct mempolicy *pol)
{
	if (!pol)
		return;
	__mpol_free(pol);
}
85
/* Out-of-line part of mpol_copy(); the inline wrapper never passes NULL. */
extern struct mempolicy *__mpol_copy(struct mempolicy *pol);

/*
 * Copy a policy.  A NULL pointer is returned unchanged without calling out;
 * otherwise the result of __mpol_copy() is returned.
 */
static inline struct mempolicy *mpol_copy(struct mempolicy *pol)
{
	return pol ? __mpol_copy(pol) : pol;
}
93
/* Read and write the policy pointer held in a vma's vm_policy member. */
#define vma_policy(vma)			((vma)->vm_policy)
#define vma_set_policy(vma, pol)	((vma)->vm_policy = (pol))
96
97static inline void mpol_get(struct mempolicy *pol)
98{
99 if (pol)
100 atomic_inc(&pol->refcnt);
101}
102
/* Out-of-line comparison, used when the two pointers differ. */
extern int __mpol_equal(struct mempolicy *a, struct mempolicy *b);

/*
 * Compare two policies.  Identical pointers (including two NULLs) yield 1
 * without calling out; anything else is decided by __mpol_equal().
 */
static inline int mpol_equal(struct mempolicy *a, struct mempolicy *b)
{
	return (a == b) ? 1 : __mpol_equal(a, b);
}

/* Compare the policies attached to two vmas. */
#define vma_mpol_equal(a,b) mpol_equal(vma_policy(a), vma_policy(b))
111
/*
 * Reset a vma's policy pointer to NULL.
 * Could later add inheritance of the process policy here.
 */
#define mpol_set_vma_default(vma)	((vma)->vm_policy = NULL)
115
116/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700117 * Tree of shared policies for a shared memory region.
118 * Maintain the policies in a pseudo mm that contains vmas. The vmas
119 * carry the policy. As a special twist the pseudo mm is indexed in pages, not
120 * bytes, so that we can work with shared memory segments bigger than
121 * unsigned long.
122 */
123
124struct sp_node {
125 struct rb_node nd;
126 unsigned long start, end;
127 struct mempolicy *policy;
128};
129
130struct shared_policy {
131 struct rb_root root;
132 spinlock_t lock;
133};
134
135static inline void mpol_shared_policy_init(struct shared_policy *info)
136{
137 info->root = RB_ROOT;
138 spin_lock_init(&info->lock);
139}
140
/*
 * Operations on a struct shared_policy.  Only the declarations live in this
 * header; the definitions are out of line.
 */
extern int mpol_set_shared_policy(struct shared_policy *info,
				  struct vm_area_struct *vma,
				  struct mempolicy *new);
extern void mpol_free_shared_policy(struct shared_policy *p);
extern struct mempolicy *mpol_shared_policy_lookup(struct shared_policy *sp,
						   unsigned long idx);
147
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148extern void numa_default_policy(void);
149extern void numa_policy_init(void);
Paul Jackson74cb2152006-01-08 01:01:56 -0800150extern void mpol_rebind_policy(struct mempolicy *pol, const nodemask_t *new);
151extern void mpol_rebind_task(struct task_struct *tsk,
152 const nodemask_t *new);
Andi Kleend42c6992005-07-06 19:56:03 +0200153extern struct mempolicy default_policy;
Christoph Lameter5da7ca82006-01-06 00:10:46 -0800154extern struct zonelist *huge_zonelist(struct vm_area_struct *vma,
155 unsigned long addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700156
extern int policy_zone;

/* Raise policy_zone to k when k is larger than the current value. */
static inline void check_highest_zone(int k)
{
	if (policy_zone < k)
		policy_zone = k;
}
164
Christoph Lameter39743882006-01-08 01:00:51 -0800165int do_migrate_pages(struct mm_struct *mm,
166 const nodemask_t *from_nodes, const nodemask_t *to_nodes, int flags);
167
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168#else
169
/* !CONFIG_NUMA: member-less placeholder so the type name still exists. */
struct mempolicy {
};
171
/* !CONFIG_NUMA stub: any two policies compare equal. */
static inline int mpol_equal(struct mempolicy *a, struct mempolicy *b)
{
	(void)a;
	(void)b;
	return 1;
}

/* !CONFIG_NUMA stub: expands to the constant 1; arguments are not evaluated. */
#define vma_mpol_equal(a,b)	1
177
/* !CONFIG_NUMA stub: expands to an empty statement; vma is not evaluated. */
#define mpol_set_vma_default(vma)	do { } while (0)
179
/* !CONFIG_NUMA stub: does nothing. */
static inline void mpol_free(struct mempolicy *p)
{
	(void)p;
}
183
/* !CONFIG_NUMA stub: does nothing. */
static inline void mpol_get(struct mempolicy *pol)
{
	(void)pol;
}
187
/* !CONFIG_NUMA stub: always returns NULL, whatever is passed in. */
static inline struct mempolicy *mpol_copy(struct mempolicy *old)
{
	(void)old;
	return NULL;
}
192
/* !CONFIG_NUMA: member-less placeholder so the type name still exists. */
struct shared_policy {
};
194
/* !CONFIG_NUMA stub: always fails with -EINVAL. */
static inline int mpol_set_shared_policy(struct shared_policy *info,
					 struct vm_area_struct *vma,
					 struct mempolicy *new)
{
	(void)info;
	(void)vma;
	(void)new;
	return -EINVAL;
}
201
/* !CONFIG_NUMA stub: does nothing. */
static inline void mpol_shared_policy_init(struct shared_policy *info)
{
	(void)info;
}
205
/* !CONFIG_NUMA stub: does nothing. */
static inline void mpol_free_shared_policy(struct shared_policy *p)
{
	(void)p;
}
209
/* !CONFIG_NUMA stub: always returns NULL. */
static inline struct mempolicy *
mpol_shared_policy_lookup(struct shared_policy *sp, unsigned long idx)
{
	(void)sp;
	(void)idx;
	return NULL;
}
215
/* !CONFIG_NUMA stubs: neither macro evaluates its arguments. */
#define vma_policy(vma)			NULL
#define vma_set_policy(vma, pol)	do { } while (0)
218
/* !CONFIG_NUMA stub: does nothing. */
static inline void numa_policy_init(void)
{
	/* intentionally empty */
}
222
/* !CONFIG_NUMA stub: does nothing. */
static inline void numa_default_policy(void)
{
	/* intentionally empty */
}
226
Paul Jackson74cb2152006-01-08 01:01:56 -0800227static inline void mpol_rebind_policy(struct mempolicy *pol,
228 const nodemask_t *new)
229{
230}
231
232static inline void mpol_rebind_task(struct task_struct *tsk,
Paul Jackson68860ec2005-10-30 15:02:36 -0800233 const nodemask_t *new)
234{
235}
236
Christoph Lameter5da7ca82006-01-06 00:10:46 -0800237static inline struct zonelist *huge_zonelist(struct vm_area_struct *vma,
238 unsigned long addr)
239{
240 return NODE_DATA(0)->node_zonelists + gfp_zone(GFP_HIGHUSER);
241}
242
Paul Jackson45b07ef2006-01-08 01:00:56 -0800243static inline int do_migrate_pages(struct mm_struct *mm,
244 const nodemask_t *from_nodes,
245 const nodemask_t *to_nodes, int flags)
246{
247 return 0;
248}
249
/* !CONFIG_NUMA stub: does nothing. */
static inline void check_highest_zone(int k)
{
	(void)k;
}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253#endif /* CONFIG_NUMA */
254#endif /* __KERNEL__ */
255
256#endif