mempolicy.h 6.9 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10
#ifndef _LINUX_MEMPOLICY_H
#define _LINUX_MEMPOLICY_H 1

#include <linux/errno.h>

/*
 * NUMA memory policies for Linux.
 * Copyright 2003,2004 Andi Kleen SuSE Labs
 */

11 12 13 14 15 16
/*
 * Both the MPOL_* mempolicy mode and the MPOL_F_* optional mode flags are
 * passed by the user to either set_mempolicy() or mbind() in an 'int' argument.
 * The MPOL_MODE_FLAGS macro determines the legal set of optional mode flags.
 */

L
Linus Torvalds 已提交
17
/* Policies */
18 19 20 21 22 23 24
/*
 * Policy modes.  The values are consecutive starting at zero; MPOL_MAX
 * is left implicit so that it keeps following the last real mode.
 */
enum {
	MPOL_DEFAULT	= 0,
	MPOL_PREFERRED	= 1,
	MPOL_BIND	= 2,
	MPOL_INTERLEAVE	= 3,
	MPOL_MAX,	/* always last member of enum */
};
L
Linus Torvalds 已提交
25

26
/*
 * Flags for set_mempolicy
 *
 * These occupy bits 15 and 14, above the small MPOL_* mode values.
 */
#define MPOL_F_STATIC_NODES	(1 << 15)
#define MPOL_F_RELATIVE_NODES	(1 << 14)

/*
 * MPOL_MODE_FLAGS is the union of all possible optional mode flags passed to
 * either set_mempolicy() or mbind().
 */
#define MPOL_MODE_FLAGS	(MPOL_F_STATIC_NODES | MPOL_F_RELATIVE_NODES)
35 36

/* Flags for get_mempolicy (distinct single-bit values, may be OR-ed) */
#define MPOL_F_NODE	(1<<0)	/* return next IL mode instead of node mask */
#define MPOL_F_ADDR	(1<<1)	/* look up vma using address */
#define MPOL_F_MEMS_ALLOWED (1<<2) /* return allowed memories */
L
Linus Torvalds 已提交
40 41 42

/* Flags for mbind */
#define MPOL_MF_STRICT	(1<<0)	/* Verify existing pages in the mapping */
#define MPOL_MF_MOVE	(1<<1)	/* Move pages owned by this process to conform to mapping */
#define MPOL_MF_MOVE_ALL (1<<2)	/* Move every page to conform to mapping */
#define MPOL_MF_INTERNAL (1<<3)	/* Internal flags start here */
L
Linus Torvalds 已提交
46 47 48 49 50 51 52

#ifdef __KERNEL__

#include <linux/mmzone.h>
#include <linux/slab.h>
#include <linux/rbtree.h>
#include <linux/spinlock.h>
53
#include <linux/nodemask.h>
L
Linus Torvalds 已提交
54

55
struct mm_struct;
L
Linus Torvalds 已提交
56 57 58 59 60 61 62 63 64 65 66 67 68 69

#ifdef CONFIG_NUMA

/*
 * Describe a memory policy.
 *
 * A mempolicy can be either associated with a process or with a VMA.
 * For VMA related allocations the VMA policy is preferred, otherwise
 * the process policy is used. Interrupts ignore the memory policy
 * of the current process.
 *
 * Locking policy for interlave:
 * In process context there is no locking because only the process accesses
 * its own state. All vma manipulation is somewhat protected by a down_read on
70
 * mmap_sem.
L
Linus Torvalds 已提交
71 72
 *
 * Freeing policy:
73
 * Mempolicy objects are reference counted.  A mempolicy will be freed when
74
 * mpol_put() decrements the reference count to zero.
L
Linus Torvalds 已提交
75
 *
76 77
 * Duplicating policy objects:
 * mpol_dup() allocates a new mempolicy and copies the specified mempolicy
78
 * to the new storage.  The reference count of the new object is initialized
79
 * to 1, representing the caller of mpol_dup().
L
Linus Torvalds 已提交
80 81 82
 */
struct mempolicy {
	atomic_t refcnt;
83
	unsigned short mode; 	/* See MPOL_* above */
84
	unsigned short flags;	/* See set_mempolicy() MPOL_F_* above */
L
Linus Torvalds 已提交
85 86
	union {
		short 		 preferred_node; /* preferred */
87
		nodemask_t	 nodes;		/* interleave/bind */
L
Linus Torvalds 已提交
88 89
		/* undefined for default */
	} v;
90 91 92 93
	union {
		nodemask_t cpuset_mems_allowed;	/* relative to these nodes */
		nodemask_t user_nodemask;	/* nodemask passed by user */
	} w;
L
Linus Torvalds 已提交
94 95 96 97 98 99 100
};

/*
 * Support for managing mempolicy data objects (clone, copy, destroy)
 * The default fast path of a NULL MPOL_DEFAULT policy is always inlined.
 */

101 102
/*
 * Release a reference on @pol.  NULL is accepted and ignored inline, so
 * the out-of-line __mpol_put() is only ever called with a real policy.
 */
extern void __mpol_put(struct mempolicy *pol);
static inline void mpol_put(struct mempolicy *pol)
{
	if (pol)
		__mpol_put(pol);
}

108 109
/*
 * Duplicate @pol.  A NULL policy is returned unchanged without calling
 * out of line; otherwise the result is whatever __mpol_dup() returns.
 */
extern struct mempolicy *__mpol_dup(struct mempolicy *pol);
static inline struct mempolicy *mpol_dup(struct mempolicy *pol)
{
	if (pol)
		pol = __mpol_dup(pol);
	return pol;
}

/*
 * Accessors for the mempolicy pointer kept in a VMA's vm_policy field:
 * vma_policy() expands to the field itself, vma_set_policy() to an
 * assignment expression storing @pol into it.
 */
#define vma_policy(vma) ((vma)->vm_policy)
#define vma_set_policy(vma, pol) ((vma)->vm_policy = (pol))

/* Take one more reference on @pol; a NULL policy is silently skipped. */
static inline void mpol_get(struct mempolicy *pol)
{
	if (!pol)
		return;

	atomic_inc(&pol->refcnt);
}

/*
 * Compare two policies.  Identical pointers (including two NULLs) yield 1
 * without leaving the inline path; any other pair is handed to
 * __mpol_equal() and its result is returned as-is.
 */
extern int __mpol_equal(struct mempolicy *a, struct mempolicy *b);
static inline int mpol_equal(struct mempolicy *a, struct mempolicy *b)
{
	return (a == b) ? 1 : __mpol_equal(a, b);
}

/*
 * Tree of shared policies for a shared memory region.
 * Maintain the policies in a pseudo mm that contains vmas. The vmas
 * carry the policy. As a special twist the pseudo mm is indexed in pages, not
 * bytes, so that we can work with shared memory segments bigger than
 * unsigned long.
 */

/* One entry in a shared policy tree: a range and the policy attached to it. */
struct sp_node {
	struct rb_node nd;		/* tree linkage */
	unsigned long start;		/* range bounds; presumably page */
	unsigned long end;		/* indices -- TODO confirm */
	struct mempolicy *policy;	/* policy for this range */
};

/* Container for a tree of shared policies. */
struct shared_policy {
	struct rb_root root;	/* rb-tree root; presumably of struct sp_node */
	spinlock_t lock;	/* NOTE(review): presumably guards root -- confirm */
};

152
/*
 * Initialise @info.  @mode, @flags and @nodes presumably describe an
 * initial policy (MPOL_* mode, MPOL_F_* mode flags, node mask) -- confirm
 * against the implementation.
 */
void mpol_shared_policy_init(struct shared_policy *info, unsigned short mode,
				unsigned short flags, nodemask_t *nodes);
L
Linus Torvalds 已提交
154 155 156 157 158 159 160 161 162
/*
 * Shared-policy operations for CONFIG_NUMA builds; bodies are out of line.
 * NOTE(review): exact semantics are not visible from this header.
 * Presumably set installs @new for the range described by @vma, free
 * tears the tree down, and lookup returns the policy covering index @idx
 * -- confirm against the implementation.
 */
int mpol_set_shared_policy(struct shared_policy *info,
				struct vm_area_struct *vma,
				struct mempolicy *new);
void mpol_free_shared_policy(struct shared_policy *p);
struct mempolicy *mpol_shared_policy_lookup(struct shared_policy *sp,
					    unsigned long idx);

/* NUMA policy entry points for CONFIG_NUMA builds; defined outside this header. */
extern void numa_default_policy(void);
extern void numa_policy_init(void);
163 164
/*
 * Rebind hooks, defined outside this header.
 * NOTE(review): presumably @new is the new set of allowed nodes for the
 * task / mm -- confirm against the implementation.
 */
extern void mpol_rebind_task(struct task_struct *tsk,
					const nodemask_t *new);
extern void mpol_rebind_mm(struct mm_struct *mm, nodemask_t *new);
extern void mpol_fix_fork_child_flag(struct task_struct *p);
167

168
/*
 * huge_zonelist() returns a zonelist for @vma / @addr and reports
 * additional results through the @mpol and @nodemask out-parameters.
 * NOTE(review): reference-count ownership of *@mpol is not visible here.
 */
extern struct zonelist *huge_zonelist(struct vm_area_struct *vma,
				unsigned long addr, gfp_t gfp_flags,
				struct mempolicy **mpol, nodemask_t **nodemask);
/* Returns an unsigned value for @policy; presumably a node id -- confirm. */
extern unsigned slab_node(struct mempolicy *policy);
L
Linus Torvalds 已提交
172

173
extern enum zone_type policy_zone;
174

175
static inline void check_highest_zone(enum zone_type k)
176
{
177
	if (k > policy_zone && k != ZONE_MOVABLE)
178 179 180
		policy_zone = k;
}

181 182 183
/*
 * Defined outside this header.
 * NOTE(review): presumably migrates pages of @mm from @from_nodes to
 * @to_nodes; meaning of @flags and of the return value to be confirmed.
 */
int do_migrate_pages(struct mm_struct *mm,
	const nodemask_t *from_nodes, const nodemask_t *to_nodes, int flags);

L
Linus Torvalds 已提交
184 185 186 187 188 189 190 191 192
#else

/* !CONFIG_NUMA: empty placeholder so code can still name the type. */
struct mempolicy {};

/* !CONFIG_NUMA stub: every pair of policies is reported as equal. */
static inline int mpol_equal(struct mempolicy *a, struct mempolicy *b)
{
	return 1;
}

193
/* !CONFIG_NUMA stub: there is nothing to release, so this does nothing. */
static inline void mpol_put(struct mempolicy *p)
{
}

/* !CONFIG_NUMA stub: no reference counting is performed. */
static inline void mpol_get(struct mempolicy *pol)
{
}

201
/* !CONFIG_NUMA stub: never allocates; always returns NULL. */
static inline struct mempolicy *mpol_dup(struct mempolicy *old)
{
	return NULL;
}

/* !CONFIG_NUMA: empty placeholder so code can still name the type. */
struct shared_policy {};

/* !CONFIG_NUMA stub: setting a shared policy always fails with -EINVAL. */
static inline int mpol_set_shared_policy(struct shared_policy *info,
					struct vm_area_struct *vma,
					struct mempolicy *new)
{
	return -EINVAL;
}

215
/* !CONFIG_NUMA stub: all arguments are ignored and nothing is initialised. */
static inline void mpol_shared_policy_init(struct shared_policy *info,
		unsigned short mode, unsigned short flags, nodemask_t *nodes)
{
}

/* !CONFIG_NUMA stub: nothing to free. */
static inline void mpol_free_shared_policy(struct shared_policy *p)
{
}

/* !CONFIG_NUMA stub: lookups never find a policy and return NULL. */
static inline struct mempolicy *
mpol_shared_policy_lookup(struct shared_policy *sp, unsigned long idx)
{
	return NULL;
}

/*
 * !CONFIG_NUMA variants: vma_policy() always evaluates to NULL and
 * vma_set_policy() expands to an empty statement; neither evaluates
 * its arguments.
 */
#define vma_policy(vma) NULL
#define vma_set_policy(vma, pol) do {} while(0)

/* !CONFIG_NUMA stub: no policy initialisation is needed. */
static inline void numa_policy_init(void)
{
}

/* !CONFIG_NUMA stub: does nothing. */
static inline void numa_default_policy(void)
{
}

241
static inline void mpol_rebind_task(struct task_struct *tsk,
242 243 244 245
					const nodemask_t *new)
{
}

246 247 248 249
/* !CONFIG_NUMA stub: both arguments are ignored; nothing is rebound. */
static inline void mpol_rebind_mm(struct mm_struct *mm, nodemask_t *new)
{
}

250 251 252 253
/* !CONFIG_NUMA stub: does nothing. */
static inline void mpol_fix_fork_child_flag(struct task_struct *p)
{
}

254
/*
 * !CONFIG_NUMA stub: @vma and @addr are ignored.  Both out-parameters are
 * set to NULL (they are dereferenced unconditionally, so callers must pass
 * valid pointers) and the zonelist of node 0 for @gfp_flags is returned.
 */
static inline struct zonelist *huge_zonelist(struct vm_area_struct *vma,
				unsigned long addr, gfp_t gfp_flags,
				struct mempolicy **mpol, nodemask_t **nodemask)
{
	*mpol = NULL;
	*nodemask = NULL;
	return node_zonelist(0, gfp_flags);
}

263 264 265 266 267 268 269
/* !CONFIG_NUMA stub: performs no migration and always returns 0. */
static inline int do_migrate_pages(struct mm_struct *mm,
			const nodemask_t *from_nodes,
			const nodemask_t *to_nodes, int flags)
{
	return 0;
}

270 271 272
/*
 * !CONFIG_NUMA stub: no policy zone is tracked, so @k is ignored.
 * NOTE(review): the parameter is 'int' here but 'enum zone_type' in the
 * CONFIG_NUMA variant; consider aligning the two signatures.
 */
static inline void check_highest_zone(int k)
{
}
L
Linus Torvalds 已提交
273 274 275 276
#endif /* CONFIG_NUMA */
#endif /* __KERNEL__ */

#endif