rmap.h 8.5 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10
#ifndef _LINUX_RMAP_H
#define _LINUX_RMAP_H
/*
 * Declarations for Reverse Mapping functions in mm/rmap.c
 */

#include <linux/list.h>
#include <linux/slab.h>
#include <linux/mm.h>
#include <linux/spinlock.h>
11
#include <linux/memcontrol.h>
L
Linus Torvalds 已提交
12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27

/*
 * The anon_vma heads a list of private "related" vmas, to scan if
 * an anonymous page pointing to this anon_vma needs to be unmapped:
 * the vmas on the list will be related by forking, or by splitting.
 *
 * Since vmas come and go as they are split and merged (particularly
 * in mprotect), the mapping field of an anonymous page cannot point
 * directly to a vma: instead it points to an anon_vma, on whose list
 * the related vmas can be easily linked or unlinked.
 *
 * After unlinking the last vma on the list, we must garbage collect
 * the anon_vma object itself: we're guaranteed no page can be
 * pointing to this anon_vma once its vma list is empty.
 */
struct anon_vma {
28
	struct anon_vma *root;	/* Root of this anon_vma tree */
29
	spinlock_t lock;	/* Serialize access to vma list */
30 31 32 33 34 35 36 37 38 39 40
#if defined(CONFIG_KSM) || defined(CONFIG_MIGRATION)

	/*
	 * The external_refcount is taken by either KSM or page migration
	 * to take a reference to an anon_vma when there is no
	 * guarantee that the vma of page tables will exist for
	 * the duration of the operation. A caller that takes
	 * the reference is responsible for clearing up the
	 * anon_vma if they are the last user on release
	 */
	atomic_t external_refcount;
H
Hugh Dickins 已提交
41
#endif
42 43 44 45 46 47 48 49
	/*
	 * NOTE: the LSB of the head.next is set by
	 * mm_take_all_locks() _after_ taking the above lock. So the
	 * head must only be read/written after taking the above lock
	 * to be sure to see a valid next pointer. The LSB bit itself
	 * is serialized by a system wide lock only visible to
	 * mm_take_all_locks() (mm_all_locks_mutex).
	 */
50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70
	struct list_head head;	/* Chain of private "related" vmas */
};

/*
 * The copy-on-write semantics of fork mean that an anon_vma
 * can become associated with multiple processes. Furthermore,
 * each child process will have its own anon_vma, where new
 * pages for that process are instantiated.
 *
 * This structure allows us to find the anon_vmas associated
 * with a VMA, or the VMAs associated with an anon_vma.
 * The "same_vma" list contains the anon_vma_chains linking
 * all the anon_vmas associated with this VMA.
 * The "same_anon_vma" list contains the anon_vma_chains
 * which link all the VMAs associated with this anon_vma.
 */
struct anon_vma_chain {
	struct vm_area_struct *vma;
	struct anon_vma *anon_vma;
	struct list_head same_vma;   /* locked by mmap_sem & page_table_lock */
	struct list_head same_anon_vma;	/* locked by anon_vma->lock */
L
Linus Torvalds 已提交
71 72 73
};

#ifdef CONFIG_MMU
74 75
#if defined(CONFIG_KSM) || defined(CONFIG_MIGRATION)
static inline void anonvma_external_refcount_init(struct anon_vma *anon_vma)
H
Hugh Dickins 已提交
76
{
77
	atomic_set(&anon_vma->external_refcount, 0);
H
Hugh Dickins 已提交
78 79
}

80
static inline int anonvma_external_refcount(struct anon_vma *anon_vma)
H
Hugh Dickins 已提交
81
{
82
	return atomic_read(&anon_vma->external_refcount);
H
Hugh Dickins 已提交
83
}
84 85 86 87 88 89 90

static inline void get_anon_vma(struct anon_vma *anon_vma)
{
	atomic_inc(&anon_vma->external_refcount);
}

void drop_anon_vma(struct anon_vma *);
H
Hugh Dickins 已提交
91
#else
92
static inline void anonvma_external_refcount_init(struct anon_vma *anon_vma)
H
Hugh Dickins 已提交
93 94 95
{
}

96
static inline int anonvma_external_refcount(struct anon_vma *anon_vma)
H
Hugh Dickins 已提交
97 98 99
{
	return 0;
}
100 101 102 103 104 105 106 107

static inline void get_anon_vma(struct anon_vma *anon_vma)
{
}

static inline void drop_anon_vma(struct anon_vma *anon_vma)
{
}
H
Hugh Dickins 已提交
108
#endif /* CONFIG_KSM */
L
Linus Torvalds 已提交
109

H
Hugh Dickins 已提交
110 111 112 113 114 115 116 117
static inline struct anon_vma *page_anon_vma(struct page *page)
{
	if (((unsigned long)page->mapping & PAGE_MAPPING_FLAGS) !=
					    PAGE_MAPPING_ANON)
		return NULL;
	return page_rmapping(page);
}

118
static inline void vma_lock_anon_vma(struct vm_area_struct *vma)
L
Linus Torvalds 已提交
119 120 121
{
	struct anon_vma *anon_vma = vma->anon_vma;
	if (anon_vma)
122
		spin_lock(&anon_vma->root->lock);
L
Linus Torvalds 已提交
123 124
}

125
static inline void vma_unlock_anon_vma(struct vm_area_struct *vma)
L
Linus Torvalds 已提交
126 127 128
{
	struct anon_vma *anon_vma = vma->anon_vma;
	if (anon_vma)
129
		spin_unlock(&anon_vma->root->lock);
L
Linus Torvalds 已提交
130 131
}

132 133
static inline void anon_vma_lock(struct anon_vma *anon_vma)
{
134
	spin_lock(&anon_vma->root->lock);
135 136 137 138
}

static inline void anon_vma_unlock(struct anon_vma *anon_vma)
{
139
	spin_unlock(&anon_vma->root->lock);
140 141
}

L
Linus Torvalds 已提交
142 143 144 145 146
/*
 * anon_vma helper functions.
 */
void anon_vma_init(void);	/* create anon_vma_cachep */
int  anon_vma_prepare(struct vm_area_struct *);
147 148 149
void unlink_anon_vmas(struct vm_area_struct *);
int anon_vma_clone(struct vm_area_struct *, struct vm_area_struct *);
int anon_vma_fork(struct vm_area_struct *, struct vm_area_struct *);
L
Linus Torvalds 已提交
150
void __anon_vma_link(struct vm_area_struct *);
H
Hugh Dickins 已提交
151
void anon_vma_free(struct anon_vma *);
L
Linus Torvalds 已提交
152

153 154 155 156 157 158 159
static inline void anon_vma_merge(struct vm_area_struct *vma,
				  struct vm_area_struct *next)
{
	VM_BUG_ON(vma->anon_vma != next->anon_vma);
	unlink_anon_vmas(next);
}

L
Linus Torvalds 已提交
160 161 162
/*
 * rmap interfaces called when adding or removing pte of page
 */
163
void page_move_anon_rmap(struct page *, struct vm_area_struct *, unsigned long);
L
Linus Torvalds 已提交
164
void page_add_anon_rmap(struct page *, struct vm_area_struct *, unsigned long);
165 166
void do_page_add_anon_rmap(struct page *, struct vm_area_struct *,
			   unsigned long, int);
N
Nick Piggin 已提交
167
void page_add_new_anon_rmap(struct page *, struct vm_area_struct *, unsigned long);
L
Linus Torvalds 已提交
168
void page_add_file_rmap(struct page *);
169
void page_remove_rmap(struct page *);
L
Linus Torvalds 已提交
170

171 172 173 174 175
void hugepage_add_anon_rmap(struct page *, struct vm_area_struct *,
			    unsigned long);
void hugepage_add_new_anon_rmap(struct page *, struct vm_area_struct *,
				unsigned long);

H
Hugh Dickins 已提交
176
static inline void page_dup_rmap(struct page *page)
L
Linus Torvalds 已提交
177 178 179 180 181 182 183
{
	atomic_inc(&page->_mapcount);
}

/*
 * Called from mm/vmscan.c to handle paging out
 */
184 185
int page_referenced(struct page *, int is_locked,
			struct mem_cgroup *cnt, unsigned long *vm_flags);
H
Hugh Dickins 已提交
186 187 188
int page_referenced_one(struct page *, struct vm_area_struct *,
	unsigned long address, unsigned int *mapcount, unsigned long *vm_flags);

189 190 191 192 193 194 195 196
enum ttu_flags {
	TTU_UNMAP = 0,			/* unmap mode */
	TTU_MIGRATION = 1,		/* migration mode */
	TTU_MUNLOCK = 2,		/* munlock mode */
	TTU_ACTION_MASK = 0xff,

	TTU_IGNORE_MLOCK = (1 << 8),	/* ignore mlock */
	TTU_IGNORE_ACCESS = (1 << 9),	/* don't age */
197
	TTU_IGNORE_HWPOISON = (1 << 10),/* corrupted page is recoverable */
198 199 200
};
#define TTU_ACTION(x) ((x) & TTU_ACTION_MASK)

201 202
bool is_vma_temporary_stack(struct vm_area_struct *vma);

203
int try_to_unmap(struct page *, enum ttu_flags flags);
H
Hugh Dickins 已提交
204 205
int try_to_unmap_one(struct page *, struct vm_area_struct *,
			unsigned long address, enum ttu_flags flags);
L
Linus Torvalds 已提交
206

207 208 209
/*
 * Called from mm/filemap_xip.c to unmap empty zero page
 */
210
pte_t *__page_check_address(struct page *, struct mm_struct *,
N
Nick Piggin 已提交
211
				unsigned long, spinlock_t **, int);
212

213 214 215 216 217 218 219 220 221 222 223
static inline pte_t *page_check_address(struct page *page, struct mm_struct *mm,
					unsigned long address,
					spinlock_t **ptlp, int sync)
{
	pte_t *ptep;

	__cond_lock(*ptlp, ptep = __page_check_address(page, mm, address,
						       ptlp, sync));
	return ptep;
}

L
Linus Torvalds 已提交
224 225 226 227 228
/*
 * Used by swapoff to help locate where page is expected in vma.
 */
unsigned long page_address_in_vma(struct page *, struct vm_area_struct *);

229 230 231 232 233 234 235 236
/*
 * Cleans the PTEs of shared mappings.
 * (and since clean PTEs should also be readonly, write protects them too)
 *
 * returns the number of cleaned PTEs.
 */
int page_mkclean(struct page *);

N
Nick Piggin 已提交
237 238 239 240 241 242
/*
 * called in munlock()/munmap() path to check for other vmas holding
 * the page mlocked.
 */
int try_to_munlock(struct page *);

243 244 245
/*
 * Called by memory-failure.c to kill processes.
 */
246 247 248 249 250 251 252 253 254 255 256 257 258 259
struct anon_vma *__page_lock_anon_vma(struct page *page);

static inline struct anon_vma *page_lock_anon_vma(struct page *page)
{
	struct anon_vma *anon_vma;

	__cond_lock(RCU, anon_vma = __page_lock_anon_vma(page));

	/* (void) is needed to make gcc happy */
	(void) __cond_lock(&anon_vma->root->lock, anon_vma);

	return anon_vma;
}

260
void page_unlock_anon_vma(struct anon_vma *anon_vma);
261
int page_mapped_in_vma(struct page *page, struct vm_area_struct *vma);
262

263 264 265 266 267 268
/*
 * Called by migrate.c to remove migration ptes, but might be used more later.
 */
int rmap_walk(struct page *page, int (*rmap_one)(struct page *,
		struct vm_area_struct *, unsigned long, void *), void *arg);

L
Linus Torvalds 已提交
269 270 271 272 273 274
#else	/* !CONFIG_MMU */

#define anon_vma_init()		do {} while (0)
#define anon_vma_prepare(vma)	(0)
#define anon_vma_link(vma)	do {} while (0)

275 276 277 278 279
static inline int page_referenced(struct page *page, int is_locked,
				  struct mem_cgroup *cnt,
				  unsigned long *vm_flags)
{
	*vm_flags = 0;
280
	return 0;
281 282
}

283
#define try_to_unmap(page, refs) SWAP_FAIL
L
Linus Torvalds 已提交
284

285 286 287 288 289 290
static inline int page_mkclean(struct page *page)
{
	return 0;
}


L
Linus Torvalds 已提交
291 292 293 294 295 296 297 298
#endif	/* CONFIG_MMU */

/*
 * Return values of try_to_unmap
 */
#define SWAP_SUCCESS	0
#define SWAP_AGAIN	1
#define SWAP_FAIL	2
N
Nick Piggin 已提交
299
#define SWAP_MLOCK	3
L
Linus Torvalds 已提交
300 301

#endif	/* _LINUX_RMAP_H */