swap.h 14.1 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7
#ifndef _LINUX_SWAP_H
#define _LINUX_SWAP_H

#include <linux/spinlock.h>
#include <linux/linkage.h>
#include <linux/mmzone.h>
#include <linux/list.h>
8
#include <linux/memcontrol.h>
L
Linus Torvalds 已提交
9
#include <linux/sched.h>
10
#include <linux/node.h>
A
Andrew Morton 已提交
11

L
Linus Torvalds 已提交
12 13 14
#include <asm/atomic.h>
#include <asm/page.h>

15 16
struct notifier_block;

A
Andrew Morton 已提交
17 18
struct bio;

L
Linus Torvalds 已提交
19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36
#define SWAP_FLAG_PREFER	0x8000	/* set if swap priority specified */
#define SWAP_FLAG_PRIO_MASK	0x7fff
#define SWAP_FLAG_PRIO_SHIFT	0

/*
 * Test whether the running task has PF_KSWAPD set in its flags.
 *
 * Returns the masked flag word, so the result is non-zero (not
 * necessarily 1) when the flag is set and 0 when it is clear.
 */
static inline int current_is_kswapd(void)
{
	return current->flags & PF_KSWAPD;
}

/*
 * MAX_SWAPFILES defines the maximum number of swaptypes: things which can
 * be swapped to.  The swap type and the offset into that swap type are
 * encoded into pte's and into pgoff_t's in the swapcache.  Using five bits
 * for the type means that the maximum number of swapcache pages is 27 bits
 * on 32-bit-pgoff_t architectures.  And that assumes that the architecture packs
 * the type/offset into the pte as 5/27 as well.
 */
#define MAX_SWAPFILES_SHIFT	5
37 38 39 40 41 42 43 44 45 46 47 48 49 50

/*
 * Use some of the swap files numbers for other purposes. This
 * is a convenient way to hook into the VM to trigger special
 * actions on faults.
 */

/*
 * NUMA node memory migration support
 */
#ifdef CONFIG_MIGRATION
#define SWP_MIGRATION_NUM 2
#define SWP_MIGRATION_READ	(MAX_SWAPFILES + SWP_HWPOISON_NUM)
#define SWP_MIGRATION_WRITE	(MAX_SWAPFILES + SWP_HWPOISON_NUM + 1)
51
#else
52
#define SWP_MIGRATION_NUM 0
53
#endif
L
Linus Torvalds 已提交
54

55 56 57 58 59 60 61 62 63 64 65 66 67
/*
 * Handling of hardware poisoned pages with memory corruption.
 */
#ifdef CONFIG_MEMORY_FAILURE
#define SWP_HWPOISON_NUM 1
#define SWP_HWPOISON		MAX_SWAPFILES
#else
#define SWP_HWPOISON_NUM 0
#endif

#define MAX_SWAPFILES \
	((1 << MAX_SWAPFILES_SHIFT) - SWP_MIGRATION_NUM - SWP_HWPOISON_NUM)

L
Linus Torvalds 已提交
68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85
/*
 * Magic header for a swap area. The first part of the union is
 * what the swap magic looks like for the old (limited to 128MB)
 * swap area format, the second part of the union adds - in the
 * old reserved area - some extra information. Note that the first
 * kilobyte is reserved for boot loader or disk label stuff...
 *
 * Having the magic at the end of the PAGE_SIZE makes detecting swap
 * areas somewhat tricky on machines that support multiple page sizes.
 * For 2.5 we'll probably want to move the magic to just beyond the
 * bootbits...
 */
union swap_header {
	struct {
		char reserved[PAGE_SIZE - 10];
		char magic[10];			/* SWAP-SPACE or SWAPSPACE2 */
	} magic;
	struct {
86 87 88 89 90 91 92 93
		char		bootbits[1024];	/* Space for disklabel etc. */
		__u32		version;
		__u32		last_page;
		__u32		nr_badpages;
		unsigned char	sws_uuid[16];
		unsigned char	sws_volume[16];
		__u32		padding[117];
		__u32		badpages[1];
L
Linus Torvalds 已提交
94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144
	} info;
};

 /* A swap entry has to fit into an "unsigned long", as
  * the entry is hidden in the "index" field of the
  * swapper address space.
  */
typedef struct {
	unsigned long val;
} swp_entry_t;

/*
 * current->reclaim_state points to one of these when a task is running
 * memory reclaim
 */
struct reclaim_state {
	unsigned long reclaimed_slab;
};

#ifdef __KERNEL__

struct address_space;
struct sysinfo;
struct writeback_control;
struct zone;

/*
 * A swap extent maps a range of a swapfile's PAGE_SIZE pages onto a range of
 * disk blocks.  A list of swap extents maps the entire swapfile.  (Where the
 * term `swapfile' refers to either a blockdevice or an IS_REG file.  Apart
 * from setup, they're handled identically.)
 *
 * We always assume that blocks are of size PAGE_SIZE.
 */
struct swap_extent {
	struct list_head list;
	pgoff_t start_page;
	pgoff_t nr_pages;
	sector_t start_block;
};

/*
 * Max bad pages in the new format..
 */
#define __swapoffset(x) ((unsigned long)&((union swap_header *)0)->x)
#define MAX_SWAP_BADPAGES \
	((__swapoffset(magic.magic) - __swapoffset(info.badpages)) / sizeof(int))

enum {
	SWP_USED	= (1 << 0),	/* is slot in swap_info[] used? */
	SWP_WRITEOK	= (1 << 1),	/* ok to write to this swap?	*/
145
	SWP_DISCARDABLE = (1 << 2),	/* blkdev supports discard */
146
	SWP_DISCARDING	= (1 << 3),	/* now discarding a free cluster */
147
	SWP_SOLIDSTATE	= (1 << 4),	/* blkdev seeks are cheap */
H
Hugh Dickins 已提交
148
	SWP_CONTINUED	= (1 << 5),	/* swap_map has count continuation */
149
	SWP_BLKDEV	= (1 << 6),	/* its a block device */
150 151
					/* add others here before... */
	SWP_SCANNING	= (1 << 8),	/* refcount in scan_swap_map */
L
Linus Torvalds 已提交
152 153 154 155
};

#define SWAP_CLUSTER_MAX 32

H
Hugh Dickins 已提交
156 157 158 159 160
#define SWAP_MAP_MAX	0x3e	/* Max duplication count, in first swap_map */
#define SWAP_MAP_BAD	0x3f	/* Note pageblock is bad, in first swap_map */
#define SWAP_HAS_CACHE	0x40	/* Flag page is cached, in first swap_map */
#define SWAP_CONT_MAX	0x7f	/* Max count, in each swap_map continuation */
#define COUNT_CONTINUED	0x80	/* See swap_map continuation for full count */
H
Hugh Dickins 已提交
161
#define SWAP_MAP_SHMEM	0xbf	/* Owned by shmem/tmpfs, in first swap_map */
H
Hugh Dickins 已提交
162

L
Linus Torvalds 已提交
163 164 165 166
/*
 * The in-memory structure used to track swap areas.
 */
struct swap_info_struct {
167 168 169 170
	unsigned long	flags;		/* SWP_USED etc: see above */
	signed short	prio;		/* swap priority of this type */
	signed char	type;		/* strange name for an index */
	signed char	next;		/* next type on the swap list */
H
Hugh Dickins 已提交
171 172 173 174 175 176 177 178
	unsigned int	max;		/* extent of the swap_map */
	unsigned char *swap_map;	/* vmalloc'ed array of usage counts */
	unsigned int lowest_bit;	/* index of first free in swap_map */
	unsigned int highest_bit;	/* index of last free in swap_map */
	unsigned int pages;		/* total of usable pages of swap */
	unsigned int inuse_pages;	/* number of those currently in use */
	unsigned int cluster_next;	/* likely index for next allocation */
	unsigned int cluster_nr;	/* countdown to next cluster search */
179 180
	unsigned int lowest_alloc;	/* while preparing discard cluster */
	unsigned int highest_alloc;	/* while preparing discard cluster */
H
Hugh Dickins 已提交
181 182 183 184 185
	struct swap_extent *curr_swap_extent;
	struct swap_extent first_swap_extent;
	struct block_device *bdev;	/* swap device or bdev of swap file */
	struct file *swap_file;		/* seldom referenced */
	unsigned int old_block_size;	/* seldom referenced */
L
Linus Torvalds 已提交
186 187 188 189 190 191 192 193 194 195 196 197
};

struct swap_list_t {
	int head;	/* head of priority-ordered swapfile list */
	int next;	/* swapfile to be used next */
};

/* Swap 50% full? Release swapcache more aggressively.. */
#define vm_swap_full() (nr_swap_pages*2 < total_swap_pages)

/* linux/mm/page_alloc.c */
extern unsigned long totalram_pages;
198
extern unsigned long totalreserve_pages;
L
Linus Torvalds 已提交
199 200 201
extern unsigned int nr_free_buffer_pages(void);
extern unsigned int nr_free_pagecache_pages(void);

C
Christoph Lameter 已提交
202 203 204 205
/* Definition of global_page_state not available yet */
#define nr_free_pages() global_page_state(NR_FREE_PAGES)


L
Linus Torvalds 已提交
206
/* linux/mm/swap.c */
207 208
extern void __lru_cache_add(struct page *, enum lru_list lru);
extern void lru_cache_add_lru(struct page *, enum lru_list lru);
209 210
extern void activate_page(struct page *);
extern void mark_page_accessed(struct page *);
L
Linus Torvalds 已提交
211
extern void lru_add_drain(void);
212
extern int lru_add_drain_all(void);
213
extern void rotate_reclaimable_page(struct page *page);
L
Linus Torvalds 已提交
214 215
extern void swap_setup(void);

L
Lee Schermerhorn 已提交
216 217
extern void add_page_to_unevictable_list(struct page *page);

218 219 220 221
/**
 * lru_cache_add_anon - add a page to the inactive anon LRU list
 * @page: the page to add
 */
222
static inline void lru_cache_add_anon(struct page *page)
223
{
224
	__lru_cache_add(page, LRU_INACTIVE_ANON);
225 226
}

227 228 229 230 231
/*
 * Add @page to the LRU lists through __lru_cache_add(), selecting the
 * LRU_INACTIVE_FILE list.
 */
static inline void lru_cache_add_file(struct page *page)
{
	__lru_cache_add(page, LRU_INACTIVE_FILE);
}

232 233 234 235 236
/* LRU Isolation modes. */
#define ISOLATE_INACTIVE 0	/* Isolate inactive pages. */
#define ISOLATE_ACTIVE 1	/* Isolate active pages. */
#define ISOLATE_BOTH 2		/* Isolate both active and inactive pages. */

L
Linus Torvalds 已提交
237
/* linux/mm/vmscan.c */
238
extern unsigned long try_to_free_pages(struct zonelist *zonelist, int order,
239
					gfp_t gfp_mask, nodemask_t *mask);
240
extern unsigned long try_to_free_mem_cgroup_pages(struct mem_cgroup *mem,
K
KOSAKI Motohiro 已提交
241 242
						  gfp_t gfp_mask, bool noswap,
						  unsigned int swappiness);
243 244 245 246 247
extern unsigned long mem_cgroup_shrink_node_zone(struct mem_cgroup *mem,
						gfp_t gfp_mask, bool noswap,
						unsigned int swappiness,
						struct zone *zone,
						int nid);
248
extern int __isolate_lru_page(struct page *page, int mode, int file);
249
extern unsigned long shrink_all_memory(unsigned long nr_pages);
L
Linus Torvalds 已提交
250
extern int vm_swappiness;
C
Christoph Lameter 已提交
251
extern int remove_mapping(struct address_space *mapping, struct page *page);
252
extern long vm_total_pages;
C
Christoph Lameter 已提交
253

254 255
#ifdef CONFIG_NUMA
extern int zone_reclaim_mode;
256
extern int sysctl_min_unmapped_ratio;
257
extern int sysctl_min_slab_ratio;
258 259 260 261 262 263 264 265 266
extern int zone_reclaim(struct zone *, gfp_t, unsigned int);
#else
#define zone_reclaim_mode 0
static inline int zone_reclaim(struct zone *z, gfp_t mask, unsigned int order)
{
	return 0;
}
#endif

L
Lee Schermerhorn 已提交
267
extern int page_evictable(struct page *page, struct vm_area_struct *vma);
268
extern void scan_mapping_unevictable_pages(struct address_space *);
269 270

extern unsigned long scan_unevictable_pages;
271
extern int scan_unevictable_handler(struct ctl_table *, int,
272 273 274
					void __user *, size_t *, loff_t *);
extern int scan_unevictable_register_node(struct node *node);
extern void scan_unevictable_unregister_node(struct node *node);
L
Lee Schermerhorn 已提交
275

276
extern int kswapd_run(int nid);
277
extern void kswapd_stop(int nid);
278

L
Linus Torvalds 已提交
279 280 281 282 283 284 285 286 287
#ifdef CONFIG_MMU
/* linux/mm/shmem.c */
extern int shmem_unuse(swp_entry_t entry, struct page *page);
#endif /* CONFIG_MMU */

extern void swap_unplug_io_fn(struct backing_dev_info *, struct page *);

#ifdef CONFIG_SWAP
/* linux/mm/page_io.c */
288
extern int swap_readpage(struct page *);
L
Linus Torvalds 已提交
289
extern int swap_writepage(struct page *page, struct writeback_control *wbc);
290
extern void end_swap_bio_read(struct bio *bio, int err);
L
Linus Torvalds 已提交
291 292 293 294 295

/* linux/mm/swap_state.c */
extern struct address_space swapper_space;
#define total_swapcache_pages  swapper_space.nrpages
extern void show_swap_cache_info(void);
296
extern int add_to_swap(struct page *);
297
extern int add_to_swap_cache(struct page *, swp_entry_t, gfp_t);
L
Linus Torvalds 已提交
298 299 300 301
extern void __delete_from_swap_cache(struct page *);
extern void delete_from_swap_cache(struct page *);
extern void free_page_and_swap_cache(struct page *);
extern void free_pages_and_swap_cache(struct page **, int);
302
extern struct page *lookup_swap_cache(swp_entry_t);
303
extern struct page *read_swap_cache_async(swp_entry_t, gfp_t,
304
			struct vm_area_struct *vma, unsigned long addr);
305
extern struct page *swapin_readahead(swp_entry_t, gfp_t,
306 307
			struct vm_area_struct *vma, unsigned long addr);

L
Linus Torvalds 已提交
308
/* linux/mm/swapfile.c */
309
extern long nr_swap_pages;
L
Linus Torvalds 已提交
310 311 312
extern long total_swap_pages;
extern void si_swapinfo(struct sysinfo *);
extern swp_entry_t get_swap_page(void);
313
extern swp_entry_t get_swap_page_of_type(int);
L
Linus Torvalds 已提交
314
extern int valid_swaphandles(swp_entry_t, unsigned long *);
H
Hugh Dickins 已提交
315
extern int add_swap_count_continuation(swp_entry_t, gfp_t);
H
Hugh Dickins 已提交
316
extern void swap_shmem_alloc(swp_entry_t);
H
Hugh Dickins 已提交
317 318
extern int swap_duplicate(swp_entry_t);
extern int swapcache_prepare(swp_entry_t);
L
Linus Torvalds 已提交
319
extern void swap_free(swp_entry_t);
320
extern void swapcache_free(swp_entry_t, struct page *page);
321
extern int free_swap_and_cache(swp_entry_t);
322
extern int swap_type_of(dev_t, sector_t, struct block_device **);
323
extern unsigned int count_swap_pages(int, int);
324
extern sector_t map_swap_page(struct page *, struct block_device **);
325
extern sector_t swapdev_block(int, pgoff_t);
326
extern int reuse_swap_page(struct page *);
327
extern int try_to_free_swap(struct page *);
L
Linus Torvalds 已提交
328 329 330
struct backing_dev_info;

/* linux/mm/thrash.c */
H
Hugh Dickins 已提交
331 332
extern struct mm_struct *swap_token_mm;
extern void grab_swap_token(struct mm_struct *);
L
Linus Torvalds 已提交
333 334 335 336 337 338 339 340 341 342 343 344 345
extern void __put_swap_token(struct mm_struct *);

/* Returns 1 when @mm is the mm recorded in swap_token_mm, otherwise 0. */
static inline int has_swap_token(struct mm_struct *mm)
{
	return swap_token_mm == mm;
}

/*
 * Give up the swap token on behalf of @mm.  Nothing happens unless
 * has_swap_token() reports that @mm is the current holder.
 */
static inline void put_swap_token(struct mm_struct *mm)
{
	if (!has_swap_token(mm))
		return;

	__put_swap_token(mm);
}

346 347 348 349 350
/* Drop the swap token from whichever mm swap_token_mm currently names. */
static inline void disable_swap_token(void)
{
	struct mm_struct *holder = swap_token_mm;

	put_swap_token(holder);
}

K
KAMEZAWA Hiroyuki 已提交
351
#ifdef CONFIG_CGROUP_MEM_RES_CTLR
K
KAMEZAWA Hiroyuki 已提交
352 353
extern void
mem_cgroup_uncharge_swapcache(struct page *page, swp_entry_t ent, bool swapout);
354
extern int mem_cgroup_count_swap_user(swp_entry_t ent, struct page **pagep);
K
KAMEZAWA Hiroyuki 已提交
355
#else
356
static inline void
K
KAMEZAWA Hiroyuki 已提交
357
mem_cgroup_uncharge_swapcache(struct page *page, swp_entry_t ent, bool swapout)
358 359 360 361 362 363 364
{
}
#endif
#ifdef CONFIG_CGROUP_MEM_RES_CTLR_SWAP
extern void mem_cgroup_uncharge_swap(swp_entry_t ent);
#else
static inline void mem_cgroup_uncharge_swap(swp_entry_t ent)
K
KAMEZAWA Hiroyuki 已提交
365 366 367 368
{
}
#endif

L
Linus Torvalds 已提交
369 370
#else /* CONFIG_SWAP */

371 372
#define nr_swap_pages				0L
#define total_swap_pages			0L
L
Linus Torvalds 已提交
373 374 375 376
#define total_swapcache_pages			0UL

#define si_swapinfo(val) \
	do { (val)->freeswap = (val)->totalswap = 0; } while (0)
377 378
/* only sparc can not include linux/pagemap.h in this file
 * so leave page_cache_release and release_pages undeclared... */
L
Linus Torvalds 已提交
379 380 381 382 383
/*
 * In the !CONFIG_SWAP branch these map straight onto page_cache_release()
 * and release_pages() (the latter with 0 as its last argument).
 *
 * Neither expansion ends in a semicolon: the caller supplies it, so both
 * macros behave like ordinary function calls and can be used as the body
 * of an unbraced if/else.
 */
#define free_page_and_swap_cache(page) \
	page_cache_release(page)
#define free_pages_and_swap_cache(pages, nr) \
	release_pages((pages), (nr), 0)

384 385 386 387
static inline void show_swap_cache_info(void)
{
}

388
#define free_swap_and_cache(swp)	is_migration_entry(swp)
389
#define swapcache_prepare(swp)		is_migration_entry(swp)
390

H
Hugh Dickins 已提交
391
static inline int add_swap_count_continuation(swp_entry_t swp, gfp_t gfp_mask)
392
{
H
Hugh Dickins 已提交
393 394 395
	return 0;
}

H
Hugh Dickins 已提交
396 397 398 399
static inline void swap_shmem_alloc(swp_entry_t swp)
{
}

H
Hugh Dickins 已提交
400 401 402
static inline int swap_duplicate(swp_entry_t swp)
{
	return 0;
403 404
}

405 406 407 408
static inline void swap_free(swp_entry_t swp)
{
}

409 410 411 412
static inline void swapcache_free(swp_entry_t swp, struct page *page)
{
}

413
static inline struct page *swapin_readahead(swp_entry_t swp, gfp_t gfp_mask,
414 415 416 417 418
			struct vm_area_struct *vma, unsigned long addr)
{
	return NULL;
}

H
Hugh Dickins 已提交
419 420 421 422 423
static inline int swap_writepage(struct page *p, struct writeback_control *wbc)
{
	return 0;
}

424 425 426 427 428
static inline struct page *lookup_swap_cache(swp_entry_t swp)
{
	return NULL;
}

H
Hugh Dickins 已提交
429 430 431 432 433
static inline int add_to_swap(struct page *page)
{
	return 0;
}

434 435
static inline int add_to_swap_cache(struct page *page, swp_entry_t entry,
							gfp_t gfp_mask)
436
{
437
	return -1;
438 439 440 441 442 443 444 445 446 447
}

static inline void __delete_from_swap_cache(struct page *page)
{
}

static inline void delete_from_swap_cache(struct page *page)
{
}

448
#define reuse_swap_page(page)	(page_mapcount(page) == 1)
L
Linus Torvalds 已提交
449

450
static inline int try_to_free_swap(struct page *page)
451 452 453 454
{
	return 0;
}

L
Linus Torvalds 已提交
455 456 457 458 459 460 461 462
static inline swp_entry_t get_swap_page(void)
{
	swp_entry_t entry;
	entry.val = 0;
	return entry;
}

/* linux/mm/thrash.c */
463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478
static inline void put_swap_token(struct mm_struct *mm)
{
}

static inline void grab_swap_token(struct mm_struct *mm)
{
}

static inline int has_swap_token(struct mm_struct *mm)
{
	return 0;
}

static inline void disable_swap_token(void)
{
}
L
Linus Torvalds 已提交
479

480 481 482 483 484
/*
 * !CONFIG_SWAP stub: does nothing.  It takes the same three arguments as
 * the CONFIG_SWAP declaration of this function, so a call site compiles
 * unchanged in either configuration.
 */
static inline void
mem_cgroup_uncharge_swapcache(struct page *page, swp_entry_t ent, bool swapout)
{
}

485 486 487 488 489 490 491 492
#ifdef CONFIG_CGROUP_MEM_RES_CTLR
static inline int
mem_cgroup_count_swap_user(swp_entry_t ent, struct page **pagep)
{
	return 0;
}
#endif

L
Linus Torvalds 已提交
493 494 495
#endif /* CONFIG_SWAP */
#endif /* __KERNEL__*/
#endif /* _LINUX_SWAP_H */