slub_def.h 9.2 KB
Newer Older
C
Christoph Lameter 已提交
1 2 3 4 5 6
#ifndef _LINUX_SLUB_DEF_H
#define _LINUX_SLUB_DEF_H

/*
 * SLUB : A Slab allocator without object queues.
 *
 * (C) 2007 SGI, Christoph Lameter
 */
#include <linux/types.h>
#include <linux/gfp.h>
11
#include <linux/bug.h>
C
Christoph Lameter 已提交
12 13 14
#include <linux/workqueue.h>
#include <linux/kobject.h>

15
#include <linux/kmemleak.h>
16

17 18 19 20 21 22 23 24
/*
 * Identifiers for the SLUB statistics counters.
 *
 * NR_SLUB_STAT_ITEMS is not a counter: it is the number of counters and
 * sizes the stat[] array in struct kmem_cache_cpu (CONFIG_SLUB_STATS only).
 * It must remain the last enumerator, and the enumerators rely on their
 * implicit values, so new items go directly before it.
 */
enum stat_item {
	ALLOC_FASTPATH,		/* Allocation from cpu slab */
	ALLOC_SLOWPATH,		/* Allocation by getting a new cpu slab */
	FREE_FASTPATH,		/* Free to cpu slab */
	FREE_SLOWPATH,		/* Freeing not to cpu slab */
	FREE_FROZEN,		/* Freeing to frozen slab */
	FREE_ADD_PARTIAL,	/* Freeing moves slab to partial list */
	FREE_REMOVE_PARTIAL,	/* Freeing removes last object */
	ALLOC_FROM_PARTIAL,	/* Cpu slab acquired from node partial list */
	ALLOC_SLAB,		/* Cpu slab acquired from page allocator */
	ALLOC_REFILL,		/* Refill cpu slab from slab freelist */
	ALLOC_NODE_MISMATCH,	/* Switching cpu slab */
	FREE_SLAB,		/* Slab freed to the page allocator */
	CPUSLAB_FLUSH,		/* Abandoning of the cpu slab */
	DEACTIVATE_FULL,	/* Cpu slab was full when deactivated */
	DEACTIVATE_EMPTY,	/* Cpu slab was empty when deactivated */
	DEACTIVATE_TO_HEAD,	/* Cpu slab was moved to the head of partials */
	DEACTIVATE_TO_TAIL,	/* Cpu slab was moved to the tail of partials */
	DEACTIVATE_REMOTE_FREES,/* Slab contained remotely freed objects */
	DEACTIVATE_BYPASS,	/* Implicit deactivation */
	ORDER_FALLBACK,		/* Number of times fallback was necessary */
	CMPXCHG_DOUBLE_CPU_FAIL,/* Failure of this_cpu_cmpxchg_double */
	CMPXCHG_DOUBLE_FAIL,	/* Number of times that cmpxchg double did not match */
	CPU_PARTIAL_ALLOC,	/* Used cpu partial on alloc */
	CPU_PARTIAL_FREE,	/* Refill cpu partial on free */
	CPU_PARTIAL_NODE,	/* Refill cpu partial from node partial */
	CPU_PARTIAL_DRAIN,	/* Drain cpu partial to node partial */
	NR_SLUB_STAT_ITEMS	/* Number of counters; keep last */
};

46
/*
 * Per cpu allocation state of a slab cache (struct kmem_cache points to it
 * through its __percpu cpu_slab member).
 *
 * NOTE(review): freelist and tid are adjacent; presumably they are updated
 * together by this_cpu_cmpxchg_double() - confirm before reordering members.
 */
struct kmem_cache_cpu {
	void **freelist;	/* Pointer to next available object */
	unsigned long tid;	/* Globally unique transaction id */
	struct page *page;	/* The slab from which we are allocating */
	struct page *partial;	/* Partially allocated frozen slabs */
#ifdef CONFIG_SLUB_STATS
	/* One counter per enum stat_item value */
	unsigned int stat[NR_SLUB_STAT_ITEMS];
#endif
};
55

C
Christoph Lameter 已提交
56 57 58 59
/*
 * Per node state of a slab cache (struct kmem_cache holds one pointer per
 * node in its node[] array).
 *
 * The slab/object totals and the full list only exist when
 * CONFIG_SLUB_DEBUG is enabled.
 */
struct kmem_cache_node {
	spinlock_t list_lock;	/* Protect partial list and nr_partial */
	unsigned long nr_partial;
	struct list_head partial;
#ifdef CONFIG_SLUB_DEBUG
	atomic_long_t nr_slabs;
	atomic_long_t total_objects;
	struct list_head full;
#endif
};

67 68 69 70 71 72 73 74 75
/*
 * Word size structure that can be atomically updated or read and that
 * contains both the order and the number of objects that a slab of the
 * given order would contain.
 *
 * Both values share the single word x; the bit layout is not defined in
 * this header (NOTE(review): confirm against the helpers that build and
 * decode it in the allocator implementation).
 */
struct kmem_cache_order_objects {
	unsigned long x;	/* Order and object count, packed */
};

C
Christoph Lameter 已提交
76 77 78 79
/*
 * Slab cache management.
 */
struct kmem_cache {
80
	struct kmem_cache_cpu __percpu *cpu_slab;
C
Christoph Lameter 已提交
81 82
	/* Used for retriving partial slabs etc */
	unsigned long flags;
83
	unsigned long min_partial;
C
Christoph Lameter 已提交
84
	int size;		/* The size of an object including meta data */
85
	int object_size;	/* The size of an object without meta data */
C
Christoph Lameter 已提交
86
	int offset;		/* Free pointer offset. */
87
	int cpu_partial;	/* Number of per cpu partial objects to keep around */
88
	struct kmem_cache_order_objects oo;
C
Christoph Lameter 已提交
89 90

	/* Allocation and freeing of slabs */
91
	struct kmem_cache_order_objects max;
92
	struct kmem_cache_order_objects min;
93
	gfp_t allocflags;	/* gfp flags to use on each alloc */
C
Christoph Lameter 已提交
94
	int refcount;		/* Refcount for slab cache destroy */
95
	void (*ctor)(void *);
C
Christoph Lameter 已提交
96 97
	int inuse;		/* Offset to metadata */
	int align;		/* Alignment */
98
	int reserved;		/* Reserved bytes at the end of slabs */
C
Christoph Lameter 已提交
99 100
	const char *name;	/* Name (only for display!) */
	struct list_head list;	/* List of slab caches */
101
#ifdef CONFIG_SYSFS
C
Christoph Lameter 已提交
102
	struct kobject kobj;	/* For sysfs */
103
#endif
G
Glauber Costa 已提交
104 105 106
#ifdef CONFIG_MEMCG_KMEM
	struct memcg_cache_params *memcg_params;
#endif
C
Christoph Lameter 已提交
107 108

#ifdef CONFIG_NUMA
109 110 111 112
	/*
	 * Defragmentation by allocating from a remote node.
	 */
	int remote_node_defrag_ratio;
C
Christoph Lameter 已提交
113
#endif
114
	struct kmem_cache_node *node[MAX_NUMNODES];
C
Christoph Lameter 已提交
115 116 117 118 119
};

/*
 * Kmalloc subsystem.
 *
 * KMALLOC_MIN_SIZE is the smallest kmalloc size class: ARCH_DMA_MINALIGN
 * when the architecture defines it and it is larger than 8, otherwise 8.
 * KMALLOC_SHIFT_LOW is its base-2 logarithm, i.e. the index that
 * kmalloc_index() returns for every non-zero size up to KMALLOC_MIN_SIZE.
 */
#if defined(ARCH_DMA_MINALIGN) && ARCH_DMA_MINALIGN > 8
#define KMALLOC_MIN_SIZE ARCH_DMA_MINALIGN
#else
#define KMALLOC_MIN_SIZE 8
#endif

#define KMALLOC_SHIFT_LOW ilog2(KMALLOC_MIN_SIZE)
C
Christoph Lameter 已提交
127

128 129 130 131 132 133 134 135 136
/*
 * Maximum kmalloc object size handled by SLUB. Larger object allocations
 * are passed through to the page allocator. The page allocator "fastpath"
 * is relatively slow so we need this value sufficiently high so that
 * performance critical objects are allocated through the SLUB fastpath.
 *
 * This should be dropped to PAGE_SIZE / 2 once the page allocator
 * "fastpath" becomes competitive with the slab allocator fastpaths.
 */
#define SLUB_MAX_SIZE (2 * PAGE_SIZE)

/*
 * Number of entries in kmalloc_caches[]. The highest index is therefore
 * PAGE_SHIFT + 1, which corresponds to 2 * PAGE_SIZE == SLUB_MAX_SIZE.
 */
#define SLUB_PAGE_SHIFT (PAGE_SHIFT + 2)
140

141 142 143 144 145 146 147
/*
 * SLUB_DMA is the gfp mask that kmalloc() and kmalloc_node() test to keep
 * requests off the inline fast path: __GFP_DMA when CONFIG_ZONE_DMA is
 * set, an empty mask (the test is always false) otherwise.
 */
#ifndef CONFIG_ZONE_DMA
/* Disable DMA functionality */
#define SLUB_DMA (__force gfp_t)0
#else
#define SLUB_DMA __GFP_DMA
#endif

C
Christoph Lameter 已提交
148 149 150 151
/*
 * We keep the general caches in an array of slab caches that are used for
 * 2^x bytes of allocations.
 */
152
extern struct kmem_cache *kmalloc_caches[SLUB_PAGE_SHIFT];
C
Christoph Lameter 已提交
153 154 155 156 157

/*
 * Sorry that the following has to be that ugly but some versions of GCC
 * have trouble with constant propagation and loops.
 */
158
static __always_inline int kmalloc_index(size_t size)
C
Christoph Lameter 已提交
159
{
160 161
	if (!size)
		return 0;
162

163 164 165
	if (size <= KMALLOC_MIN_SIZE)
		return KMALLOC_SHIFT_LOW;

166
	if (KMALLOC_MIN_SIZE <= 32 && size > 64 && size <= 96)
C
Christoph Lameter 已提交
167
		return 1;
168
	if (KMALLOC_MIN_SIZE <= 64 && size > 128 && size <= 192)
C
Christoph Lameter 已提交
169 170 171 172 173 174 175 176 177 178
		return 2;
	if (size <=          8) return 3;
	if (size <=         16) return 4;
	if (size <=         32) return 5;
	if (size <=         64) return 6;
	if (size <=        128) return 7;
	if (size <=        256) return 8;
	if (size <=        512) return 9;
	if (size <=       1024) return 10;
	if (size <=   2 * 1024) return 11;
C
Christoph Lameter 已提交
179
	if (size <=   4 * 1024) return 12;
180 181
/*
 * The following is only needed to support architectures with a larger page
182 183
 * size than 4k. We need to support 2 * PAGE_SIZE here. So for a 64k page
 * size we would have to go up to 128k.
184
 */
C
Christoph Lameter 已提交
185 186 187 188 189 190
	if (size <=   8 * 1024) return 13;
	if (size <=  16 * 1024) return 14;
	if (size <=  32 * 1024) return 15;
	if (size <=  64 * 1024) return 16;
	if (size <= 128 * 1024) return 17;
	if (size <= 256 * 1024) return 18;
191
	if (size <= 512 * 1024) return 19;
C
Christoph Lameter 已提交
192 193
	if (size <= 1024 * 1024) return 20;
	if (size <=  2 * 1024 * 1024) return 21;
194 195
	BUG();
	return -1; /* Will never be reached */
C
Christoph Lameter 已提交
196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211

/*
 * What we really wanted to do and cannot do because of compiler issues is:
 *	int i;
 *	for (i = KMALLOC_SHIFT_LOW; i <= KMALLOC_SHIFT_HIGH; i++)
 *		if (size <= (1 << i))
 *			return i;
 */
}

/*
 * Find the slab cache for a given combination of allocation flags and size.
 *
 * This ought to end up with a global pointer to the right cache
 * in kmalloc_caches.
 */
212
static __always_inline struct kmem_cache *kmalloc_slab(size_t size)
C
Christoph Lameter 已提交
213 214 215 216 217 218
{
	int index = kmalloc_index(size);

	if (index == 0)
		return NULL;

219
	return kmalloc_caches[index];
C
Christoph Lameter 已提交
220 221
}

P
Paul Mundt 已提交
222 223 224
/* Out-of-line allocation entry points used by the inline helpers below. */
void *kmem_cache_alloc(struct kmem_cache *s, gfp_t gfpflags);
void *__kmalloc(size_t size, gfp_t flags);

225 226 227
/*
 * Serve a request with __get_free_pages() at the given order instead of a
 * slab cache.
 *
 * __GFP_COMP and __GFP_KMEMCG are always added to the caller's flags.  The
 * result, whatever __get_free_pages() returned, is reported to
 * kmemleak_alloc() together with the originally requested size.
 */
static __always_inline void *
kmalloc_order(size_t size, gfp_t flags, unsigned int order)
{
	void *ret;

	flags |= (__GFP_COMP | __GFP_KMEMCG);
	ret = (void *) __get_free_pages(flags, order);
	kmemleak_alloc(ret, size, 1, flags);
	return ret;
}

236 237 238 239 240 241 242 243 244 245 246 247 248
/*
 * Calling this on allocated memory will check that the memory
 * is expected to be in use, and print warnings if not.
 *
 * The check is only implemented (out of line) with CONFIG_SLUB_DEBUG;
 * without it this is a stub that reports every pointer as in use.
 */
#ifndef CONFIG_SLUB_DEBUG
static inline bool verify_mem_not_deleted(const void *x)
{
	return true;
}
#else
extern bool verify_mem_not_deleted(const void *x);
#endif

249
#ifdef CONFIG_TRACING
250 251 252
extern void *
kmem_cache_alloc_trace(struct kmem_cache *s, gfp_t gfpflags, size_t size);
extern void *kmalloc_order_trace(size_t size, gfp_t flags, unsigned int order);
E
Eduard - Gabriel Munteanu 已提交
253 254
#else
static __always_inline void *
255
kmem_cache_alloc_trace(struct kmem_cache *s, gfp_t gfpflags, size_t size)
E
Eduard - Gabriel Munteanu 已提交
256 257 258
{
	return kmem_cache_alloc(s, gfpflags);
}
259 260 261 262 263 264

static __always_inline void *
kmalloc_order_trace(size_t size, gfp_t flags, unsigned int order)
{
	return kmalloc_order(size, flags, order);
}
E
Eduard - Gabriel Munteanu 已提交
265 266
#endif

267 268
/*
 * Allocate a large object: compute the order for size with get_order()
 * and hand the request to kmalloc_order_trace().
 */
static __always_inline void *kmalloc_large(size_t size, gfp_t flags)
{
	unsigned int order = get_order(size);

	return kmalloc_order_trace(size, flags, order);
}

273
/*
 * Allocate size bytes with the given gfp flags.
 *
 * When size is a compile time constant the cache lookup is resolved
 * inline:
 *  - size > SLUB_MAX_SIZE goes to kmalloc_large();
 *  - otherwise, unless SLUB_DMA is set in flags, the matching kmalloc
 *    cache is used directly, and ZERO_SIZE_PTR is returned when
 *    kmalloc_slab() finds no cache (size == 0).
 * Every other case (non constant size, or SLUB_DMA requested) falls back
 * to the out-of-line __kmalloc().
 */
static __always_inline void *kmalloc(size_t size, gfp_t flags)
{
	if (__builtin_constant_p(size)) {
		if (size > SLUB_MAX_SIZE)
			return kmalloc_large(size, flags);

		if (!(flags & SLUB_DMA)) {
			struct kmem_cache *s = kmalloc_slab(size);

			if (!s)
				return ZERO_SIZE_PTR;

			return kmem_cache_alloc_trace(s, flags, size);
		}
	}
	return __kmalloc(size, flags);
}

#ifdef CONFIG_NUMA
/* Out-of-line, node aware allocation entry points. */
void *__kmalloc_node(size_t size, gfp_t flags, int node);
void *kmem_cache_alloc_node(struct kmem_cache *, gfp_t flags, int node);

/*
 * Traced node aware allocation: defined out of line with CONFIG_TRACING,
 * otherwise an inline wrapper around kmem_cache_alloc_node() that ignores
 * the size argument.
 */
#ifdef CONFIG_TRACING
extern void *kmem_cache_alloc_node_trace(struct kmem_cache *s,
					   gfp_t gfpflags,
					   int node, size_t size);
#else
static __always_inline void *
kmem_cache_alloc_node_trace(struct kmem_cache *s,
			      gfp_t gfpflags,
			      int node, size_t size)
{
	return kmem_cache_alloc_node(s, gfpflags, node);
}
#endif

/*
 * Allocate size bytes with the given gfp flags for the given node.
 *
 * The matching kmalloc cache is used directly only when size is a compile
 * time constant no larger than SLUB_MAX_SIZE and SLUB_DMA is not set in
 * flags; ZERO_SIZE_PTR is returned when kmalloc_slab() finds no cache
 * (size == 0).  Every other request, including constant sizes above
 * SLUB_MAX_SIZE, is passed to the out-of-line __kmalloc_node().
 */
static __always_inline void *kmalloc_node(size_t size, gfp_t flags, int node)
{
	if (__builtin_constant_p(size) &&
	    size <= SLUB_MAX_SIZE && !(flags & SLUB_DMA)) {
		struct kmem_cache *s = kmalloc_slab(size);

		if (!s)
			return ZERO_SIZE_PTR;

		return kmem_cache_alloc_node_trace(s, flags, node, size);
	}
	return __kmalloc_node(size, flags, node);
}
#endif

#endif /* _LINUX_SLUB_DEF_H */