vmalloc.h 9.4 KB
Newer Older
1
/* SPDX-License-Identifier: GPL-2.0 */
L
Linus Torvalds 已提交
2 3 4 5
#ifndef _LINUX_VMALLOC_H
#define _LINUX_VMALLOC_H

#include <linux/spinlock.h>
N
Nick Piggin 已提交
6
#include <linux/init.h>
7
#include <linux/list.h>
8
#include <linux/llist.h>
L
Linus Torvalds 已提交
9
#include <asm/page.h>		/* pgprot_t */
10
#include <linux/rbtree.h>
11
#include <linux/overflow.h>
L
Linus Torvalds 已提交
12

13 14
#include <asm/vmalloc.h>

H
Hugh Dickins 已提交
15
struct vm_area_struct;		/* vma defining user mapping in mm_types.h */
16
struct notifier_block;		/* in notifier.h */
17

H
Hugh Dickins 已提交
18
/* bits in flags of vmalloc's vm_struct below */
19 20 21 22
#define VM_IOREMAP		0x00000001	/* ioremap() and friends */
#define VM_ALLOC		0x00000002	/* vmalloc() */
#define VM_MAP			0x00000004	/* vmap()ed pages */
#define VM_USERMAP		0x00000008	/* suitable for remap_vmalloc_range */
23
#define VM_DMA_COHERENT		0x00000010	/* dma_alloc_coherent */
24
#define VM_UNINITIALIZED	0x00000020	/* vm_struct is not fully initialized */
25
#define VM_NO_GUARD		0x00000040      /* don't add guard page */
26
#define VM_KASAN		0x00000080      /* has allocated kasan shadow memory */
27 28
#define VM_FLUSH_RESET_PERMS	0x00000100	/* reset direct map and flush TLB on unmap, can't be freed in atomic context */
#define VM_MAP_PUT_PAGES	0x00000200	/* put pages and free array in vfree */
29
#define VM_NO_HUGE_VMAP		0x00000400	/* force PAGE_SIZE pte mapping */
30
#define VM_HUGE_PAGES		0x00001000	/* used for vmalloc hugepages */
31 32 33 34 35
#ifdef CONFIG_ASCEND_SHARE_POOL
#define VM_SHAREPOOL		0x00002000      /* remapped to sharepool */
#else
#define VM_SHAREPOOL		0
#endif
36 37 38 39 40 41 42 43 44 45 46 47

/*
 * VM_KASAN is used slightly differently depending on CONFIG_KASAN_VMALLOC.
 *
 * If IS_ENABLED(CONFIG_KASAN_VMALLOC), VM_KASAN is set on a vm_struct after
 * shadow memory has been mapped. It's used to handle allocation errors so that
 * we don't try to poison shadow on free if it was never allocated.
 *
 * Otherwise, VM_KASAN is set for kasan_module_alloc() allocations and used to
 * determine which allocations need the module shadow freed.
 */

L
Linus Torvalds 已提交
48 49
/* bits [20..32] reserved for arch specific ioremap internals */

50 51 52 53 54 55 56 57
/*
 * Maximum alignment for ioremap() regions.
 * Can be overridden by arch-specific value.
 */
#ifndef IOREMAP_MAX_ORDER
#define IOREMAP_MAX_ORDER	(7 + PAGE_SHIFT)	/* 128 pages */
#endif

L
Linus Torvalds 已提交
58
struct vm_struct {
59
	struct vm_struct	*next;
L
Linus Torvalds 已提交
60 61 62 63
	void			*addr;
	unsigned long		size;
	unsigned long		flags;
	struct page		**pages;
64 65 66
#ifdef CONFIG_HAVE_ARCH_HUGE_VMALLOC
	unsigned int		page_order;
#endif
L
Linus Torvalds 已提交
67
	unsigned int		nr_pages;
68
	phys_addr_t		phys_addr;
69
	const void		*caller;
L
Linus Torvalds 已提交
70 71
};

72 73 74
struct vmap_area {
	unsigned long va_start;
	unsigned long va_end;
75

76 77
	struct rb_node rb_node;         /* address sorted rbtree */
	struct list_head list;          /* address sorted list */
78 79

	/*
80 81
	 * The following two variables can be packed, because
	 * a vmap_area object can be either:
82
	 *    1) in "free" tree (root is vmap_area_root)
83
	 *    2) or "busy" tree (root is free_vmap_area_root)
84 85 86 87 88
	 */
	union {
		unsigned long subtree_max_size; /* in "free" tree */
		struct vm_struct *vm;           /* in "busy" tree */
	};
89 90
};

91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110
/* archs that select HAVE_ARCH_HUGE_VMAP should override one or more of these */
#ifndef arch_vmap_p4d_supported
/* Generic fallback: answers "not supported" for every @prot. */
static inline bool arch_vmap_p4d_supported(pgprot_t prot) { return false; }
#endif

#ifndef arch_vmap_pud_supported
/* Generic fallback: answers "not supported" for every @prot. */
static inline bool arch_vmap_pud_supported(pgprot_t prot) { return false; }
#endif

#ifndef arch_vmap_pmd_supported
/* Generic fallback: answers "not supported" for every @prot. */
static inline bool arch_vmap_pmd_supported(pgprot_t prot) { return false; }
111 112
#endif

L
Linus Torvalds 已提交
113 114 115
/*
 *	Highlevel APIs for driver use
 */
N
Nick Piggin 已提交
116
extern void vm_unmap_ram(const void *mem, unsigned int count);
117
extern void *vm_map_ram(struct page **pages, unsigned int count, int node);
N
Nick Piggin 已提交
118 119 120 121
extern void vm_unmap_aliases(void);

#ifdef CONFIG_MMU
extern void __init vmalloc_init(void);
122
extern unsigned long vmalloc_nr_pages(void);
N
Nick Piggin 已提交
123 124 125 126
#else
/* !CONFIG_MMU stub: intentionally does nothing. */
static inline void vmalloc_init(void) { }
127
/* !CONFIG_MMU stub: always reports zero pages. */
static inline unsigned long vmalloc_nr_pages(void)
{
	return 0;
}
N
Nick Piggin 已提交
128 129
#endif

L
Linus Torvalds 已提交
130
extern void *vmalloc(unsigned long size);
131
extern void *vzalloc(unsigned long size);
132
extern void *vmalloc_user(unsigned long size);
C
Christoph Lameter 已提交
133
extern void *vmalloc_node(unsigned long size, int node);
134
extern void *vzalloc_node(unsigned long size, int node);
L
Linus Torvalds 已提交
135
extern void *vmalloc_32(unsigned long size);
136
extern void *vmalloc_32_user(unsigned long size);
137
extern void *__vmalloc(unsigned long size, gfp_t gfp_mask);
138 139
extern void *__vmalloc_node_range(unsigned long size, unsigned long align,
			unsigned long start, unsigned long end, gfp_t gfp_mask,
140 141
			pgprot_t prot, unsigned long vm_flags, int node,
			const void *caller);
142 143
void *__vmalloc_node(unsigned long size, unsigned long align, gfp_t gfp_mask,
		int node, const void *caller);
144
void *vmalloc_no_huge(unsigned long size);
145 146
extern void *vmalloc_hugepage(unsigned long size);
extern void *vmalloc_hugepage_user(unsigned long size);
147

148
extern void vfree(const void *addr);
A
Andrey Ryabinin 已提交
149
extern void vfree_atomic(const void *addr);
L
Linus Torvalds 已提交
150 151 152

extern void *vmap(struct page **pages, unsigned int count,
			unsigned long flags, pgprot_t prot);
C
Christoph Hellwig 已提交
153
void *vmap_pfn(unsigned long *pfns, unsigned int count, pgprot_t prot);
154
extern void vunmap(const void *addr);
155

156 157
extern int remap_vmalloc_range_partial(struct vm_area_struct *vma,
				       unsigned long uaddr, void *kaddr,
158
				       unsigned long pgoff, unsigned long size);
159

160 161
extern int remap_vmalloc_range(struct vm_area_struct *vma, void *addr,
							unsigned long pgoff);
J
Joerg Roedel 已提交
162

163 164 165 166 167 168 169 170
extern void *vmap_hugepage(struct page **pages, unsigned int count,
			   unsigned long flags, pgprot_t prot);
extern int remap_vmalloc_hugepage_range_partial(struct vm_area_struct *vma,
						unsigned long uaddr, void *kaddr,
						unsigned long pgoff, unsigned long size);
extern int remap_vmalloc_hugepage_range(struct vm_area_struct *vma,
					void *addr, unsigned long pgoff);

171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186
/*
 * Architectures can set this mask to a combination of PGTBL_P?D_MODIFIED values
 * and let generic vmalloc and ioremap code know when arch_sync_kernel_mappings()
 * needs to be called.
 */
#ifndef ARCH_PAGE_TABLE_SYNC_MASK
#define ARCH_PAGE_TABLE_SYNC_MASK 0
#endif

/*
 * There is no default implementation for arch_sync_kernel_mappings(). It is
 * relied upon the compiler to optimize calls out if ARCH_PAGE_TABLE_SYNC_MASK
 * is 0.
 */
void arch_sync_kernel_mappings(unsigned long start, unsigned long end);

L
Linus Torvalds 已提交
187 188 189
/*
 *	Lowlevel-APIs (not for driver use!)
 */
190 191 192

static inline size_t get_vm_area_size(const struct vm_struct *area)
{
193 194 195 196 197 198
	if (!(area->flags & VM_NO_GUARD))
		/* return actual size without guard page */
		return area->size - PAGE_SIZE;
	else
		return area->size;

199 200
}

L
Linus Torvalds 已提交
201
extern struct vm_struct *get_vm_area(unsigned long size, unsigned long flags);
202
extern struct vm_struct *get_vm_area_caller(unsigned long size,
203
					unsigned long flags, const void *caller);
204 205 206
extern struct vm_struct *__get_vm_area_caller(unsigned long size,
					unsigned long flags,
					unsigned long start, unsigned long end,
207
					const void *caller);
C
Christoph Hellwig 已提交
208
void free_vm_area(struct vm_struct *area);
209
extern struct vm_struct *remove_vm_area(const void *addr);
210
extern struct vm_struct *find_vm_area(const void *addr);
211

212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227
/*
 * is_vm_area_hugepages - was this vm area allocated with huge pages?
 * @addr: address to look up with find_vm_area()
 *
 * Returns true only when CONFIG_HAVE_ARCH_HUGE_VMALLOC is enabled, a vm area
 * is found for @addr and its page_order is greater than zero. Returns false
 * in every other case, including when no area is found.
 */
static inline bool is_vm_area_hugepages(const void *addr)
{
	/*
	 * This may not 100% tell if the area is mapped with > PAGE_SIZE
	 * page table entries, if for some reason the architecture indicates
	 * larger sizes are available but decides not to use them, nothing
	 * prevents that. This only indicates the size of the physical page
	 * allocated in the vmalloc layer.
	 */
#ifdef CONFIG_HAVE_ARCH_HUGE_VMALLOC
	const struct vm_struct *area = find_vm_area(addr);

	/*
	 * set_vm_flush_reset_perms() treats a NULL result from find_vm_area()
	 * as possible; do the same here instead of dereferencing it blindly.
	 */
	return area && area->page_order > 0;
#else
	return false;
#endif
}

228
#ifdef CONFIG_MMU
229 230 231
int vmap_range(unsigned long addr, unsigned long end,
			phys_addr_t phys_addr, pgprot_t prot,
			unsigned int max_page_shift);
232 233
extern int map_kernel_range_noflush(unsigned long start, unsigned long size,
				    pgprot_t prot, struct page **pages);
C
Christoph Hellwig 已提交
234 235
int map_kernel_range(unsigned long start, unsigned long size, pgprot_t prot,
		struct page **pages);
236
extern void unmap_kernel_range_noflush(unsigned long addr, unsigned long size);
237
extern void unmap_kernel_range(unsigned long addr, unsigned long size);
238 239 240 241 242 243 244
/*
 * Set VM_FLUSH_RESET_PERMS on the vm area found for @addr.
 * Does nothing when find_vm_area() returns NULL.
 */
static inline void set_vm_flush_reset_perms(void *addr)
{
	struct vm_struct *area = find_vm_area(addr);

	if (!area)
		return;

	area->flags |= VM_FLUSH_RESET_PERMS;
}
245

246 247 248 249 250 251 252
#else
/*
 * !CONFIG_MMU stub: @start, @prot and @pages are ignored; the return value is
 * @size shifted right by PAGE_SHIFT.
 */
static inline int map_kernel_range_noflush(unsigned long start,
					   unsigned long size, pgprot_t prot,
					   struct page **pages)
{
	const unsigned long nr_pages = size >> PAGE_SHIFT;

	return nr_pages;
}
C
Christoph Hellwig 已提交
253
#define map_kernel_range map_kernel_range_noflush
254 255 256 257
/* !CONFIG_MMU stub: both arguments are ignored. */
static inline void unmap_kernel_range_noflush(unsigned long addr,
					      unsigned long size)
{
	/* intentionally empty */
}
C
Christoph Hellwig 已提交
258
#define unmap_kernel_range unmap_kernel_range_noflush
259 260 261
/* !CONFIG_MMU stub: @addr is ignored. */
static inline void set_vm_flush_reset_perms(void *addr) { }
262
#endif
L
Linus Torvalds 已提交
263

264 265 266 267
/* for /dev/kmem */
extern long vread(char *buf, char *addr, unsigned long count);
extern long vwrite(char *buf, char *addr, unsigned long count);

L
Linus Torvalds 已提交
268 269 270
/*
 *	Internals.  Don't use.
 */
271
extern struct list_head vmap_area_list;
N
Nicolas Pitre 已提交
272
extern __init void vm_area_add_early(struct vm_struct *vm);
273
extern __init void vm_area_register_early(struct vm_struct *vm, size_t align);
L
Linus Torvalds 已提交
274

275
#ifdef CONFIG_SMP
276
# ifdef CONFIG_MMU
277 278
struct vm_struct **pcpu_get_vm_areas(const unsigned long *offsets,
				     const size_t *sizes, int nr_vms,
279
				     size_t align);
280 281

void pcpu_free_vm_areas(struct vm_struct **vms, int nr_vms);
282 283 284 285 286 287 288 289 290 291 292 293 294 295
# else
/*
 * CONFIG_SMP && !CONFIG_MMU stub: all arguments are ignored and NULL is
 * always returned.
 */
static inline struct vm_struct **
pcpu_get_vm_areas(const unsigned long *offsets, const size_t *sizes,
		  int nr_vms, size_t align)
{
	return NULL;
}

/* CONFIG_SMP && !CONFIG_MMU stub: both arguments are ignored. */
static inline void pcpu_free_vm_areas(struct vm_struct **vms, int nr_vms) { }
# endif
296
#endif
297

298 299 300 301 302 303
#ifdef CONFIG_MMU
#define VMALLOC_TOTAL (VMALLOC_END - VMALLOC_START)
#else
#define VMALLOC_TOTAL 0UL
#endif

304 305 306
int register_vmap_purge_notifier(struct notifier_block *nb);
int unregister_vmap_purge_notifier(struct notifier_block *nb);

L
Linus Torvalds 已提交
307
#endif /* _LINUX_VMALLOC_H */