/*
 *  arch/arm/include/asm/tlb.h
 *
 *  Copyright (C) 2002 Russell King
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 *  Experimentation shows that on a StrongARM, it appears to be faster
 *  to use the "invalidate whole tlb" rather than "invalidate single
 *  tlb" for this.
 *
 *  This appears true for both the process fork+exit case, as well as
 *  the munmap-large-area case.
 */
#ifndef __ASMARM_TLB_H
#define __ASMARM_TLB_H

#include <asm/cacheflush.h>

#ifndef CONFIG_MMU

#include <linux/pagemap.h>

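/* No MMU means no TLB to maintain, so a flush is a no-op. */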
#define tlb_flush(tlb)	((void) tlb)

#include <asm-generic/tlb.h>

#else /* !CONFIG_MMU */

#include <linux/swap.h>
#include <asm/pgalloc.h>
#include <asm/tlbflush.h>

/*
 * We need to delay page freeing for SMP as other CPUs can access pages
 * which have been removed but not yet had their TLB entries invalidated.
 * Also, as ARMv7 speculative prefetch can drag new entries into the TLB,
 * we need to apply this same delaying tactic to ensure correct operation.
 */
#if defined(CONFIG_SMP) || defined(CONFIG_CPU_32v7)
#define tlb_fast_mode(tlb)	0
#else
#define tlb_fast_mode(tlb)	1
#endif
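
/*
 * tlb_fast_mode() != 0 means __tlb_remove_page() may free pages
 * immediately; otherwise they are queued in tlb->pages and only freed
 * after the TLB flush in tlb_flush_mmu().
 */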

#define MMU_GATHER_BUNDLE	8

/*
 * TLB handling.  This allows us to remove pages from the page
 * tables, and efficiently handle the TLB issues.
 */
struct mmu_gather {
	struct mm_struct	*mm;
	unsigned int		fullmm;		/* non-zero when tearing down the whole mm */
	struct vm_area_struct	*vma;		/* vma being unmapped, NULL for shift_arg_pages() */
	unsigned long		range_start;	/* va range pending for flush_tlb_range() */
	unsigned long		range_end;
	unsigned int		nr;		/* pages queued in @pages */
	unsigned int		max;		/* capacity of @pages */
	struct page		**pages;
	struct page		*local[MMU_GATHER_BUNDLE];	/* fallback if page allocation fails */
};

DECLARE_PER_CPU(struct mmu_gather, mmu_gathers);

/*
 * This is unnecessarily complex.  There are three ways the TLB shootdown
 * code is used:
 *  1. Unmapping a range of vmas.  See zap_page_range(), unmap_region().
 *     tlb->fullmm = 0, and tlb_start_vma/tlb_end_vma will be called.
 *     tlb->vma will be non-NULL.
 *  2. Unmapping all vmas.  See exit_mmap().
 *     tlb->fullmm = 1, and tlb_start_vma/tlb_end_vma will be called.
 *     tlb->vma will be non-NULL.  Additionally, page tables will be freed.
 *  3. Unmapping argument pages.  See shift_arg_pages().
 *     tlb->fullmm = 0, but tlb_start_vma/tlb_end_vma will not be called.
 *     tlb->vma will be NULL.
 */
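
/*
 * The expected calling sequence, sketched roughly from
 * zap_page_range()/unmap_region() (case 1 above):
 *
 *	tlb_gather_mmu(&tlb, mm, 0);
 *	tlb_start_vma(&tlb, vma);
 *	...	tlb_remove_tlb_entry() for each pte cleared,
 *		tlb_remove_page() for each page unmapped ...
 *	tlb_end_vma(&tlb, vma);
 *	tlb_finish_mmu(&tlb, start, end);
 */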
static inline void tlb_flush(struct mmu_gather *tlb)
{
	if (tlb->fullmm || !tlb->vma)
		flush_tlb_mm(tlb->mm);
	else if (tlb->range_end > 0) {
		flush_tlb_range(tlb->vma, tlb->range_start, tlb->range_end);
		tlb->range_start = TASK_SIZE;
		tlb->range_end = 0;
	}
}

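/*
 * Grow the pending flush range to cover @addr.  A full-MM teardown
 * flushes the entire TLB, so no range needs to be tracked there.
 */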
static inline void tlb_add_flush(struct mmu_gather *tlb, unsigned long addr)
{
	if (!tlb->fullmm) {
		if (addr < tlb->range_start)
			tlb->range_start = addr;
		if (addr + PAGE_SIZE > tlb->range_end)
			tlb->range_end = addr + PAGE_SIZE;
	}
}

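/*
 * Try to trade the small inline tlb->local array for a full page of
 * page pointers.  On failure we quietly keep using the bundle, which
 * just means tlb_flush_mmu() is called more often.
 */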
static inline void __tlb_alloc_page(struct mmu_gather *tlb)
{
	unsigned long addr = __get_free_pages(GFP_NOWAIT | __GFP_NOWARN, 0);

	if (addr) {
		tlb->pages = (void *)addr;
		tlb->max = PAGE_SIZE / sizeof(struct page *);
	}
}

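/*
 * Flush the accumulated TLB range and free all queued pages.  If we
 * are still using the inline bundle, take another shot at allocating
 * a full page for the pointer array.
 */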
static inline void tlb_flush_mmu(struct mmu_gather *tlb)
{
	tlb_flush(tlb);
	if (!tlb_fast_mode(tlb)) {
		free_pages_and_swap_cache(tlb->pages, tlb->nr);
		tlb->nr = 0;
		if (tlb->pages == tlb->local)
			__tlb_alloc_page(tlb);
	}
}

static inline void
tlb_gather_mmu(struct mmu_gather *tlb, struct mm_struct *mm, unsigned int fullmm)
{
	tlb->mm = mm;
	tlb->fullmm = fullmm;
	tlb->vma = NULL;
	tlb->max = ARRAY_SIZE(tlb->local);
	tlb->pages = tlb->local;
	tlb->nr = 0;
	__tlb_alloc_page(tlb);
}

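/*
 * Tear-down is complete: do the final flush and release the pointer
 * array if __tlb_alloc_page() gave us one.
 */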
static inline void
tlb_finish_mmu(struct mmu_gather *tlb, unsigned long start, unsigned long end)
{
	tlb_flush_mmu(tlb);

	/* keep the page table cache within bounds */
	check_pgt_cache();

	if (tlb->pages != tlb->local)
		free_pages((unsigned long)tlb->pages, 0);
}

/*
 * Memorize the range for the TLB flush.
 */
static inline void
tlb_remove_tlb_entry(struct mmu_gather *tlb, pte_t *ptep, unsigned long addr)
{
	tlb_add_flush(tlb, addr);
}

/*
 * In the case of tlb vma handling, we can optimise these away in the
 * case where we're doing a full MM flush.  When we're doing a munmap,
 * the vmas are adjusted to only cover the region to be torn down.
 */
static inline void
tlb_start_vma(struct mmu_gather *tlb, struct vm_area_struct *vma)
{
	if (!tlb->fullmm) {
		flush_cache_range(vma, vma->vm_start, vma->vm_end);
		tlb->vma = vma;
		tlb->range_start = TASK_SIZE;
		tlb->range_end = 0;
	}
}

static inline void
tlb_end_vma(struct mmu_gather *tlb, struct vm_area_struct *vma)
{
	if (!tlb->fullmm)
		tlb_flush(tlb);
}

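/*
 * Queue a page for deferred freeing (or free it right away when
 * tlb_fast_mode() allows it).  Returns the space left in the batch;
 * zero tells the caller to run tlb_flush_mmu() before queueing more.
 */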
static inline int __tlb_remove_page(struct mmu_gather *tlb, struct page *page)
{
	if (tlb_fast_mode(tlb)) {
		free_page_and_swap_cache(page);
		return 1; /* avoid calling tlb_flush_mmu */
	}

	tlb->pages[tlb->nr++] = page;
	VM_BUG_ON(tlb->nr > tlb->max);
	return tlb->max - tlb->nr;
}

static inline void tlb_remove_page(struct mmu_gather *tlb, struct page *page)
{
	if (!__tlb_remove_page(tlb, page))
		tlb_flush_mmu(tlb);
}

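/*
 * The pte page is freed via the gather so it cannot be reallocated
 * while stale TLB entries or speculative walks may still reference it.
 */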
static inline void __pte_free_tlb(struct mmu_gather *tlb, pgtable_t pte,
	unsigned long addr)
{
	pgtable_page_dtor(pte);

#ifdef CONFIG_ARM_LPAE
	tlb_add_flush(tlb, addr);
#else
	/*
	 * With the classic ARM MMU, a pte page has two corresponding pmd
	 * entries, each covering 1MB.
	 */
	addr &= PMD_MASK;
	tlb_add_flush(tlb, addr + SZ_1M - PAGE_SIZE);
	tlb_add_flush(tlb, addr + SZ_1M);
#endif

	tlb_remove_page(tlb, pte);
}

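/*
 * With the classic short-descriptor tables the pmd level is folded
 * into the pgd, so only LPAE has a separate pmd page to free.
 */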
static inline void __pmd_free_tlb(struct mmu_gather *tlb, pmd_t *pmdp,
				  unsigned long addr)
{
#ifdef CONFIG_ARM_LPAE
	tlb_add_flush(tlb, addr);
	tlb_remove_page(tlb, virt_to_page(pmdp));
#endif
}

#define pte_free_tlb(tlb, ptep, addr)	__pte_free_tlb(tlb, ptep, addr)
#define pmd_free_tlb(tlb, pmdp, addr)	__pmd_free_tlb(tlb, pmdp, addr)
#define pud_free_tlb(tlb, pudp, addr)	pud_free((tlb)->mm, pudp)

#define tlb_migrate_finish(mm)		do { } while (0)

#endif /* CONFIG_MMU */
#endif