hugetlbpage.c 4.5 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9
/*
 * IA-32 Huge TLB Page Support for Kernel.
 *
 * Copyright (C) 2002, Rohit Seth <rohit.seth@intel.com>
 */

#include <linux/init.h>
#include <linux/fs.h>
#include <linux/mm.h>
10
#include <linux/sched/mm.h>
L
Linus Torvalds 已提交
11 12 13 14
#include <linux/hugetlb.h>
#include <linux/pagemap.h>
#include <linux/err.h>
#include <linux/sysctl.h>
15
#include <linux/compat.h>
L
Linus Torvalds 已提交
16 17 18
#include <asm/mman.h>
#include <asm/tlb.h>
#include <asm/tlbflush.h>
19
#include <asm/pgalloc.h>
20
#include <asm/elf.h>
L
Linus Torvalds 已提交
21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42

#if 0	/* This is just for testing */
struct page *
follow_huge_addr(struct mm_struct *mm, unsigned long address, int write)
{
	unsigned long start = address;
	int length = 1;
	int nr;
	struct page *page;
	struct vm_area_struct *vma;

	vma = find_vma(mm, addr);
	if (!vma || !is_vm_hugetlb_page(vma))
		return ERR_PTR(-EINVAL);

	pte = huge_pte_offset(mm, address);

	/* hugetlb should be locked, and hence, prefaulted */
	WARN_ON(!pte || pte_none(*pte));

	page = &pte_page(*pte)[vpfn % (HPAGE_SIZE/PAGE_SIZE)];

43
	WARN_ON(!PageHead(page));
L
Linus Torvalds 已提交
44 45 46 47 48 49 50 51 52

	return page;
}

/* Stub variant: no PMD entry is ever reported as huge. */
int pmd_huge(pmd_t pmd)
{
	return 0;
}

A
Andi Kleen 已提交
53 54 55 56 57
/* Stub variant: no PUD entry is ever reported as huge. */
int pud_huge(pud_t pud)
{
	return 0;
}

L
Linus Torvalds 已提交
58 59
#else

60 61 62 63 64
/*
 * pmd_huge() returns 1 if @pmd is hugetlb related entry, that is normal
 * hugetlb entry or non-present (migration or hwpoisoned) hugetlb entry.
 * Otherwise, returns 0.
 */
L
Linus Torvalds 已提交
65 66
int pmd_huge(pmd_t pmd)
{
67 68
	return !pmd_none(pmd) &&
		(pmd_val(pmd) & (_PAGE_PRESENT|_PAGE_PSE)) != _PAGE_PRESENT;
L
Linus Torvalds 已提交
69 70
}

A
Andi Kleen 已提交
71 72
/* pud_huge() - returns 1 when @pud has _PAGE_PSE set, 0 otherwise. */
int pud_huge(pud_t pud)
{
	if (pud_val(pud) & _PAGE_PSE)
		return 1;

	return 0;
}
L
Linus Torvalds 已提交
75 76
#endif

77
#ifdef CONFIG_HUGETLB_PAGE
L
Linus Torvalds 已提交
78 79 80 81
static unsigned long hugetlb_get_unmapped_area_bottomup(struct file *file,
		unsigned long addr, unsigned long len,
		unsigned long pgoff, unsigned long flags)
{
A
Andi Kleen 已提交
82
	struct hstate *h = hstate_file(file);
83 84 85 86
	struct vm_unmapped_area_info info;

	info.flags = 0;
	info.length = len;
87 88 89
	info.low_limit = get_mmap_base(1);
	info.high_limit = in_compat_syscall() ?
		tasksize_32bit() : tasksize_64bit();
90 91 92
	info.align_mask = PAGE_MASK & ~huge_page_mask(h);
	info.align_offset = 0;
	return vm_unmapped_area(&info);
L
Linus Torvalds 已提交
93 94 95 96 97 98
}

static unsigned long hugetlb_get_unmapped_area_topdown(struct file *file,
		unsigned long addr0, unsigned long len,
		unsigned long pgoff, unsigned long flags)
{
A
Andi Kleen 已提交
99
	struct hstate *h = hstate_file(file);
100 101
	struct vm_unmapped_area_info info;
	unsigned long addr;
L
Linus Torvalds 已提交
102

103 104 105
	info.flags = VM_UNMAPPED_AREA_TOPDOWN;
	info.length = len;
	info.low_limit = PAGE_SIZE;
106
	info.high_limit = get_mmap_base(0);
107 108 109
	info.align_mask = PAGE_MASK & ~huge_page_mask(h);
	info.align_offset = 0;
	addr = vm_unmapped_area(&info);
L
Linus Torvalds 已提交
110 111 112 113 114 115 116

	/*
	 * A failed mmap() very likely causes application failure,
	 * so fall back to the bottom-up function here. This scenario
	 * can happen with large stack limits and large mmap()
	 * allocations.
	 */
117 118 119 120 121 122 123
	if (addr & ~PAGE_MASK) {
		VM_BUG_ON(addr != -ENOMEM);
		info.flags = 0;
		info.low_limit = TASK_UNMAPPED_BASE;
		info.high_limit = TASK_SIZE;
		addr = vm_unmapped_area(&info);
	}
L
Linus Torvalds 已提交
124 125 126 127 128 129 130 131

	return addr;
}

unsigned long
hugetlb_get_unmapped_area(struct file *file, unsigned long addr,
		unsigned long len, unsigned long pgoff, unsigned long flags)
{
A
Andi Kleen 已提交
132
	struct hstate *h = hstate_file(file);
L
Linus Torvalds 已提交
133 134 135
	struct mm_struct *mm = current->mm;
	struct vm_area_struct *vma;

A
Andi Kleen 已提交
136
	if (len & ~huge_page_mask(h))
L
Linus Torvalds 已提交
137 138 139 140
		return -EINVAL;
	if (len > TASK_SIZE)
		return -ENOMEM;

141
	if (flags & MAP_FIXED) {
142
		if (prepare_hugepage_range(file, addr, len))
143 144 145 146
			return -EINVAL;
		return addr;
	}

L
Linus Torvalds 已提交
147
	if (addr) {
A
Andi Kleen 已提交
148
		addr = ALIGN(addr, huge_page_size(h));
L
Linus Torvalds 已提交
149 150 151 152 153 154 155 156 157 158 159 160
		vma = find_vma(mm, addr);
		if (TASK_SIZE - len >= addr &&
		    (!vma || addr + len <= vma->vm_start))
			return addr;
	}
	if (mm->get_unmapped_area == arch_get_unmapped_area)
		return hugetlb_get_unmapped_area_bottomup(file, addr, len,
				pgoff, flags);
	else
		return hugetlb_get_unmapped_area_topdown(file, addr, len,
				pgoff, flags);
}
161
#endif /* CONFIG_HUGETLB_PAGE */
L
Linus Torvalds 已提交
162

163 164 165 166 167 168
#ifdef CONFIG_X86_64
static __init int setup_hugepagesz(char *opt)
{
	unsigned long ps = memparse(opt, &opt);
	if (ps == PMD_SIZE) {
		hugetlb_add_hstate(PMD_SHIFT - PAGE_SHIFT);
169
	} else if (ps == PUD_SIZE && boot_cpu_has(X86_FEATURE_GBPAGES)) {
170 171
		hugetlb_add_hstate(PUD_SHIFT - PAGE_SHIFT);
	} else {
172
		hugetlb_bad_size();
173 174 175 176 177 178 179
		printk(KERN_ERR "hugepagesz: Unsupported page size %lu M\n",
			ps >> 20);
		return 0;
	}
	return 1;
}
__setup("hugepagesz=", setup_hugepagesz);
180

181
#if (defined(CONFIG_MEMORY_ISOLATION) && defined(CONFIG_COMPACTION)) || defined(CONFIG_CMA)
182 183
static __init int gigantic_pages_init(void)
{
184
	/* With compaction or CMA we can allocate gigantic pages at runtime */
185
	if (boot_cpu_has(X86_FEATURE_GBPAGES) && !size_to_hstate(1UL << PUD_SHIFT))
186 187 188 189 190
		hugetlb_add_hstate(PUD_SHIFT - PAGE_SHIFT);
	return 0;
}
arch_initcall(gigantic_pages_init);
#endif
191
#endif