page.c 7.0 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0
M
Mike Rapoport 已提交
2
#include <linux/memblock.h>
3 4 5
#include <linux/compiler.h>
#include <linux/fs.h>
#include <linux/init.h>
H
Hugh Dickins 已提交
6
#include <linux/ksm.h>
7 8
#include <linux/mm.h>
#include <linux/mmzone.h>
9
#include <linux/huge_mm.h>
10 11
#include <linux/proc_fs.h>
#include <linux/seq_file.h>
12
#include <linux/hugetlb.h>
V
Vladimir Davydov 已提交
13
#include <linux/memcontrol.h>
14 15
#include <linux/mmu_notifier.h>
#include <linux/page_idle.h>
W
Wu Fengguang 已提交
16
#include <linux/kernel-page-flags.h>
17
#include <linux/uaccess.h>
18 19 20 21
#include "internal.h"

#define KPMSIZE sizeof(u64)
#define KPMMASK (KPMSIZE - 1)
22
#define KPMBITS (KPMSIZE * BITS_PER_BYTE)
23

24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46
/* /proc/kpagecount - an array exposing page counts
 *
 * Each entry is a u64 representing the corresponding
 * physical page count.
 */
static ssize_t kpagecount_read(struct file *file, char __user *buf,
			     size_t count, loff_t *ppos)
{
	u64 __user *out = (u64 __user *)buf;
	struct page *ppage;
	unsigned long src = *ppos;
	unsigned long pfn;
	ssize_t ret = 0;
	u64 pcount;

	pfn = src / KPMSIZE;
	count = min_t(size_t, count, (max_pfn * KPMSIZE) - src);
	if (src & KPMMASK || count & KPMMASK)
		return -EINVAL;

	while (count > 0) {
		if (pfn_valid(pfn))
			ppage = pfn_to_page(pfn);
47 48
		else
			ppage = NULL;
49
		if (!ppage || PageSlab(ppage) || page_has_type(ppage))
50 51 52 53
			pcount = 0;
		else
			pcount = page_mapcount(ppage);

54
		if (put_user(pcount, out)) {
55 56 57 58
			ret = -EFAULT;
			break;
		}

59 60
		pfn++;
		out++;
61
		count -= KPMSIZE;
62 63

		cond_resched();
64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82
	}

	*ppos += (char __user *)out - buf;
	if (!ret)
		ret = (char __user *)out - buf;
	return ret;
}

static const struct file_operations proc_kpagecount_operations = {
	.llseek = mem_lseek,
	.read = kpagecount_read,
};

/* /proc/kpageflags - an array exposing page flags
 *
 * Each entry is a u64 representing the corresponding
 * physical page flags.
 */

83 84 85 86 87
static inline u64 kpf_copy_bit(u64 kflags, int ubit, int kbit)
{
	return ((kflags >> kbit) & 1) << ubit;
}

W
Wu Fengguang 已提交
88
u64 stable_page_flags(struct page *page)
89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106
{
	u64 k;
	u64 u;

	/*
	 * pseudo flag: KPF_NOPAGE
	 * it differentiates a memory hole from a page with no flags
	 */
	if (!page)
		return 1 << KPF_NOPAGE;

	k = page->flags;
	u = 0;

	/*
	 * pseudo flags for the well known (anonymous) memory mapped pages
	 *
	 * Note that page->_mapcount is overloaded in SLOB/SLUB/SLQB, so the
107
	 * simple test in page_mapped() is not enough.
108
	 */
109
	if (!PageSlab(page) && page_mapped(page))
110 111 112
		u |= 1 << KPF_MMAP;
	if (PageAnon(page))
		u |= 1 << KPF_ANON;
H
Hugh Dickins 已提交
113 114
	if (PageKsm(page))
		u |= 1 << KPF_KSM;
115 116 117 118 119 120 121 122 123 124 125

	/*
	 * compound pages: export both head/tail info
	 * they together define a compound page's start/end pos and order
	 */
	if (PageHead(page))
		u |= 1 << KPF_COMPOUND_HEAD;
	if (PageTail(page))
		u |= 1 << KPF_COMPOUND_TAIL;
	if (PageHuge(page))
		u |= 1 << KPF_HUGE;
126 127 128
	/*
	 * PageTransCompound can be true for non-huge compound pages (slab
	 * pages or pages allocated by drivers with __GFP_COMP) because it
129 130
	 * just checks PG_head/PG_tail, so we need to check PageLRU/PageAnon
	 * to make sure a given page is a thp, not a non-huge compound page.
131
	 */
132 133 134 135 136 137 138 139 140 141 142 143
	else if (PageTransCompound(page)) {
		struct page *head = compound_head(page);

		if (PageLRU(head) || PageAnon(head))
			u |= 1 << KPF_THP;
		else if (is_huge_zero_page(head)) {
			u |= 1 << KPF_ZERO_PAGE;
			u |= 1 << KPF_THP;
		}
	} else if (is_zero_pfn(page_to_pfn(page)))
		u |= 1 << KPF_ZERO_PAGE;

144 145

	/*
146
	 * Caveats on high order pages: page->_refcount will only be set
A
Andrea Arcangeli 已提交
147 148
	 * -1 on the head page; SLUB/SLQB do the same for PG_slab;
	 * SLOB won't set PG_slab at all on compound pages.
149
	 */
A
Andrea Arcangeli 已提交
150 151
	if (PageBuddy(page))
		u |= 1 << KPF_BUDDY;
152 153
	else if (page_count(page) == 0 && is_free_buddy_page(page))
		u |= 1 << KPF_BUDDY;
A
Andrea Arcangeli 已提交
154

155 156
	if (PageBalloon(page))
		u |= 1 << KPF_BALLOON;
157 158
	if (PageTable(page))
		u |= 1 << KPF_PGTABLE;
159

160 161 162
	if (page_is_idle(page))
		u |= 1 << KPF_IDLE;

A
Andrea Arcangeli 已提交
163 164
	u |= kpf_copy_bit(k, KPF_LOCKED,	PG_locked);

165
	u |= kpf_copy_bit(k, KPF_SLAB,		PG_slab);
166 167
	if (PageTail(page) && PageSlab(compound_head(page)))
		u |= 1 << KPF_SLAB;
168 169 170 171 172 173 174 175 176 177 178

	u |= kpf_copy_bit(k, KPF_ERROR,		PG_error);
	u |= kpf_copy_bit(k, KPF_DIRTY,		PG_dirty);
	u |= kpf_copy_bit(k, KPF_UPTODATE,	PG_uptodate);
	u |= kpf_copy_bit(k, KPF_WRITEBACK,	PG_writeback);

	u |= kpf_copy_bit(k, KPF_LRU,		PG_lru);
	u |= kpf_copy_bit(k, KPF_REFERENCED,	PG_referenced);
	u |= kpf_copy_bit(k, KPF_ACTIVE,	PG_active);
	u |= kpf_copy_bit(k, KPF_RECLAIM,	PG_reclaim);

179 180
	if (PageSwapCache(page))
		u |= 1 << KPF_SWAPCACHE;
181 182 183 184 185
	u |= kpf_copy_bit(k, KPF_SWAPBACKED,	PG_swapbacked);

	u |= kpf_copy_bit(k, KPF_UNEVICTABLE,	PG_unevictable);
	u |= kpf_copy_bit(k, KPF_MLOCKED,	PG_mlocked);

W
Wu Fengguang 已提交
186 187 188 189
#ifdef CONFIG_MEMORY_FAILURE
	u |= kpf_copy_bit(k, KPF_HWPOISON,	PG_hwpoison);
#endif

190
#ifdef CONFIG_ARCH_USES_PG_UNCACHED
191 192 193 194 195 196 197 198 199 200 201 202
	u |= kpf_copy_bit(k, KPF_UNCACHED,	PG_uncached);
#endif

	u |= kpf_copy_bit(k, KPF_RESERVED,	PG_reserved);
	u |= kpf_copy_bit(k, KPF_MAPPEDTODISK,	PG_mappedtodisk);
	u |= kpf_copy_bit(k, KPF_PRIVATE,	PG_private);
	u |= kpf_copy_bit(k, KPF_PRIVATE_2,	PG_private_2);
	u |= kpf_copy_bit(k, KPF_OWNER_PRIVATE,	PG_owner_priv_1);
	u |= kpf_copy_bit(k, KPF_ARCH,		PG_arch_1);

	return u;
};
203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220

static ssize_t kpageflags_read(struct file *file, char __user *buf,
			     size_t count, loff_t *ppos)
{
	u64 __user *out = (u64 __user *)buf;
	struct page *ppage;
	unsigned long src = *ppos;
	unsigned long pfn;
	ssize_t ret = 0;

	pfn = src / KPMSIZE;
	count = min_t(unsigned long, count, (max_pfn * KPMSIZE) - src);
	if (src & KPMMASK || count & KPMMASK)
		return -EINVAL;

	while (count > 0) {
		if (pfn_valid(pfn))
			ppage = pfn_to_page(pfn);
221 222
		else
			ppage = NULL;
223

W
Wu Fengguang 已提交
224
		if (put_user(stable_page_flags(ppage), out)) {
225 226 227 228
			ret = -EFAULT;
			break;
		}

229 230
		pfn++;
		out++;
231
		count -= KPMSIZE;
232 233

		cond_resched();
234 235 236 237 238 239 240 241 242 243 244 245 246
	}

	*ppos += (char __user *)out - buf;
	if (!ret)
		ret = (char __user *)out - buf;
	return ret;
}

static const struct file_operations proc_kpageflags_operations = {
	.llseek = mem_lseek,
	.read = kpageflags_read,
};

V
Vladimir Davydov 已提交
247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281
#ifdef CONFIG_MEMCG
static ssize_t kpagecgroup_read(struct file *file, char __user *buf,
				size_t count, loff_t *ppos)
{
	u64 __user *out = (u64 __user *)buf;
	struct page *ppage;
	unsigned long src = *ppos;
	unsigned long pfn;
	ssize_t ret = 0;
	u64 ino;

	pfn = src / KPMSIZE;
	count = min_t(unsigned long, count, (max_pfn * KPMSIZE) - src);
	if (src & KPMMASK || count & KPMMASK)
		return -EINVAL;

	while (count > 0) {
		if (pfn_valid(pfn))
			ppage = pfn_to_page(pfn);
		else
			ppage = NULL;

		if (ppage)
			ino = page_cgroup_ino(ppage);
		else
			ino = 0;

		if (put_user(ino, out)) {
			ret = -EFAULT;
			break;
		}

		pfn++;
		out++;
		count -= KPMSIZE;
282 283

		cond_resched();
V
Vladimir Davydov 已提交
284 285 286 287 288 289 290 291 292 293 294 295 296 297
	}

	*ppos += (char __user *)out - buf;
	if (!ret)
		ret = (char __user *)out - buf;
	return ret;
}

static const struct file_operations proc_kpagecgroup_operations = {
	.llseek = mem_lseek,
	.read = kpagecgroup_read,
};
#endif /* CONFIG_MEMCG */

298 299 300 301
static int __init proc_page_init(void)
{
	proc_create("kpagecount", S_IRUSR, NULL, &proc_kpagecount_operations);
	proc_create("kpageflags", S_IRUSR, NULL, &proc_kpageflags_operations);
V
Vladimir Davydov 已提交
302 303 304
#ifdef CONFIG_MEMCG
	proc_create("kpagecgroup", S_IRUSR, NULL, &proc_kpagecgroup_operations);
#endif
305 306
	return 0;
}
307
fs_initcall(proc_page_init);