process_vm_access.c 10.2 KB
Newer Older
C
Christopher Yeoh 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
/*
 * linux/mm/process_vm_access.c
 *
 * Copyright (C) 2010-2011 Christopher Yeoh <cyeoh@au1.ibm.com>, IBM Corp.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */

#include <linux/mm.h>
#include <linux/uio.h>
#include <linux/sched.h>
#include <linux/highmem.h>
#include <linux/ptrace.h>
#include <linux/slab.h>
#include <linux/syscalls.h>

#ifdef CONFIG_COMPAT
#include <linux/compat.h>
#endif

/**
 * process_vm_rw_pages - read/write pages from task specified
A
Al Viro 已提交
26
 * @pages: array of pointers to pages we want to copy
C
Christopher Yeoh 已提交
27 28
 * @start_offset: offset in page to start copying from/to
 * @len: number of bytes to copy
A
Al Viro 已提交
29
 * @iter: where to copy to/from locally
C
Christopher Yeoh 已提交
30 31 32
 * @vm_write: 0 means copy from, 1 means copy to
 * Returns 0 on success, error code otherwise
 */
33 34
static int process_vm_rw_pages(struct page **pages,
			       unsigned offset,
35
			       size_t len,
A
Al Viro 已提交
36
			       struct iov_iter *iter,
37
			       int vm_write)
C
Christopher Yeoh 已提交
38 39
{
	/* Do the copy for each page */
40
	while (len && iov_iter_count(iter)) {
41
		struct page *page = *pages++;
42
		size_t copy = PAGE_SIZE - offset;
43
		size_t copied;
44

45 46 47
		if (copy > len)
			copy = len;

48
		if (vm_write) {
A
Al Viro 已提交
49
			copied = copy_page_from_iter(page, offset, copy, iter);
50
			set_page_dirty_lock(page);
C
Christopher Yeoh 已提交
51
		} else {
52
			copied = copy_page_to_iter(page, offset, copy, iter);
C
Christopher Yeoh 已提交
53
		}
54 55 56 57
		len -= copied;
		if (copied < copy && iov_iter_count(iter))
			return -EFAULT;
		offset = 0;
C
Christopher Yeoh 已提交
58
	}
59
	return 0;
C
Christopher Yeoh 已提交
60 61 62 63 64 65 66 67 68
}

/* Maximum number of bytes kmalloc'd to hold struct page pointers during copy */
#define PVM_MAX_KMALLOC_PAGES (PAGE_SIZE * 2)

/**
 * process_vm_rw_single_vec - read/write pages from task specified
 * @addr: start memory address of target process
 * @len: size of area to copy to/from
A
Al Viro 已提交
69
 * @iter: where to copy to/from locally
C
Christopher Yeoh 已提交
70 71 72 73 74 75 76 77 78
 * @process_pages: struct pages area that can store at least
 *  nr_pages_to_copy struct page pointers
 * @mm: mm for task
 * @task: task to read/write from
 * @vm_write: 0 means copy from, 1 means copy to
 * Returns 0 on success or on failure error code
 */
static int process_vm_rw_single_vec(unsigned long addr,
				    unsigned long len,
A
Al Viro 已提交
79
				    struct iov_iter *iter,
C
Christopher Yeoh 已提交
80 81 82
				    struct page **process_pages,
				    struct mm_struct *mm,
				    struct task_struct *task,
83
				    int vm_write)
C
Christopher Yeoh 已提交
84 85 86 87 88 89 90 91 92 93 94 95 96
{
	unsigned long pa = addr & PAGE_MASK;
	unsigned long start_offset = addr - pa;
	unsigned long nr_pages;
	ssize_t rc = 0;
	unsigned long max_pages_per_loop = PVM_MAX_KMALLOC_PAGES
		/ sizeof(struct pages *);

	/* Work out address and page range required */
	if (len == 0)
		return 0;
	nr_pages = (addr + len - 1) / PAGE_SIZE - addr / PAGE_SIZE + 1;

A
Al Viro 已提交
97 98 99
	while (!rc && nr_pages && iov_iter_count(iter)) {
		int pages = min(nr_pages, max_pages_per_loop);
		size_t bytes;
C
Christopher Yeoh 已提交
100

101 102
		/* Get the pages we're interested in */
		down_read(&mm->mmap_sem);
A
Al Viro 已提交
103 104
		pages = get_user_pages(task, mm, pa, pages,
				      vm_write, 0, process_pages, NULL);
105
		up_read(&mm->mmap_sem);
C
Christopher Yeoh 已提交
106

A
Al Viro 已提交
107
		if (pages <= 0)
108 109
			return -EFAULT;

A
Al Viro 已提交
110 111 112
		bytes = pages * PAGE_SIZE - start_offset;
		if (bytes > len)
			bytes = len;
113

114
		rc = process_vm_rw_pages(process_pages,
A
Al Viro 已提交
115
					 start_offset, bytes, iter,
116
					 vm_write);
A
Al Viro 已提交
117
		len -= bytes;
C
Christopher Yeoh 已提交
118
		start_offset = 0;
A
Al Viro 已提交
119 120 121 122
		nr_pages -= pages;
		pa += pages * PAGE_SIZE;
		while (pages)
			put_page(process_pages[--pages]);
C
Christopher Yeoh 已提交
123 124 125 126 127 128 129 130 131 132 133 134
	}

	return rc;
}

/* Maximum number of entries for process pages array
   which lives on stack */
#define PVM_MAX_PP_ARRAY_COUNT 16

/**
 * process_vm_rw_core - core of reading/writing pages from task specified
 * @pid: PID of process to read/write from/to
A
Al Viro 已提交
135
 * @iter: where to copy to/from locally
C
Christopher Yeoh 已提交
136 137 138 139 140 141 142 143
 * @rvec: iovec array specifying where to copy to/from in the other process
 * @riovcnt: size of rvec array
 * @flags: currently unused
 * @vm_write: 0 if reading from other process, 1 if writing to other process
 * Returns the number of bytes read/written or error code. May
 *  return less bytes than expected if an error occurs during the copying
 *  process.
 */
A
Al Viro 已提交
144
static ssize_t process_vm_rw_core(pid_t pid, struct iov_iter *iter,
C
Christopher Yeoh 已提交
145 146 147 148 149 150 151 152 153 154 155 156 157
				  const struct iovec *rvec,
				  unsigned long riovcnt,
				  unsigned long flags, int vm_write)
{
	struct task_struct *task;
	struct page *pp_stack[PVM_MAX_PP_ARRAY_COUNT];
	struct page **process_pages = pp_stack;
	struct mm_struct *mm;
	unsigned long i;
	ssize_t rc = 0;
	unsigned long nr_pages = 0;
	unsigned long nr_pages_iov;
	ssize_t iov_len;
158
	size_t total_len = iov_iter_count(iter);
C
Christopher Yeoh 已提交
159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199

	/*
	 * Work out how many pages of struct pages we're going to need
	 * when eventually calling get_user_pages
	 */
	for (i = 0; i < riovcnt; i++) {
		iov_len = rvec[i].iov_len;
		if (iov_len > 0) {
			nr_pages_iov = ((unsigned long)rvec[i].iov_base
					+ iov_len)
				/ PAGE_SIZE - (unsigned long)rvec[i].iov_base
				/ PAGE_SIZE + 1;
			nr_pages = max(nr_pages, nr_pages_iov);
		}
	}

	if (nr_pages == 0)
		return 0;

	if (nr_pages > PVM_MAX_PP_ARRAY_COUNT) {
		/* For reliability don't try to kmalloc more than
		   2 pages worth */
		process_pages = kmalloc(min_t(size_t, PVM_MAX_KMALLOC_PAGES,
					      sizeof(struct pages *)*nr_pages),
					GFP_KERNEL);

		if (!process_pages)
			return -ENOMEM;
	}

	/* Get process information */
	rcu_read_lock();
	task = find_task_by_vpid(pid);
	if (task)
		get_task_struct(task);
	rcu_read_unlock();
	if (!task) {
		rc = -ESRCH;
		goto free_proc_pages;
	}

200 201 202 203 204 205 206 207 208
	mm = mm_access(task, PTRACE_MODE_ATTACH);
	if (!mm || IS_ERR(mm)) {
		rc = IS_ERR(mm) ? PTR_ERR(mm) : -ESRCH;
		/*
		 * Explicitly map EACCES to EPERM as EPERM is a more a
		 * appropriate error code for process_vw_readv/writev
		 */
		if (rc == -EACCES)
			rc = -EPERM;
C
Christopher Yeoh 已提交
209 210 211
		goto put_task_struct;
	}

212
	for (i = 0; i < riovcnt && iov_iter_count(iter) && !rc; i++)
C
Christopher Yeoh 已提交
213 214
		rc = process_vm_rw_single_vec(
			(unsigned long)rvec[i].iov_base, rvec[i].iov_len,
215 216 217 218 219 220 221 222 223 224
			iter, process_pages, mm, task, vm_write);

	/* copied = space before - space after */
	total_len -= iov_iter_count(iter);

	/* If we have managed to copy any data at all then
	   we return the number of bytes copied. Otherwise
	   we return the error code */
	if (total_len)
		rc = total_len;
C
Christopher Yeoh 已提交
225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260

	mmput(mm);

put_task_struct:
	put_task_struct(task);

free_proc_pages:
	if (process_pages != pp_stack)
		kfree(process_pages);
	return rc;
}

/**
 * process_vm_rw - check iovecs before calling core routine
 * @pid: PID of process to read/write from/to
 * @lvec: iovec array specifying where to copy to/from locally
 * @liovcnt: size of lvec array
 * @rvec: iovec array specifying where to copy to/from in the other process
 * @riovcnt: size of rvec array
 * @flags: currently unused; any non-zero value is rejected with -EINVAL
 * @vm_write: 0 if reading from other process, 1 if writing to other process
 * Returns the number of bytes read/written or error code. May
 *  return less bytes than expected if an error occurs during the copying
 *  process.
 */
static ssize_t process_vm_rw(pid_t pid,
			     const struct iovec __user *lvec,
			     unsigned long liovcnt,
			     const struct iovec __user *rvec,
			     unsigned long riovcnt,
			     unsigned long flags, int vm_write)
{
	struct iovec iovstack_l[UIO_FASTIOV];
	struct iovec iovstack_r[UIO_FASTIOV];
	struct iovec *iov_l = iovstack_l;
	struct iovec *iov_r = iovstack_r;
	struct iov_iter iter;
	/* Same direction is used for the iovec check and for the iterator */
	const int dir = vm_write ? WRITE : READ;
	ssize_t rc;

	if (flags != 0)
		return -EINVAL;

	/* Check the local iovec; rc is its total length on success */
	rc = rw_copy_check_uvector(dir, lvec, liovcnt, UIO_FASTIOV,
				   iovstack_l, &iov_l);
	if (rc <= 0)
		goto free_iovecs;

	iov_iter_init(&iter, dir, iov_l, liovcnt, rc);

	/* Check the remote iovec using the CHECK_IOVEC_ONLY mode */
	rc = rw_copy_check_uvector(CHECK_IOVEC_ONLY, rvec, riovcnt, UIO_FASTIOV,
				   iovstack_r, &iov_r);
	if (rc <= 0)
		goto free_iovecs;

	rc = process_vm_rw_core(pid, &iter, iov_r, riovcnt, flags, vm_write);

free_iovecs:
	/* Only free arrays that were not the on-stack ones */
	if (iov_r != iovstack_r)
		kfree(iov_r);
	if (iov_l != iovstack_l)
		kfree(iov_l);

	return rc;
}

/*
 * process_vm_readv system call entry point: forwards its arguments to
 * process_vm_rw() with vm_write = 0, i.e. reading from the other process.
 */
SYSCALL_DEFINE6(process_vm_readv, pid_t, pid, const struct iovec __user *, lvec,
		unsigned long, liovcnt, const struct iovec __user *, rvec,
		unsigned long, riovcnt,	unsigned long, flags)
{
	return process_vm_rw(pid, lvec, liovcnt, rvec, riovcnt, flags, 0);
}

/*
 * process_vm_writev system call entry point: forwards its arguments to
 * process_vm_rw() with vm_write = 1, i.e. writing to the other process.
 */
SYSCALL_DEFINE6(process_vm_writev, pid_t, pid,
		const struct iovec __user *, lvec,
		unsigned long, liovcnt, const struct iovec __user *, rvec,
		unsigned long, riovcnt,	unsigned long, flags)
{
	return process_vm_rw(pid, lvec, liovcnt, rvec, riovcnt, flags, 1);
}

#ifdef CONFIG_COMPAT

312
static ssize_t
C
Christopher Yeoh 已提交
313 314 315 316 317 318 319 320 321 322 323
compat_process_vm_rw(compat_pid_t pid,
		     const struct compat_iovec __user *lvec,
		     unsigned long liovcnt,
		     const struct compat_iovec __user *rvec,
		     unsigned long riovcnt,
		     unsigned long flags, int vm_write)
{
	struct iovec iovstack_l[UIO_FASTIOV];
	struct iovec iovstack_r[UIO_FASTIOV];
	struct iovec *iov_l = iovstack_l;
	struct iovec *iov_r = iovstack_r;
A
Al Viro 已提交
324
	struct iov_iter iter;
C
Christopher Yeoh 已提交
325 326 327 328 329 330 331 332
	ssize_t rc = -EFAULT;

	if (flags != 0)
		return -EINVAL;

	if (vm_write)
		rc = compat_rw_copy_check_uvector(WRITE, lvec, liovcnt,
						  UIO_FASTIOV, iovstack_l,
333
						  &iov_l);
C
Christopher Yeoh 已提交
334 335 336
	else
		rc = compat_rw_copy_check_uvector(READ, lvec, liovcnt,
						  UIO_FASTIOV, iovstack_l,
337
						  &iov_l);
C
Christopher Yeoh 已提交
338 339
	if (rc <= 0)
		goto free_iovecs;
A
Al Viro 已提交
340
	iov_iter_init(&iter, vm_write ? WRITE : READ, iov_l, liovcnt, rc);
341
	rc = compat_rw_copy_check_uvector(CHECK_IOVEC_ONLY, rvec, riovcnt,
C
Christopher Yeoh 已提交
342
					  UIO_FASTIOV, iovstack_r,
343
					  &iov_r);
C
Christopher Yeoh 已提交
344 345 346
	if (rc <= 0)
		goto free_iovecs;

A
Al Viro 已提交
347
	rc = process_vm_rw_core(pid, &iter, iov_r, riovcnt, flags, vm_write);
C
Christopher Yeoh 已提交
348 349 350 351 352 353 354 355 356

free_iovecs:
	if (iov_r != iovstack_r)
		kfree(iov_r);
	if (iov_l != iovstack_l)
		kfree(iov_l);
	return rc;
}

357 358 359 360 361 362
/*
 * Compat process_vm_readv system call entry point: forwards its arguments
 * to compat_process_vm_rw() with vm_write = 0.
 */
COMPAT_SYSCALL_DEFINE6(process_vm_readv, compat_pid_t, pid,
		       const struct compat_iovec __user *, lvec,
		       compat_ulong_t, liovcnt,
		       const struct compat_iovec __user *, rvec,
		       compat_ulong_t, riovcnt,
		       compat_ulong_t, flags)
{
	return compat_process_vm_rw(pid, lvec, liovcnt, rvec,
				    riovcnt, flags, 0);
}

368 369 370 371 372 373
/*
 * Compat process_vm_writev system call entry point: forwards its arguments
 * to compat_process_vm_rw() with vm_write = 1.
 */
COMPAT_SYSCALL_DEFINE6(process_vm_writev, compat_pid_t, pid,
		       const struct compat_iovec __user *, lvec,
		       compat_ulong_t, liovcnt,
		       const struct compat_iovec __user *, rvec,
		       compat_ulong_t, riovcnt,
		       compat_ulong_t, flags)
{
	return compat_process_vm_rw(pid, lvec, liovcnt, rvec,
				    riovcnt, flags, 1);
}

#endif