mem.c 6.9 KB
Newer Older
1
/*
 * Copyright (C) 2002 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com)
 * Licensed under the GPL
 */

J
Jeff Dike 已提交
6 7
#include <stddef.h>
#include <unistd.h>
L
Linus Torvalds 已提交
8
#include <errno.h>
9
#include <string.h>
L
Linus Torvalds 已提交
10
#include <sys/mman.h>
J
Jeff Dike 已提交
11 12 13
#include "init.h"
#include "kern_constants.h"
#include "mm_id.h"
L
Linus Torvalds 已提交
14 15
#include "os.h"
#include "proc_mm.h"
16 17
#include "ptrace_user.h"
#include "registers.h"
J
Jeff Dike 已提交
18 19
#include "skas.h"
#include "user.h"
20 21
#include "sysdep/ptrace.h"
#include "sysdep/stub.h"
J
Jeff Dike 已提交
22
#include "uml-config.h"
23

24
extern unsigned long batch_syscall_stub, __syscall_stub_start;
25

J
Jeff Dike 已提交
26
extern void wait_stub_done(int pid);
27

28 29 30
static inline unsigned long *check_init_stack(struct mm_id * mm_idp,
					      unsigned long *stack)
{
J
Jeff Dike 已提交
31
	if (stack == NULL) {
32 33 34 35 36 37
		stack = (unsigned long *) mm_idp->stack + 2;
		*stack = 0;
	}
	return stack;
}

J
Jeff Dike 已提交
38 39 40 41
/* Register image handed to ptrace_setregs() before the stub is resumed. */
static unsigned long syscall_regs[MAX_REG_NR];

/*
 * Fill syscall_regs once at init time: start from get_safe_registers() and
 * point the instruction pointer slot at batch_syscall_stub, expressed as its
 * offset from __syscall_stub_start added to UML_CONFIG_STUB_CODE.
 *
 * Always returns 0.
 */
static int __init init_syscall_regs(void)
{
	unsigned long stub_offset;

	get_safe_registers(syscall_regs);

	stub_offset = (unsigned long) &batch_syscall_stub -
		      (unsigned long) &__syscall_stub_start;
	syscall_regs[REGS_IP_INDEX] = UML_CONFIG_STUB_CODE + stub_offset;

	return 0;
}

__initcall(init_syscall_regs);

51 52
/* Defined elsewhere; when non-zero the /proc/mm code paths below are taken. */
extern int proc_mm;

/*
 * Counters maintained by the stub code in this file:
 *   single_count   - bumped by run_syscall_stub when it is called with
 *                    done set and nothing queued yet (*addr == NULL)
 *   multi_count    - bumped on every do_syscall_stub invocation
 *   multi_op_count - bumped for every syscall queued by run_syscall_stub
 */
int single_count = 0;
int multi_count = 0;
int multi_op_count = 0;
J
Jeff Dike 已提交
56

57
static inline long do_syscall_stub(struct mm_id * mm_idp, void **addr)
L
Linus Torvalds 已提交
58
{
59
	int n, i;
60
	long ret, offset;
61 62
	unsigned long * data;
	unsigned long * syscall;
J
Jeff Dike 已提交
63
	int err, pid = mm_idp->u.pid;
64

J
Jeff Dike 已提交
65
	if (proc_mm)
66
		/* FIXME: Need to look up userspace_pid by cpu */
67 68 69
		pid = userspace_pid[0];

	multi_count++;
70

J
Jeff Dike 已提交
71
	n = ptrace_setregs(pid, syscall_regs);
J
Jeff Dike 已提交
72 73 74 75
	if (n < 0) {
		printk(UM_KERN_ERR "Registers - \n");
		for (i = 0; i < MAX_REG_NR; i++)
			printk(UM_KERN_ERR "\t%d\t0x%lx\n", i, syscall_regs[i]);
76
		panic("do_syscall_stub : PTRACE_SETREGS failed, errno = %d\n",
77 78
		      -n);
	}
79

J
Jeff Dike 已提交
80
	err = ptrace(PTRACE_CONT, pid, 0, 0);
J
Jeff Dike 已提交
81
	if (err)
J
Jeff Dike 已提交
82 83 84 85
		panic("Failed to continue stub, pid = %d, errno = %d\n", pid,
		      errno);

	wait_stub_done(pid);
86

J
Jeff Dike 已提交
87 88
	/*
	 * When the stub stops, we find the following values on the
89 90 91 92 93 94 95 96 97
	 * beginning of the stack:
	 * (long )return_value
	 * (long )offset to failed sycall-data (0, if no error)
	 */
	ret = *((unsigned long *) mm_idp->stack);
	offset = *((unsigned long *) mm_idp->stack + 1);
	if (offset) {
		data = (unsigned long *)(mm_idp->stack +
					 offset - UML_CONFIG_STUB_DATA);
J
Jeff Dike 已提交
98
		printk(UM_KERN_ERR "do_syscall_stub : ret = %ld, offset = %ld, "
99
		       "data = %p\n", ret, offset, data);
100
		syscall = (unsigned long *)((unsigned long)data + data[0]);
J
Jeff Dike 已提交
101 102
		printk(UM_KERN_ERR "do_syscall_stub: syscall %ld failed, "
		       "return value = 0x%lx, expected return value = 0x%lx\n",
103
		       syscall[0], ret, syscall[7]);
J
Jeff Dike 已提交
104
		printk(UM_KERN_ERR "    syscall parameters: "
105 106 107
		       "0x%lx 0x%lx 0x%lx 0x%lx 0x%lx 0x%lx\n",
		       syscall[1], syscall[2], syscall[3],
		       syscall[4], syscall[5], syscall[6]);
J
Jeff Dike 已提交
108 109 110 111 112 113
		for (n = 1; n < data[0]/sizeof(long); n++) {
			if (n == 1)
				printk(UM_KERN_ERR "    additional syscall "
				       "data:");
			if (n % 4 == 1)
				printk("\n" UM_KERN_ERR "      ");
114 115
			printk("  0x%lx", data[n]);
		}
J
Jeff Dike 已提交
116
		if (n > 1)
117
			printk("\n");
J
Jeff Dike 已提交
118
	}
119
	else ret = 0;
J
Jeff Dike 已提交
120

121
	*addr = check_init_stack(mm_idp, NULL);
J
Jeff Dike 已提交
122

123
	return ret;
J
Jeff Dike 已提交
124 125
}

126 127
long run_syscall_stub(struct mm_id * mm_idp, int syscall,
		      unsigned long *args, long expected, void **addr,
128
		      int done)
J
Jeff Dike 已提交
129
{
130
	unsigned long *stack = check_init_stack(mm_idp, *addr);
131

J
Jeff Dike 已提交
132
	if (done && *addr == NULL)
133 134
		single_count++;

135
	*stack += sizeof(long);
136
	stack += *stack / sizeof(long);
J
Jeff Dike 已提交
137

138 139 140 141 142 143 144
	*stack++ = syscall;
	*stack++ = args[0];
	*stack++ = args[1];
	*stack++ = args[2];
	*stack++ = args[3];
	*stack++ = args[4];
	*stack++ = args[5];
145
	*stack++ = expected;
146 147
	*stack = 0;
	multi_op_count++;
J
Jeff Dike 已提交
148

J
Jeff Dike 已提交
149 150
	if (!done && ((((unsigned long) stack) & ~UM_KERN_PAGE_MASK) <
		     UM_KERN_PAGE_SIZE - 10 * sizeof(long))) {
151
		*addr = stack;
152 153
		return 0;
	}
J
Jeff Dike 已提交
154

155 156
	return do_syscall_stub(mm_idp, addr);
}
J
Jeff Dike 已提交
157

158 159 160 161 162 163 164
long syscall_stub_data(struct mm_id * mm_idp,
		       unsigned long *data, int data_count,
		       void **addr, void **stub_addr)
{
	unsigned long *stack;
	int ret = 0;

J
Jeff Dike 已提交
165 166
	/*
	 * If *addr still is uninitialized, it *must* contain NULL.
167 168
	 * Thus in this case do_syscall_stub correctly won't be called.
	 */
J
Jeff Dike 已提交
169
	if ((((unsigned long) *addr) & ~UM_KERN_PAGE_MASK) >=
J
Jeff Dike 已提交
170
	   UM_KERN_PAGE_SIZE - (10 + data_count) * sizeof(long)) {
171
		ret = do_syscall_stub(mm_idp, addr);
172
		/* in case of error, don't overwrite data on stack */
J
Jeff Dike 已提交
173
		if (ret)
174 175
			return ret;
	}
176

177 178
	stack = check_init_stack(mm_idp, *addr);
	*addr = stack;
179

180
	*stack = data_count * sizeof(long);
L
Linus Torvalds 已提交
181

182
	memcpy(stack + 1, data, data_count * sizeof(long));
J
Jeff Dike 已提交
183

J
Jeff Dike 已提交
184 185
	*stub_addr = (void *)(((unsigned long)(stack + 1) &
			       ~UM_KERN_PAGE_MASK) + UML_CONFIG_STUB_DATA);
J
Jeff Dike 已提交
186

187
	return 0;
J
Jeff Dike 已提交
188 189
}

J
Jeff Dike 已提交
190 191
int map(struct mm_id * mm_idp, unsigned long virt, unsigned long len, int prot,
	int phys_fd, unsigned long long offset, int done, void **data)
L
Linus Torvalds 已提交
192
{
J
Jeff Dike 已提交
193
	int ret;
194

J
Jeff Dike 已提交
195
	if (proc_mm) {
196 197 198 199 200 201 202 203 204 205 206 207 208 209
		struct proc_mm_op map;
		int fd = mm_idp->u.mm_fd;

		map = ((struct proc_mm_op) { .op	= MM_MMAP,
				       .u		=
				       { .mmap	=
					 { .addr	= virt,
					   .len	= len,
					   .prot	= prot,
					   .flags	= MAP_SHARED |
					   MAP_FIXED,
					   .fd	= phys_fd,
					   .offset= offset
					 } } } );
210
		CATCH_EINTR(ret = write(fd, &map, sizeof(map)));
J
Jeff Dike 已提交
211
		if (ret != sizeof(map)) {
212
			ret = -errno;
J
Jeff Dike 已提交
213 214
			printk(UM_KERN_ERR "map : /proc/mm map failed, "
			       "err = %d\n", -ret);
215
		}
216
		else ret = 0;
217 218 219 220 221
	}
	else {
		unsigned long args[] = { virt, len, prot,
					 MAP_SHARED | MAP_FIXED, phys_fd,
					 MMAP_OFFSET(offset) };
222

223 224
		ret = run_syscall_stub(mm_idp, STUB_MMAP_NR, args, virt,
				       data, done);
225
	}
226

227
	return ret;
L
Linus Torvalds 已提交
228 229
}

J
Jeff Dike 已提交
230 231
int unmap(struct mm_id * mm_idp, unsigned long addr, unsigned long len,
	  int done, void **data)
L
Linus Torvalds 已提交
232
{
233 234
	int ret;

J
Jeff Dike 已提交
235
	if (proc_mm) {
236 237 238 239 240 241 242 243 244
		struct proc_mm_op unmap;
		int fd = mm_idp->u.mm_fd;

		unmap = ((struct proc_mm_op) { .op	= MM_MUNMAP,
					 .u	=
					 { .munmap	=
					   { .addr	=
					     (unsigned long) addr,
					     .len		= len } } } );
245
		CATCH_EINTR(ret = write(fd, &unmap, sizeof(unmap)));
J
Jeff Dike 已提交
246
		if (ret != sizeof(unmap)) {
247
			ret = -errno;
J
Jeff Dike 已提交
248 249
			printk(UM_KERN_ERR "unmap - proc_mm write returned "
			       "%d\n", ret);
250
		}
251
		else ret = 0;
252 253 254 255
	}
	else {
		unsigned long args[] = { (unsigned long) addr, len, 0, 0, 0,
					 0 };
256

257 258
		ret = run_syscall_stub(mm_idp, __NR_munmap, args, 0,
				       data, done);
259
	}
260

261
	return ret;
262
}
L
Linus Torvalds 已提交
263

264
int protect(struct mm_id * mm_idp, unsigned long addr, unsigned long len,
J
Jeff Dike 已提交
265
	    unsigned int prot, int done, void **data)
266
{
267
	struct proc_mm_op protect;
J
Jeff Dike 已提交
268
	int ret;
269

J
Jeff Dike 已提交
270
	if (proc_mm) {
271 272 273 274 275 276 277 278 279 280
		int fd = mm_idp->u.mm_fd;

		protect = ((struct proc_mm_op) { .op	= MM_MPROTECT,
					   .u	=
					   { .mprotect	=
					     { .addr	=
					       (unsigned long) addr,
					       .len	= len,
					       .prot	= prot } } } );

281
		CATCH_EINTR(ret = write(fd, &protect, sizeof(protect)));
J
Jeff Dike 已提交
282
		if (ret != sizeof(protect)) {
283
			ret = -errno;
J
Jeff Dike 已提交
284
			printk(UM_KERN_ERR "protect failed, err = %d", -ret);
285
		}
286 287 288 289 290 291 292 293 294 295
		else ret = 0;
	}
	else {
		unsigned long args[] = { addr, len, prot, 0, 0, 0 };

		ret = run_syscall_stub(mm_idp, __NR_mprotect, args, 0,
				       data, done);
	}

	return ret;
L
Linus Torvalds 已提交
296
}