process.c 9.2 KB
Newer Older
J
Jeff Dike 已提交
1
/*
J
Jeff Dike 已提交
2
 * Copyright (C) 2000 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com)
L
Linus Torvalds 已提交
3 4 5 6
 * Copyright 2003 PathScale, Inc.
 * Licensed under the GPL
 */

J
Jeff Dike 已提交
7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
#include <linux/stddef.h>
#include <linux/err.h>
#include <linux/hardirq.h>
#include <linux/gfp.h>
#include <linux/mm.h>
#include <linux/personality.h>
#include <linux/proc_fs.h>
#include <linux/ptrace.h>
#include <linux/random.h>
#include <linux/sched.h>
#include <linux/tick.h>
#include <linux/threads.h>
#include <asm/current.h>
#include <asm/pgtable.h>
#include <asm/uaccess.h>
J
Jeff Dike 已提交
22
#include "as-layout.h"
J
Jeff Dike 已提交
23
#include "kern_util.h"
L
Linus Torvalds 已提交
24
#include "os.h"
25
#include "skas.h"
J
Jeff Dike 已提交
26
#include "tlb.h"
L
Linus Torvalds 已提交
27

J
Jeff Dike 已提交
28 29
/*
 * This is a per-cpu array.  A processor only modifies its entry and it only
L
Linus Torvalds 已提交
30 31 32 33 34
 * cares about its entry, so it's OK if another processor is modifying its
 * entry.
 */
struct cpu_task cpu_tasks[NR_CPUS] = { [0 ... NR_CPUS - 1] = { -1, NULL } };

35
static inline int external_pid(void)
L
Linus Torvalds 已提交
36
{
37
	/* FIXME: Need to look up userspace_pid by cpu */
J
Jeff Dike 已提交
38
	return userspace_pid[0];
L
Linus Torvalds 已提交
39 40 41 42 43 44
}

int pid_to_processor_id(int pid)
{
	int i;

J
Jeff Dike 已提交
45
	for (i = 0; i < ncpus; i++) {
J
Jeff Dike 已提交
46
		if (cpu_tasks[i].pid == pid)
J
Jeff Dike 已提交
47
			return i;
L
Linus Torvalds 已提交
48
	}
J
Jeff Dike 已提交
49
	return -1;
L
Linus Torvalds 已提交
50 51 52 53 54 55 56 57 58 59
}

void free_stack(unsigned long stack, int order)
{
	free_pages(stack, order);
}

unsigned long alloc_stack(int order, int atomic)
{
	unsigned long page;
A
Al Viro 已提交
60
	gfp_t flags = GFP_KERNEL;
L
Linus Torvalds 已提交
61

62 63
	if (atomic)
		flags = GFP_ATOMIC;
L
Linus Torvalds 已提交
64
	page = __get_free_pages(flags, order);
65

J
Jeff Dike 已提交
66
	return page;
L
Linus Torvalds 已提交
67 68 69 70 71 72 73 74
}

int kernel_thread(int (*fn)(void *), void * arg, unsigned long flags)
{
	int pid;

	current->thread.request.u.thread.proc = fn;
	current->thread.request.u.thread.arg = arg;
J
Jeff Dike 已提交
75 76
	pid = do_fork(CLONE_VM | CLONE_UNTRACED | flags, 0,
		      &current->thread.regs, 0, NULL, NULL);
J
Jeff Dike 已提交
77
	return pid;
L
Linus Torvalds 已提交
78 79
}

J
Jeff Dike 已提交
80
static inline void set_current(struct task_struct *task)
L
Linus Torvalds 已提交
81
{
A
Al Viro 已提交
82
	cpu_tasks[task_thread_info(task)->cpu] = ((struct cpu_task)
83
		{ external_pid(), task });
L
Linus Torvalds 已提交
84 85
}

86
extern void arch_switch_to(struct task_struct *to);
87

L
Linus Torvalds 已提交
88 89
void *_switch_to(void *prev, void *next, void *last)
{
J
Jeff Dike 已提交
90
	struct task_struct *from = prev;
91
	struct task_struct *to = next;
92

J
Jeff Dike 已提交
93 94
	to->thread.prev_sched = from;
	set_current(to);
95

96
	do {
J
Jeff Dike 已提交
97
		current->thread.saved_task = NULL;
98

J
Jeff Dike 已提交
99 100
		switch_threads(&from->thread.switch_buf,
			       &to->thread.switch_buf);
101

102
		arch_switch_to(current);
103

J
Jeff Dike 已提交
104
		if (current->thread.saved_task)
105
			show_regs(&(current->thread.regs));
J
Jeff Dike 已提交
106 107
		to = current->thread.saved_task;
		from = current;
108
	} while (current->thread.saved_task);
109

J
Jeff Dike 已提交
110
	return current->thread.prev_sched;
111

L
Linus Torvalds 已提交
112 113 114 115
}

void interrupt_end(void)
{
J
Jeff Dike 已提交
116
	if (need_resched())
J
Jeff Dike 已提交
117
		schedule();
J
Jeff Dike 已提交
118
	if (test_tsk_thread_flag(current, TIF_SIGPENDING))
J
Jeff Dike 已提交
119
		do_signal();
L
Linus Torvalds 已提交
120 121 122 123 124
}

void exit_thread(void)
{
}
J
Jeff Dike 已提交
125

L
Linus Torvalds 已提交
126 127
void *get_current(void)
{
J
Jeff Dike 已提交
128
	return current;
L
Linus Torvalds 已提交
129 130
}

J
Jeff Dike 已提交
131 132
/*
 * This is called magically, by its address being stuffed in a jmp_buf
133 134 135 136 137 138 139
 * and being longjmp-d to.
 */
void new_thread_handler(void)
{
	int (*fn)(void *), n;
	void *arg;

J
Jeff Dike 已提交
140
	if (current->thread.prev_sched != NULL)
141 142 143 144 145 146
		schedule_tail(current->thread.prev_sched);
	current->thread.prev_sched = NULL;

	fn = current->thread.request.u.thread.proc;
	arg = current->thread.request.u.thread.arg;

J
Jeff Dike 已提交
147 148
	/*
	 * The return value is 1 if the kernel thread execs a process,
149 150 151
	 * 0 if it just exits
	 */
	n = run_kernel_thread(fn, arg, &current->thread.exec_buf);
J
Jeff Dike 已提交
152
	if (n == 1) {
153 154 155 156 157 158 159 160 161 162 163 164 165 166
		/* Handle any immediate reschedules or signals */
		interrupt_end();
		userspace(&current->thread.regs.regs);
	}
	else do_exit(0);
}

/* Called magically, see new_thread_handler above */
void fork_handler(void)
{
	force_flush_all();

	schedule_tail(current->thread.prev_sched);

J
Jeff Dike 已提交
167 168
	/*
	 * XXX: if interrupt_end() calls schedule, this call to
169
	 * arch_switch_to isn't needed. We could want to apply this to
J
Jeff Dike 已提交
170 171
	 * improve performance. -bb
	 */
172
	arch_switch_to(current);
173 174 175 176 177 178 179 180 181

	current->thread.prev_sched = NULL;

	/* Handle any immediate reschedules or signals */
	interrupt_end();

	userspace(&current->thread.regs.regs);
}

L
Linus Torvalds 已提交
182
int copy_thread(int nr, unsigned long clone_flags, unsigned long sp,
J
Jeff Dike 已提交
183
		unsigned long stack_top, struct task_struct * p,
L
Linus Torvalds 已提交
184 185
		struct pt_regs *regs)
{
186 187
	void (*handler)(void);
	int ret = 0;
188

L
Linus Torvalds 已提交
189
	p->thread = (struct thread_struct) INIT_THREAD;
190

J
Jeff Dike 已提交
191
	if (current->thread.forking) {
192 193
	  	memcpy(&p->thread.regs.regs, &regs->regs,
		       sizeof(p->thread.regs.regs));
194
		REGS_SET_SYSCALL_RETURN(p->thread.regs.regs.gp, 0);
J
Jeff Dike 已提交
195
		if (sp != 0)
196
			REGS_SP(p->thread.regs.regs.gp) = sp;
197

198
		handler = fork_handler;
199

200 201 202
		arch_copy_thread(&current->thread.arch, &p->thread.arch);
	}
	else {
203
		get_safe_registers(p->thread.regs.regs.gp);
204 205 206 207 208 209 210 211 212 213 214 215 216 217 218
		p->thread.request.u.thread = current->thread.request.u.thread;
		handler = new_thread_handler;
	}

	new_thread(task_stack_page(p), &p->thread.switch_buf, handler);

	if (current->thread.forking) {
		clear_flushed_tls(p);

		/*
		 * Set a new TLS for the child thread?
		 */
		if (clone_flags & CLONE_SETTLS)
			ret = arch_copy_tls(p);
	}
219 220

	return ret;
L
Linus Torvalds 已提交
221 222 223 224 225 226 227
}

void initial_thread_cb(void (*proc)(void *), void *arg)
{
	int save_kmalloc_ok = kmalloc_ok;

	kmalloc_ok = 0;
J
Jeff Dike 已提交
228
	initial_thread_cb_skas(proc, arg);
L
Linus Torvalds 已提交
229 230
	kmalloc_ok = save_kmalloc_ok;
}
J
Jeff Dike 已提交
231

L
Linus Torvalds 已提交
232 233
void default_idle(void)
{
234 235
	unsigned long long nsecs;

J
Jeff Dike 已提交
236
	while (1) {
L
Linus Torvalds 已提交
237 238 239 240 241 242
		/* endless idle loop with no priority at all */

		/*
		 * although we are an idle CPU, we do not want to
		 * get into the scheduler unnecessarily.
		 */
J
Jeff Dike 已提交
243
		if (need_resched())
L
Linus Torvalds 已提交
244
			schedule();
J
Jeff Dike 已提交
245

J
Jeff Dike 已提交
246
		tick_nohz_stop_sched_tick();
247 248
		nsecs = disable_timer();
		idle_sleep(nsecs);
J
Jeff Dike 已提交
249
		tick_nohz_restart_sched_tick();
L
Linus Torvalds 已提交
250 251 252 253 254
	}
}

void cpu_idle(void)
{
J
Jeff Dike 已提交
255
	cpu_tasks[current_thread_info()->cpu].pid = os_getpid();
256
	default_idle();
L
Linus Torvalds 已提交
257 258
}

259 260 261
int __cant_sleep(void) {
	return in_atomic() || irqs_disabled() || in_interrupt();
	/* Is in_interrupt() really needed? */
L
Linus Torvalds 已提交
262 263 264 265 266 267 268
}

int user_context(unsigned long sp)
{
	unsigned long stack;

	stack = sp & (PAGE_MASK << CONFIG_KERNEL_STACK_ORDER);
J
Jeff Dike 已提交
269
	return stack != (unsigned long) current_thread_info();
L
Linus Torvalds 已提交
270 271 272 273 274 275 276 277 278 279 280 281 282
}

extern exitcall_t __uml_exitcall_begin, __uml_exitcall_end;

void do_uml_exitcalls(void)
{
	exitcall_t *call;

	call = &__uml_exitcall_end;
	while (--call >= &__uml_exitcall_begin)
		(*call)();
}

W
WANG Cong 已提交
283
char *uml_strdup(const char *string)
L
Linus Torvalds 已提交
284
{
285
	return kstrdup(string, GFP_KERNEL);
L
Linus Torvalds 已提交
286 287 288 289
}

int copy_to_user_proc(void __user *to, void *from, int size)
{
J
Jeff Dike 已提交
290
	return copy_to_user(to, from, size);
L
Linus Torvalds 已提交
291 292 293 294
}

int copy_from_user_proc(void *to, void __user *from, int size)
{
J
Jeff Dike 已提交
295
	return copy_from_user(to, from, size);
L
Linus Torvalds 已提交
296 297 298 299
}

int clear_user_proc(void __user *buf, int size)
{
J
Jeff Dike 已提交
300
	return clear_user(buf, size);
L
Linus Torvalds 已提交
301 302 303 304
}

int strlen_user_proc(char __user *str)
{
J
Jeff Dike 已提交
305
	return strlen_user(str);
L
Linus Torvalds 已提交
306 307 308 309 310
}

int smp_sigio_handler(void)
{
#ifdef CONFIG_SMP
J
Jeff Dike 已提交
311
	int cpu = current_thread_info()->cpu;
L
Linus Torvalds 已提交
312
	IPI_handler(cpu);
J
Jeff Dike 已提交
313
	if (cpu != 0)
J
Jeff Dike 已提交
314
		return 1;
L
Linus Torvalds 已提交
315
#endif
J
Jeff Dike 已提交
316
	return 0;
L
Linus Torvalds 已提交
317 318 319 320
}

int cpu(void)
{
J
Jeff Dike 已提交
321
	return current_thread_info()->cpu;
L
Linus Torvalds 已提交
322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340
}

static atomic_t using_sysemu = ATOMIC_INIT(0);
int sysemu_supported;

void set_using_sysemu(int value)
{
	if (value > sysemu_supported)
		return;
	atomic_set(&using_sysemu, value);
}

int get_using_sysemu(void)
{
	return atomic_read(&using_sysemu);
}

static int proc_read_sysemu(char *buf, char **start, off_t offset, int size,int *eof, void *data)
{
J
Jeff Dike 已提交
341 342
	if (snprintf(buf, size, "%d\n", get_using_sysemu()) < size)
		/* No overflow */
L
Linus Torvalds 已提交
343 344 345 346 347
		*eof = 1;

	return strlen(buf);
}

A
Al Viro 已提交
348
static int proc_write_sysemu(struct file *file,const char __user *buf, unsigned long count,void *data)
L
Linus Torvalds 已提交
349 350 351 352 353 354 355 356
{
	char tmp[2];

	if (copy_from_user(tmp, buf, 1))
		return -EFAULT;

	if (tmp[0] >= '0' && tmp[0] <= '2')
		set_using_sysemu(tmp[0] - '0');
J
Jeff Dike 已提交
357 358
	/* We use the first char, but pretend to write everything */
	return count;
L
Linus Torvalds 已提交
359 360 361 362 363 364 365 366 367 368 369 370
}

int __init make_proc_sysemu(void)
{
	struct proc_dir_entry *ent;
	if (!sysemu_supported)
		return 0;

	ent = create_proc_entry("sysemu", 0600, &proc_root);

	if (ent == NULL)
	{
371
		printk(KERN_WARNING "Failed to register /proc/sysemu\n");
J
Jeff Dike 已提交
372
		return 0;
L
Linus Torvalds 已提交
373 374 375 376 377 378 379 380 381 382 383 384 385 386
	}

	ent->read_proc  = proc_read_sysemu;
	ent->write_proc = proc_write_sysemu;

	return 0;
}

late_initcall(make_proc_sysemu);

int singlestepping(void * t)
{
	struct task_struct *task = t ? t : current;

J
Jeff Dike 已提交
387
	if (!(task->ptrace & PT_DTRACE))
J
Jeff Dike 已提交
388
		return 0;
L
Linus Torvalds 已提交
389 390

	if (task->thread.singlestep_syscall)
J
Jeff Dike 已提交
391
		return 1;
L
Linus Torvalds 已提交
392 393 394 395

	return 2;
}

396 397 398 399 400 401 402 403
/*
 * Only x86 and x86_64 have an arch_align_stack().
 * All other arches have "#define arch_align_stack(x) (x)"
 * in their asm/system.h
 * As this is included in UML from asm-um/system-generic.h,
 * we can use it to behave as the subarch does.
 */
#ifndef arch_align_stack
L
Linus Torvalds 已提交
404 405
unsigned long arch_align_stack(unsigned long sp)
{
J
Jeff Dike 已提交
406
	if (!(current->personality & ADDR_NO_RANDOMIZE) && randomize_va_space)
L
Linus Torvalds 已提交
407 408 409
		sp -= get_random_int() % 8192;
	return sp & ~0xf;
}
410
#endif
J
Jeff Dike 已提交
411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445

unsigned long get_wchan(struct task_struct *p)
{
	unsigned long stack_page, sp, ip;
	bool seen_sched = 0;

	if ((p == NULL) || (p == current) || (p->state == TASK_RUNNING))
		return 0;

	stack_page = (unsigned long) task_stack_page(p);
	/* Bail if the process has no kernel stack for some reason */
	if (stack_page == 0)
		return 0;

	sp = p->thread.switch_buf->JB_SP;
	/*
	 * Bail if the stack pointer is below the bottom of the kernel
	 * stack for some reason
	 */
	if (sp < stack_page)
		return 0;

	while (sp < stack_page + THREAD_SIZE) {
		ip = *((unsigned long *) sp);
		if (in_sched_functions(ip))
			/* Ignore everything until we're above the scheduler */
			seen_sched = 1;
		else if (kernel_text_address(ip) && seen_sched)
			return ip;

		sp += sizeof(unsigned long);
	}

	return 0;
}
J
Jeff Dike 已提交
446 447 448 449 450 451 452 453

int elf_core_copy_fpregs(struct task_struct *t, elf_fpregset_t *fpu)
{
	int cpu = current_thread_info()->cpu;

	return save_fp_registers(userspace_pid[cpu], (unsigned long *) fpu);
}