process.c 9.3 KB
Newer Older
J
Jeff Dike 已提交
1
/*
 * Copyright (C) 2000 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com)
 * Copyright 2003 PathScale, Inc.
 * Licensed under the GPL
 */

J
Jeff Dike 已提交
7 8 9
#include "linux/stddef.h"
#include "linux/err.h"
#include "linux/hardirq.h"
L
Linus Torvalds 已提交
10
#include "linux/mm.h"
J
Jeff Dike 已提交
11
#include "linux/personality.h"
L
Linus Torvalds 已提交
12 13 14
#include "linux/proc_fs.h"
#include "linux/ptrace.h"
#include "linux/random.h"
J
Jeff Dike 已提交
15
#include "linux/sched.h"
J
Jeff Dike 已提交
16
#include "linux/tick.h"
J
Jeff Dike 已提交
17
#include "linux/threads.h"
L
Linus Torvalds 已提交
18 19
#include "asm/pgtable.h"
#include "asm/uaccess.h"
J
Jeff Dike 已提交
20
#include "as-layout.h"
J
Jeff Dike 已提交
21
#include "kern_util.h"
L
Linus Torvalds 已提交
22
#include "os.h"
23
#include "skas.h"
J
Jeff Dike 已提交
24
#include "tlb.h"
L
Linus Torvalds 已提交
25

J
Jeff Dike 已提交
26 27
/*
 * This is a per-cpu array.  A processor only modifies its entry and it only
 * cares about its entry, so it's OK if another processor is modifying its
 * entry.
 */
/* Every one of the NR_CPUS entries starts out as { -1, NULL }. */
struct cpu_task cpu_tasks[NR_CPUS] = { [0 ... NR_CPUS - 1] = { -1, NULL } };

J
Jeff Dike 已提交
33
static inline int external_pid(struct task_struct *task)
L
Linus Torvalds 已提交
34
{
35
	/* FIXME: Need to look up userspace_pid by cpu */
J
Jeff Dike 已提交
36
	return userspace_pid[0];
L
Linus Torvalds 已提交
37 38 39 40 41 42
}

/*
 * Find which cpu_tasks slot is currently tagged with @pid.
 *
 * Only the first ncpus entries are examined.  Returns the index of the first
 * matching slot, or -1 when no slot carries that pid.
 */
int pid_to_processor_id(int pid)
{
	int slot = 0;

	while (slot < ncpus) {
		if (cpu_tasks[slot].pid == pid)
			return slot;
		slot++;
	}

	return -1;
}

/*
 * Release a stack by passing @stack and @order straight to free_pages().
 */
void free_stack(unsigned long stack, int order)
{
	free_pages(stack, order);
}

unsigned long alloc_stack(int order, int atomic)
{
	unsigned long page;
A
Al Viro 已提交
58
	gfp_t flags = GFP_KERNEL;
L
Linus Torvalds 已提交
59

60 61
	if (atomic)
		flags = GFP_ATOMIC;
L
Linus Torvalds 已提交
62
	page = __get_free_pages(flags, order);
63
	if (page == 0)
J
Jeff Dike 已提交
64
		return 0;
65

J
Jeff Dike 已提交
66
	return page;
L
Linus Torvalds 已提交
67 68 69 70 71 72 73 74
}

int kernel_thread(int (*fn)(void *), void * arg, unsigned long flags)
{
	int pid;

	current->thread.request.u.thread.proc = fn;
	current->thread.request.u.thread.arg = arg;
J
Jeff Dike 已提交
75 76
	pid = do_fork(CLONE_VM | CLONE_UNTRACED | flags, 0,
		      &current->thread.regs, 0, NULL, NULL);
J
Jeff Dike 已提交
77
	return pid;
L
Linus Torvalds 已提交
78 79
}

J
Jeff Dike 已提交
80
static inline void set_current(struct task_struct *task)
L
Linus Torvalds 已提交
81
{
A
Al Viro 已提交
82
	cpu_tasks[task_thread_info(task)->cpu] = ((struct cpu_task)
L
Linus Torvalds 已提交
83 84 85
		{ external_pid(task), task });
}

86 87
extern void arch_switch_to(struct task_struct *from, struct task_struct *to);

L
Linus Torvalds 已提交
88 89
void *_switch_to(void *prev, void *next, void *last)
{
J
Jeff Dike 已提交
90 91
	struct task_struct *from = prev;
	struct task_struct *to= next;
92

J
Jeff Dike 已提交
93 94
	to->thread.prev_sched = from;
	set_current(to);
95

96
	do {
J
Jeff Dike 已提交
97
		current->thread.saved_task = NULL;
98 99 100 101 102 103

		switch_threads(&from->thread.switch_buf,
			       &to->thread.switch_buf);

		arch_switch_to(current->thread.prev_sched, current);

J
Jeff Dike 已提交
104
		if (current->thread.saved_task)
105 106 107 108
			show_regs(&(current->thread.regs));
		next= current->thread.saved_task;
		prev= current;
	} while(current->thread.saved_task);
109

J
Jeff Dike 已提交
110
	return current->thread.prev_sched;
111

L
Linus Torvalds 已提交
112 113 114 115
}

void interrupt_end(void)
{
J
Jeff Dike 已提交
116
	if (need_resched())
J
Jeff Dike 已提交
117
		schedule();
J
Jeff Dike 已提交
118
	if (test_tsk_thread_flag(current, TIF_SIGPENDING))
J
Jeff Dike 已提交
119
		do_signal();
L
Linus Torvalds 已提交
120 121 122 123 124
}

/* Empty: nothing is done here. */
void exit_thread(void)
{
}
J
Jeff Dike 已提交
125

L
Linus Torvalds 已提交
126 127
void *get_current(void)
{
J
Jeff Dike 已提交
128
	return current;
L
Linus Torvalds 已提交
129 130
}

131 132
extern void schedule_tail(struct task_struct *prev);

J
Jeff Dike 已提交
133 134
/*
 * This is called magically, by its address being stuffed in a jmp_buf
 * and being longjmp-d to.
 *
 * If the task has a prev_sched, schedule_tail() is called on it; the field
 * is then cleared.  The function and argument stored in thread.request are
 * run through run_kernel_thread().
 */
void new_thread_handler(void)
{
	int (*entry)(void *);
	void *entry_arg;
	int execed;

	if (current->thread.prev_sched != NULL)
		schedule_tail(current->thread.prev_sched);
	current->thread.prev_sched = NULL;

	entry = current->thread.request.u.thread.proc;
	entry_arg = current->thread.request.u.thread.arg;

	/*
	 * The return value is 1 if the kernel thread execs a process,
	 * 0 if it just exits
	 */
	execed = run_kernel_thread(entry, entry_arg,
				   &current->thread.exec_buf);
	if (execed != 1) {
		do_exit(0);
	} else {
		/* Handle any immediate reschedules or signals */
		interrupt_end();
		userspace(&current->thread.regs.regs);
	}
}

/*
 * Called magically, see new_thread_handler above.
 *
 * copy_thread() installs this as the handler when the parent was forking.
 * It flushes with force_flush_all(), requires prev_sched to be set (panics
 * otherwise), finishes the switch, and then enters userspace() with the
 * task's saved registers.
 */
void fork_handler(void)
{
	void *prev;

	force_flush_all();

	prev = current->thread.prev_sched;
	if (!prev)
		panic("blech");

	schedule_tail(prev);

	/*
	 * XXX: if interrupt_end() calls schedule, this call to
	 * arch_switch_to isn't needed. We could want to apply this to
	 * improve performance. -bb
	 */
	arch_switch_to(current->thread.prev_sched, current);

	current->thread.prev_sched = NULL;

	/* Handle any immediate reschedules or signals */
	interrupt_end();

	userspace(&current->thread.regs.regs);
}

L
Linus Torvalds 已提交
186
int copy_thread(int nr, unsigned long clone_flags, unsigned long sp,
J
Jeff Dike 已提交
187
		unsigned long stack_top, struct task_struct * p,
L
Linus Torvalds 已提交
188 189
		struct pt_regs *regs)
{
190 191
	void (*handler)(void);
	int ret = 0;
192

L
Linus Torvalds 已提交
193
	p->thread = (struct thread_struct) INIT_THREAD;
194

J
Jeff Dike 已提交
195
	if (current->thread.forking) {
196 197
	  	memcpy(&p->thread.regs.regs, &regs->regs,
		       sizeof(p->thread.regs.regs));
198
		REGS_SET_SYSCALL_RETURN(p->thread.regs.regs.gp, 0);
J
Jeff Dike 已提交
199
		if (sp != 0)
200
			REGS_SP(p->thread.regs.regs.gp) = sp;
201

202
		handler = fork_handler;
203

204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222
		arch_copy_thread(&current->thread.arch, &p->thread.arch);
	}
	else {
		init_thread_registers(&p->thread.regs.regs);
		p->thread.request.u.thread = current->thread.request.u.thread;
		handler = new_thread_handler;
	}

	new_thread(task_stack_page(p), &p->thread.switch_buf, handler);

	if (current->thread.forking) {
		clear_flushed_tls(p);

		/*
		 * Set a new TLS for the child thread?
		 */
		if (clone_flags & CLONE_SETTLS)
			ret = arch_copy_tls(p);
	}
223 224

	return ret;
L
Linus Torvalds 已提交
225 226 227 228 229 230 231
}

void initial_thread_cb(void (*proc)(void *), void *arg)
{
	int save_kmalloc_ok = kmalloc_ok;

	kmalloc_ok = 0;
J
Jeff Dike 已提交
232
	initial_thread_cb_skas(proc, arg);
L
Linus Torvalds 已提交
233 234
	kmalloc_ok = save_kmalloc_ok;
}
J
Jeff Dike 已提交
235

L
Linus Torvalds 已提交
236 237
/*
 * Idle loop; never returns.
 *
 * Each pass calls schedule() if a reschedule is needed, then stops the
 * scheduler tick, sleeps in idle_sleep() for the interval reported by
 * disable_timer(), and restarts the tick.
 */
void default_idle(void)
{
	for (;;) {
		unsigned long long sleep_ns;

		/* endless idle loop with no priority at all */

		/*
		 * although we are an idle CPU, we do not want to
		 * get into the scheduler unnecessarily.
		 */
		if (need_resched())
			schedule();

		tick_nohz_stop_sched_tick();
		sleep_ns = disable_timer();
		idle_sleep(sleep_ns);
		tick_nohz_restart_sched_tick();
	}
}

void cpu_idle(void)
{
259 260
	cpu_tasks[current_thread->cpu].pid = os_getpid();
	default_idle();
L
Linus Torvalds 已提交
261 262
}

J
Jeff Dike 已提交
263
void *um_virt_to_phys(struct task_struct *task, unsigned long addr,
L
Linus Torvalds 已提交
264 265 266 267 268 269
		      pte_t *pte_out)
{
	pgd_t *pgd;
	pud_t *pud;
	pmd_t *pmd;
	pte_t *pte;
H
Hugh Dickins 已提交
270
	pte_t ptent;
L
Linus Torvalds 已提交
271

J
Jeff Dike 已提交
272
	if (task->mm == NULL)
J
Jeff Dike 已提交
273
		return ERR_PTR(-EINVAL);
L
Linus Torvalds 已提交
274
	pgd = pgd_offset(task->mm, addr);
J
Jeff Dike 已提交
275
	if (!pgd_present(*pgd))
J
Jeff Dike 已提交
276
		return ERR_PTR(-EINVAL);
L
Linus Torvalds 已提交
277 278

	pud = pud_offset(pgd, addr);
J
Jeff Dike 已提交
279
	if (!pud_present(*pud))
J
Jeff Dike 已提交
280
		return ERR_PTR(-EINVAL);
L
Linus Torvalds 已提交
281 282

	pmd = pmd_offset(pud, addr);
J
Jeff Dike 已提交
283
	if (!pmd_present(*pmd))
J
Jeff Dike 已提交
284
		return ERR_PTR(-EINVAL);
L
Linus Torvalds 已提交
285 286

	pte = pte_offset_kernel(pmd, addr);
H
Hugh Dickins 已提交
287
	ptent = *pte;
J
Jeff Dike 已提交
288
	if (!pte_present(ptent))
J
Jeff Dike 已提交
289
		return ERR_PTR(-EINVAL);
L
Linus Torvalds 已提交
290

J
Jeff Dike 已提交
291
	if (pte_out != NULL)
H
Hugh Dickins 已提交
292
		*pte_out = ptent;
J
Jeff Dike 已提交
293
	return (void *) (pte_val(ptent) & PAGE_MASK) + (addr & ~PAGE_MASK);
L
Linus Torvalds 已提交
294 295 296 297 298
}

/*
 * Return a pointer to the argument area of the current task, or the literal
 * "(Unknown)" when it cannot be located.
 *
 * With CONFIG_SMP or CONFIG_HIGHMEM the lookup is not attempted and
 * "(Unknown)" is always returned.  Otherwise mm->arg_start is translated
 * with um_virt_to_phys() and mapped back with __va().
 */
char *current_cmd(void)
{
#if defined(CONFIG_SMP) || defined(CONFIG_HIGHMEM)
	return "(Unknown)";
#else
	void *addr;

	/*
	 * current->mm is dereferenced to fetch arg_start before
	 * um_virt_to_phys() gets a chance to check it, so a task without an
	 * mm has to be rejected here.
	 */
	if (current->mm == NULL)
		return "(Unknown)";

	addr = um_virt_to_phys(current, current->mm->arg_start, NULL);
	return IS_ERR(addr) ? "(Unknown)": __va((unsigned long) addr);
#endif
}

/* Empty: @regs is not read and nothing is written to @u. */
void dump_thread(struct pt_regs *regs, struct user *u)
{
}

310 311 312
/*
 * Returns 1 when in_atomic(), irqs_disabled() or in_interrupt() reports
 * true, checked in that order; returns 0 otherwise.
 */
int __cant_sleep(void)
{
	if (in_atomic())
		return 1;

	if (irqs_disabled())
		return 1;

	/* Is in_interrupt() really needed? */
	return in_interrupt() != 0;
}

int user_context(unsigned long sp)
{
	unsigned long stack;

	stack = sp & (PAGE_MASK << CONFIG_KERNEL_STACK_ORDER);
J
Jeff Dike 已提交
320
	return stack != (unsigned long) current_thread;
L
Linus Torvalds 已提交
321 322 323 324 325 326 327 328 329 330 331 332 333 334 335
}

extern exitcall_t __uml_exitcall_begin, __uml_exitcall_end;

/*
 * Invoke every exitcall stored between __uml_exitcall_begin and
 * __uml_exitcall_end, walking from the last entry back to the first.
 */
void do_uml_exitcalls(void)
{
	exitcall_t *call = &__uml_exitcall_end;

	while (call > &__uml_exitcall_begin) {
		call--;
		(*call)();
	}
}

char *uml_strdup(char *string)
{
336
	return kstrdup(string, GFP_KERNEL);
L
Linus Torvalds 已提交
337 338 339 340
}

/*
 * Function wrapper around copy_to_user(): copies @size bytes from @from to
 * the user pointer @to and returns copy_to_user()'s result as an int.
 */
int copy_to_user_proc(void __user *to, void *from, int size)
{
	int result = copy_to_user(to, from, size);

	return result;
}

/*
 * Function wrapper around copy_from_user(): copies @size bytes from the user
 * pointer @from to @to and returns copy_from_user()'s result as an int.
 */
int copy_from_user_proc(void *to, void __user *from, int size)
{
	int result = copy_from_user(to, from, size);

	return result;
}

/*
 * Function wrapper around clear_user(): passes the user pointer @buf and
 * @size through and returns clear_user()'s result as an int.
 */
int clear_user_proc(void __user *buf, int size)
{
	int result = clear_user(buf, size);

	return result;
}

/*
 * Function wrapper around strlen_user(): returns its result for the user
 * string @str as an int.
 */
int strlen_user_proc(char __user *str)
{
	int len = strlen_user(str);

	return len;
}

/*
 * With CONFIG_SMP, run IPI_handler() for the current CPU and return 1 when
 * that CPU is not CPU 0, otherwise 0.  Without CONFIG_SMP this does nothing
 * and returns 0.
 */
int smp_sigio_handler(void)
{
#ifdef CONFIG_SMP
	int this_cpu = current_thread->cpu;

	IPI_handler(this_cpu);
	return this_cpu != 0;
#else
	return 0;
#endif
}

int cpu(void)
{
J
Jeff Dike 已提交
372
	return current_thread->cpu;
L
Linus Torvalds 已提交
373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391
}

/* Current sysemu setting; written by set_using_sysemu(), read by get_using_sysemu(). */
static atomic_t using_sysemu = ATOMIC_INIT(0);
/*
 * Largest value set_using_sysemu() will accept.  While this is 0,
 * make_proc_sysemu() does not create the /proc entry.
 */
int sysemu_supported;

/*
 * Store @value as the sysemu setting, unless it is greater than
 * sysemu_supported, in which case the request is silently ignored.
 */
void set_using_sysemu(int value)
{
	if (value <= sysemu_supported)
		atomic_set(&using_sysemu, value);
}

/* Return the current sysemu setting, read with atomic_read(). */
int get_using_sysemu(void)
{
	return atomic_read(&using_sysemu);
}

/*
 * read_proc handler for the sysemu /proc entry: formats the current sysemu
 * setting as a decimal number followed by a newline.
 *
 * @buf:    output buffer
 * @size:   capacity of @buf in bytes
 * @eof:    set to 1 when the whole text fitted into @buf
 * @start, @offset, @data: unused
 *
 * Returns the number of characters stored in @buf, not counting the
 * terminating NUL.
 */
static int proc_read_sysemu(char *buf, char **start, off_t offset, int size,int *eof, void *data)
{
	int len;

	/*
	 * Without any room snprintf() stores nothing, not even a NUL, so
	 * there is no string in @buf whose length could be reported.
	 */
	if (size <= 0)
		return 0;

	len = snprintf(buf, size, "%d\n", get_using_sysemu());
	if (len < size) {
		/* No overflow */
		*eof = 1;
		return len;
	}

	/* Truncated: size - 1 characters plus the NUL were stored. */
	return size - 1;
}

A
Al Viro 已提交
399
/*
 * write_proc handler for the sysemu /proc entry.
 *
 * Only the first character written is examined: '0', '1' or '2' is handed to
 * set_using_sysemu() as the corresponding number, anything else is ignored.
 *
 * @buf:   user buffer holding the written data
 * @count: number of bytes written
 * @file, @data: unused
 *
 * Returns @count on success (0 for an empty write), or -EFAULT when the
 * first byte cannot be copied from user space.
 */
static int proc_write_sysemu(struct file *file,const char __user *buf, unsigned long count,void *data)
{
	char digit;

	/* An empty write has no first character to look at. */
	if (count == 0)
		return 0;

	if (copy_from_user(&digit, buf, 1))
		return -EFAULT;

	if (digit >= '0' && digit <= '2')
		set_using_sysemu(digit - '0');
	/* We use the first char, but pretend to write everything */
	return count;
}

/*
 * Create the "sysemu" entry under proc_root with mode 0600 and attach the
 * read/write handlers to it.  Nothing is created while sysemu_supported is
 * 0.  A failure to create the entry is only logged.
 *
 * Always returns 0.
 */
int __init make_proc_sysemu(void)
{
	struct proc_dir_entry *entry;

	if (!sysemu_supported)
		return 0;

	entry = create_proc_entry("sysemu", 0600, &proc_root);
	if (entry != NULL) {
		entry->read_proc  = proc_read_sysemu;
		entry->write_proc = proc_write_sysemu;
	} else {
		printk(KERN_WARNING "Failed to register /proc/sysemu\n");
	}

	return 0;
}

late_initcall(make_proc_sysemu);

/*
 * Report the single-step state of a task.
 *
 * @t: a struct task_struct *, or NULL to query the current task
 *
 * Returns 0 when PT_DTRACE is not set in the task's ptrace flags, 1 when it
 * is set and thread.singlestep_syscall is non-zero, and 2 when it is set and
 * singlestep_syscall is zero.
 */
int singlestepping(void * t)
{
	struct task_struct *task = t;

	if (task == NULL)
		task = current;

	if (!(task->ptrace & PT_DTRACE))
		return 0;

	return task->thread.singlestep_syscall ? 1 : 2;
}

447 448 449 450 451 452 453 454
/*
 * Only x86 and x86_64 have an arch_align_stack().
 * All other arches have "#define arch_align_stack(x) (x)"
 * in their asm/system.h
 * As this is included in UML from asm-um/system-generic.h,
 * we can use it to behave as the subarch does.
 */
#ifndef arch_align_stack
L
Linus Torvalds 已提交
455 456
unsigned long arch_align_stack(unsigned long sp)
{
J
Jeff Dike 已提交
457
	if (!(current->personality & ADDR_NO_RANDOMIZE) && randomize_va_space)
L
Linus Torvalds 已提交
458 459 460
		sp -= get_random_int() % 8192;
	return sp & ~0xf;
}
461
#endif