process.c 9.1 KB
Newer Older
L
Linus Torvalds 已提交
1
/*
2
 * This file handles the architecture dependent parts of process handling.
L
Linus Torvalds 已提交
3
 *
4 5 6 7
 *    Copyright IBM Corp. 1999,2009
 *    Author(s): Martin Schwidefsky <schwidefsky@de.ibm.com>,
 *		 Hartmut Penner <hp@de.ibm.com>,
 *		 Denis Joseph Barrow,
L
Linus Torvalds 已提交
8 9 10 11 12 13 14
 */

#include <linux/compiler.h>
#include <linux/cpu.h>
#include <linux/sched.h>
#include <linux/kernel.h>
#include <linux/mm.h>
15
#include <linux/elfcore.h>
L
Linus Torvalds 已提交
16
#include <linux/smp.h>
17
#include <linux/slab.h>
L
Linus Torvalds 已提交
18
#include <linux/interrupt.h>
19
#include <linux/tick.h>
20
#include <linux/personality.h>
21
#include <linux/syscalls.h>
22
#include <linux/compat.h>
23
#include <linux/kprobes.h>
24
#include <linux/random.h>
25
#include <linux/module.h>
L
Linus Torvalds 已提交
26 27 28 29 30
#include <asm/system.h>
#include <asm/io.h>
#include <asm/processor.h>
#include <asm/irq.h>
#include <asm/timer.h>
31
#include <asm/nmi.h>
32
#include <asm/smp.h>
33
#include "entry.h"
L
Linus Torvalds 已提交
34

35
asmlinkage void ret_from_fork(void) asm ("ret_from_fork");
L
Linus Torvalds 已提交
36 37 38 39 40 41 42 43 44 45 46

/*
 * Return saved PC of a blocked thread. used in kernel/sched.
 * resume in entry.S does not create a new stack frame, it
 * just stores the registers %r6-%r15 to the frame given by
 * schedule. We want to return the address of the caller of
 * schedule, so we have to walk the backchain one time to
 * find the frame schedule() store its return address.
 */
unsigned long thread_saved_pc(struct task_struct *tsk)
{
H
Heiko Carstens 已提交
47
	struct stack_frame *sf, *low, *high;
L
Linus Torvalds 已提交
48

H
Heiko Carstens 已提交
49 50 51 52 53 54 55 56 57 58
	if (!tsk || !task_stack_page(tsk))
		return 0;
	low = task_stack_page(tsk);
	high = (struct stack_frame *) task_pt_regs(tsk);
	sf = (struct stack_frame *) (tsk->thread.ksp & PSW_ADDR_INSN);
	if (sf <= low || sf > high)
		return 0;
	sf = (struct stack_frame *) (sf->back_chain & PSW_ADDR_INSN);
	if (sf <= low || sf > high)
		return 0;
L
Linus Torvalds 已提交
59 60 61 62 63 64
	return sf->gprs[8];
}

/*
 * The idle loop on a S390...
 */
65
static void default_idle(void)
L
Linus Torvalds 已提交
66
{
67
	if (cpu_is_offline(smp_processor_id()))
L
Linus Torvalds 已提交
68
		cpu_die();
69 70 71 72 73
	local_irq_disable();
	if (need_resched()) {
		local_irq_enable();
		return;
	}
74 75 76 77 78 79
	local_mcck_disable();
	if (test_thread_flag(TIF_MCCK_PENDING)) {
		local_mcck_enable();
		local_irq_enable();
		return;
	}
80
	trace_hardirqs_on();
81 82
	/* Don't trace preempt off for idle. */
	stop_critical_timings();
83 84 85
	/* Stop virtual timer and halt the cpu. */
	vtime_stop_cpu();
	/* Reenable preemption tracer. */
86
	start_critical_timings();
L
Linus Torvalds 已提交
87 88 89 90
}

void cpu_idle(void)
{
91
	for (;;) {
92 93
		tick_nohz_idle_enter();
		rcu_idle_enter();
94
		while (!need_resched() && !test_thread_flag(TIF_MCCK_PENDING))
95
			default_idle();
96 97
		rcu_idle_exit();
		tick_nohz_idle_exit();
98 99
		if (test_thread_flag(TIF_MCCK_PENDING))
			s390_handle_mcck();
100 101 102 103
		preempt_enable_no_resched();
		schedule();
		preempt_disable();
	}
L
Linus Torvalds 已提交
104 105
}

106
extern void __kprobes kernel_thread_starter(void);
L
Linus Torvalds 已提交
107

108
asm(
109 110
	".section .kprobes.text, \"ax\"\n"
	".global kernel_thread_starter\n"
L
Linus Torvalds 已提交
111 112 113 114
	"kernel_thread_starter:\n"
	"    la    2,0(10)\n"
	"    basr  14,9\n"
	"    la    2,0\n"
115 116
	"    br    11\n"
	".previous\n");
L
Linus Torvalds 已提交
117 118 119 120 121 122

int kernel_thread(int (*fn)(void *), void * arg, unsigned long flags)
{
	struct pt_regs regs;

	memset(&regs, 0, sizeof(regs));
123 124
	regs.psw.mask = psw_kernel_bits |
		PSW_MASK_DAT | PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK;
L
Linus Torvalds 已提交
125 126 127 128 129 130 131 132 133 134
	regs.psw.addr = (unsigned long) kernel_thread_starter | PSW_ADDR_AMODE;
	regs.gprs[9] = (unsigned long) fn;
	regs.gprs[10] = (unsigned long) arg;
	regs.gprs[11] = (unsigned long) do_exit;
	regs.orig_gpr2 = -1;

	/* Ok, create the new process.. */
	return do_fork(flags | CLONE_VM | CLONE_UNTRACED,
		       0, &regs, 0, NULL, NULL);
}
135
EXPORT_SYMBOL(kernel_thread);
L
Linus Torvalds 已提交
136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151

/*
 * Free current thread data structures etc..
 */
void exit_thread(void)
{
}

void flush_thread(void)
{
}

void release_thread(struct task_struct *dead_task)
{
}

A
Alexey Dobriyan 已提交
152
int copy_thread(unsigned long clone_flags, unsigned long new_stackp,
153 154
		unsigned long unused,
		struct task_struct *p, struct pt_regs *regs)
L
Linus Torvalds 已提交
155
{
156
	struct thread_info *ti;
157 158 159 160 161 162 163 164
	struct fake_frame
	{
		struct stack_frame sf;
		struct pt_regs childregs;
	} *frame;

	frame = container_of(task_pt_regs(p), struct fake_frame, childregs);
	p->thread.ksp = (unsigned long) frame;
L
Linus Torvalds 已提交
165
	/* Store access registers to kernel stack of new process. */
166
	frame->childregs = *regs;
L
Linus Torvalds 已提交
167
	frame->childregs.gprs[2] = 0;	/* child returns 0 on fork. */
168 169
	frame->childregs.gprs[15] = new_stackp;
	frame->sf.back_chain = 0;
L
Linus Torvalds 已提交
170

171 172
	/* new return point is ret_from_fork */
	frame->sf.gprs[8] = (unsigned long) ret_from_fork;
L
Linus Torvalds 已提交
173

174 175
	/* fake return stack for resume(), don't go back to schedule */
	frame->sf.gprs[9] = (unsigned long) frame;
L
Linus Torvalds 已提交
176 177 178 179

	/* Save access registers to new thread structure. */
	save_access_regs(&p->thread.acrs[0]);

180
#ifndef CONFIG_64BIT
181
	/*
L
Linus Torvalds 已提交
182 183 184 185 186 187 188 189 190
	 * save fprs to current->thread.fp_regs to merge them with
	 * the emulated registers and then copy the result to the child.
	 */
	save_fp_regs(&current->thread.fp_regs);
	memcpy(&p->thread.fp_regs, &current->thread.fp_regs,
	       sizeof(s390_fp_regs));
	/* Set a new TLS ?  */
	if (clone_flags & CLONE_SETTLS)
		p->thread.acrs[0] = regs->gprs[6];
191
#else /* CONFIG_64BIT */
L
Linus Torvalds 已提交
192 193 194 195
	/* Save the fpu registers to new thread structure. */
	save_fp_regs(&p->thread.fp_regs);
	/* Set a new TLS ?  */
	if (clone_flags & CLONE_SETTLS) {
H
Heiko Carstens 已提交
196
		if (is_compat_task()) {
L
Linus Torvalds 已提交
197 198 199 200 201 202
			p->thread.acrs[0] = (unsigned int) regs->gprs[6];
		} else {
			p->thread.acrs[0] = (unsigned int)(regs->gprs[6] >> 32);
			p->thread.acrs[1] = (unsigned int) regs->gprs[6];
		}
	}
203
#endif /* CONFIG_64BIT */
L
Linus Torvalds 已提交
204 205
	/* start new process with ar4 pointing to the correct address space */
	p->thread.mm_segment = get_fs();
206
	/* Don't copy debug registers */
M
Martin Schwidefsky 已提交
207 208
	memset(&p->thread.per_user, 0, sizeof(p->thread.per_user));
	memset(&p->thread.per_event, 0, sizeof(p->thread.per_event));
209
	clear_tsk_thread_flag(p, TIF_SINGLE_STEP);
M
Martin Schwidefsky 已提交
210
	clear_tsk_thread_flag(p, TIF_PER_TRAP);
211 212 213 214
	/* Initialize per thread user and system timer values */
	ti = task_thread_info(p);
	ti->user_timer = 0;
	ti->system_timer = 0;
215
	return 0;
L
Linus Torvalds 已提交
216 217
}

218
SYSCALL_DEFINE0(fork)
L
Linus Torvalds 已提交
219
{
M
Martin Schwidefsky 已提交
220 221
	struct pt_regs *regs = task_pt_regs(current);
	return do_fork(SIGCHLD, regs->gprs[15], regs, 0, NULL, NULL);
L
Linus Torvalds 已提交
222 223
}

224 225
SYSCALL_DEFINE4(clone, unsigned long, newsp, unsigned long, clone_flags,
		int __user *, parent_tidptr, int __user *, child_tidptr)
L
Linus Torvalds 已提交
226
{
M
Martin Schwidefsky 已提交
227
	struct pt_regs *regs = task_pt_regs(current);
L
Linus Torvalds 已提交
228

M
Martin Schwidefsky 已提交
229 230 231
	if (!newsp)
		newsp = regs->gprs[15];
	return do_fork(clone_flags, newsp, regs, 0,
L
Linus Torvalds 已提交
232 233 234 235 236 237 238 239 240 241 242 243 244
		       parent_tidptr, child_tidptr);
}

/*
 * This is trivial, and on the face of it looks like it
 * could equally well be done in user mode.
 *
 * Not so, for quite unobvious reasons - register pressure.
 * In user mode vfork() cannot have a stack frame, and if
 * done by calling the "clone()" system call directly, you
 * do not have enough call-clobbered registers to hold all
 * the information you need.
 */
245
SYSCALL_DEFINE0(vfork)
L
Linus Torvalds 已提交
246
{
M
Martin Schwidefsky 已提交
247
	struct pt_regs *regs = task_pt_regs(current);
L
Linus Torvalds 已提交
248
	return do_fork(CLONE_VFORK | CLONE_VM | SIGCHLD,
M
Martin Schwidefsky 已提交
249 250 251 252 253 254 255 256
		       regs->gprs[15], regs, 0, NULL, NULL);
}

asmlinkage void execve_tail(void)
{
	current->thread.fp_regs.fpc = 0;
	if (MACHINE_HAS_IEEE)
		asm volatile("sfpc %0,%0" : : "d" (0));
L
Linus Torvalds 已提交
257 258 259 260 261
}

/*
 * sys_execve() executes a new program.
 */
262 263 264
SYSCALL_DEFINE3(execve, const char __user *, name,
		const char __user *const __user *, argv,
		const char __user *const __user *, envp)
L
Linus Torvalds 已提交
265
{
M
Martin Schwidefsky 已提交
266 267
	struct pt_regs *regs = task_pt_regs(current);
	char *filename;
268
	long rc;
M
Martin Schwidefsky 已提交
269

270 271 272 273 274 275
	filename = getname(name);
	rc = PTR_ERR(filename);
	if (IS_ERR(filename))
		return rc;
	rc = do_execve(filename, argv, envp, regs);
	if (rc)
M
Martin Schwidefsky 已提交
276 277
		goto out;
	execve_tail();
278
	rc = regs->gprs[2];
L
Linus Torvalds 已提交
279
out:
280 281
	putname(filename);
	return rc;
L
Linus Torvalds 已提交
282 283 284 285 286 287 288
}

/*
 * fill in the FPU structure for a core dump.
 */
int dump_fpu (struct pt_regs * regs, s390_fp_regs *fpregs)
{
289
#ifndef CONFIG_64BIT
290
	/*
L
Linus Torvalds 已提交
291 292 293 294 295
	 * save fprs to current->thread.fp_regs to merge them with
	 * the emulated registers and then copy the result to the dump.
	 */
	save_fp_regs(&current->thread.fp_regs);
	memcpy(fpregs, &current->thread.fp_regs, sizeof(s390_fp_regs));
296
#else /* CONFIG_64BIT */
L
Linus Torvalds 已提交
297
	save_fp_regs(fpregs);
298
#endif /* CONFIG_64BIT */
L
Linus Torvalds 已提交
299 300
	return 1;
}
301
EXPORT_SYMBOL(dump_fpu);
L
Linus Torvalds 已提交
302 303 304 305 306 307 308

unsigned long get_wchan(struct task_struct *p)
{
	struct stack_frame *sf, *low, *high;
	unsigned long return_address;
	int count;

A
Al Viro 已提交
309
	if (!p || p == current || p->state == TASK_RUNNING || !task_stack_page(p))
L
Linus Torvalds 已提交
310
		return 0;
A
Al Viro 已提交
311 312
	low = task_stack_page(p);
	high = (struct stack_frame *) task_pt_regs(p);
L
Linus Torvalds 已提交
313 314 315 316 317 318 319 320 321 322 323 324 325
	sf = (struct stack_frame *) (p->thread.ksp & PSW_ADDR_INSN);
	if (sf <= low || sf > high)
		return 0;
	for (count = 0; count < 16; count++) {
		sf = (struct stack_frame *) (sf->back_chain & PSW_ADDR_INSN);
		if (sf <= low || sf > high)
			return 0;
		return_address = sf->gprs[8] & PSW_ADDR_INSN;
		if (!in_sched_functions(return_address))
			return return_address;
	}
	return 0;
}
326 327 328 329 330 331 332

unsigned long arch_align_stack(unsigned long sp)
{
	if (!(current->personality & ADDR_NO_RANDOMIZE) && randomize_va_space)
		sp -= get_random_int() & ~PAGE_MASK;
	return sp & ~0xf;
}
H
Heiko Carstens 已提交
333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350

static inline unsigned long brk_rnd(void)
{
	/* 8MB for 32bit, 1GB for 64bit */
	if (is_32bit_task())
		return (get_random_int() & 0x7ffUL) << PAGE_SHIFT;
	else
		return (get_random_int() & 0x3ffffUL) << PAGE_SHIFT;
}

unsigned long arch_randomize_brk(struct mm_struct *mm)
{
	unsigned long ret = PAGE_ALIGN(mm->brk + brk_rnd());

	if (ret < mm->brk)
		return mm->brk;
	return ret;
}
H
Heiko Carstens 已提交
351 352 353 354 355 356 357 358 359 360 361

unsigned long randomize_et_dyn(unsigned long base)
{
	unsigned long ret = PAGE_ALIGN(base + brk_rnd());

	if (!(current->flags & PF_RANDOMIZE))
		return base;
	if (ret < base)
		return base;
	return ret;
}