setup.c 23.1 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 *  arch/s390/kernel/setup.c
 *
 *  S390 version
 *    Copyright (C) 1999,2000 IBM Deutschland Entwicklung GmbH, IBM Corporation
 *    Author(s): Hartmut Penner (hp@de.ibm.com),
 *               Martin Schwidefsky (schwidefsky@de.ibm.com)
 *
 *  Derived from "arch/i386/kernel/setup.c"
 *    Copyright (C) 1995, Linus Torvalds
 */

/*
 * This file handles the architecture-dependent parts of initialization
 */

17 18 19
#define KMSG_COMPONENT "setup"
#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt

L
Linus Torvalds 已提交
20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38
#include <linux/errno.h>
#include <linux/module.h>
#include <linux/sched.h>
#include <linux/kernel.h>
#include <linux/mm.h>
#include <linux/stddef.h>
#include <linux/unistd.h>
#include <linux/ptrace.h>
#include <linux/slab.h>
#include <linux/user.h>
#include <linux/tty.h>
#include <linux/ioport.h>
#include <linux/delay.h>
#include <linux/init.h>
#include <linux/initrd.h>
#include <linux/bootmem.h>
#include <linux/root_dev.h>
#include <linux/console.h>
#include <linux/kernel_stat.h>
39
#include <linux/device.h>
40
#include <linux/notifier.h>
41
#include <linux/pfn.h>
H
Hongjie Yang 已提交
42
#include <linux/ctype.h>
43
#include <linux/reboot.h>
44
#include <linux/topology.h>
45
#include <linux/ftrace.h>
L
Linus Torvalds 已提交
46

M
Michael Holzheu 已提交
47
#include <asm/ipl.h>
L
Linus Torvalds 已提交
48 49 50 51 52 53 54
#include <asm/uaccess.h>
#include <asm/system.h>
#include <asm/smp.h>
#include <asm/mmu_context.h>
#include <asm/cpcmd.h>
#include <asm/lowcore.h>
#include <asm/irq.h>
55 56
#include <asm/page.h>
#include <asm/ptrace.h>
57
#include <asm/sections.h>
H
Hongjie Yang 已提交
58
#include <asm/ebcdic.h>
G
Gerald Schaefer 已提交
59
#include <asm/compat.h>
60
#include <asm/kvm_virtio.h>
G
Gerald Schaefer 已提交
61 62 63 64 65 66

/*
 * Default PSW mask bits used for kernel and user context. The kernel mask
 * selects PSW_ASC_PRIMARY and the user mask PSW_ASC_HOME; both values are
 * overwritten by set_amode_and_uaccess() when the address spaces are
 * switched.
 */
long psw_kernel_bits	= (PSW_BASE_BITS | PSW_MASK_DAT | PSW_ASC_PRIMARY |
			   PSW_MASK_MCHECK | PSW_DEFAULT_KEY);
long psw_user_bits	= (PSW_BASE_BITS | PSW_MASK_DAT | PSW_ASC_HOME |
			   PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK |
			   PSW_MASK_PSTATE | PSW_DEFAULT_KEY);
L
Linus Torvalds 已提交
67

68 69 70 71
/*
 * User copy operations.
 */
struct uaccess_ops uaccess;
72
EXPORT_SYMBOL(uaccess);
73

L
Linus Torvalds 已提交
74 75 76 77
/*
 * Machine setup..
 */
unsigned int console_mode = 0;
78 79
EXPORT_SYMBOL(console_mode);

L
Linus Torvalds 已提交
80
unsigned int console_devno = -1;
81 82
EXPORT_SYMBOL(console_devno);

L
Linus Torvalds 已提交
83
unsigned int console_irq = -1;
84 85
EXPORT_SYMBOL(console_irq);

86 87
/*
 * ELF hardware capability bits and platform name. Both are filled in by
 * setup_hwcaps() during setup_arch().
 */
unsigned long elf_hwcap = 0;
char elf_platform[ELF_PLATFORM_SIZE];
88

89
struct mem_chunk __initdata memory_chunk[MEMORY_CHUNKS];
L
Linus Torvalds 已提交
90
volatile int __cpu_logical_map[NR_CPUS]; /* logical cpu to cpu address */
91 92 93

/*
 * memory_end is the requested upper memory limit; it is set by the "mem="
 * early parameter (early_parse_mem) or forced for zfcpdump, in which case
 * memory_end_set is set to 1. setup_memory_end() page-aligns and clamps it,
 * and falls back to the end of the detected chunks when it is still zero.
 */
int __initdata memory_end_set;
unsigned long __initdata memory_end;
L
Linus Torvalds 已提交
94

F
Frank Munzert 已提交
95 96 97 98
/* An array with a pointer to the lowcore of every CPU. */
struct _lowcore *lowcore_ptr[NR_CPUS];
EXPORT_SYMBOL(lowcore_ptr);

L
Linus Torvalds 已提交
99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119
/*
 * This is set up by the setup-routine at boot-time
 * for S390 need to find out, what we have to setup
 * using address 0x10400 ...
 */

#include <asm/setup.h>

/*
 * Resource descriptors for the kernel image. Their start/end addresses are
 * filled in by setup_resources() from _text/_etext/_edata before they are
 * inserted below the matching memory chunk resource.
 */
static struct resource code_resource = {
	.name  = "Kernel code",
	.flags = IORESOURCE_BUSY | IORESOURCE_MEM,
};

static struct resource data_resource = {
	.name = "Kernel data",
	.flags = IORESOURCE_BUSY | IORESOURCE_MEM,
};

/*
 * cpu_init() initializes state that is per-CPU.
 */
H
Heiko Carstens 已提交
120
void __cpuinit cpu_init(void)
L
Linus Torvalds 已提交
121 122 123 124
{
        /*
         * Store processor id in lowcore (used e.g. in timer_interrupt)
         */
125
	get_cpu_id(&S390_lowcore.cpu_id);
L
Linus Torvalds 已提交
126 127 128 129 130 131 132 133 134

        /*
         * Force FPU initialization:
         */
        clear_thread_flag(TIF_USEDFPU);
        clear_used_math();

	atomic_inc(&init_mm.mm_count);
	current->active_mm = &init_mm;
S
Stoyan Gaydarov 已提交
135
	BUG_ON(current->mm);
L
Linus Torvalds 已提交
136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156
        enter_lazy_tlb(&init_mm, current);
}

/*
 * condev= and conmode= setup parameter.
 */

/*
 * Handler for the "condev=" kernel parameter.
 *
 * @str: textual device number (base auto-detected by simple_strtoul).
 *
 * A value in the range 0..65535 becomes the console device number and
 * resets console_irq to -1; anything else is ignored. Always returns 1.
 */
static int __init condev_setup(char *str)
{
	int devno = simple_strtoul(str, &str, 0);

	/* Ignore values that do not fit into a 16 bit device number. */
	if (devno < 0 || devno >= 65536)
		return 1;

	console_devno = devno;
	console_irq = -1;
	return 1;
}

__setup("condev=", condev_setup);

157 158
/*
 * Register the preferred console matching the machine type / console mode:
 * "hvc" under KVM, "ttyS" for 3215 or SCLP, "tty3270" for 3270. Nothing is
 * registered when none of the conditions holds.
 */
static void __init set_preferred_console(void)
{
	if (MACHINE_IS_KVM) {
		add_preferred_console("hvc", 0, NULL);
		return;
	}
	if (CONSOLE_IS_3215 || CONSOLE_IS_SCLP) {
		add_preferred_console("ttyS", 0, NULL);
		return;
	}
	if (CONSOLE_IS_3270)
		add_preferred_console("tty3270", 0, NULL);
}

L
Linus Torvalds 已提交
167 168
/*
 * Handler for the "conmode=" kernel parameter.
 *
 * @str: requested console mode ("hwc", "sclp", "3215" or "3270").
 *
 * Only modes whose driver is configured are honoured; the comparison
 * lengths include the terminating NUL, so the whole string must match.
 * The preferred console is re-evaluated afterwards. Always returns 1.
 */
static int __init conmode_setup(char *str)
{
#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
	if (!strncmp(str, "hwc", 4) || !strncmp(str, "sclp", 5)) {
		SET_CONSOLE_SCLP;
	}
#endif
#if defined(CONFIG_TN3215_CONSOLE)
	if (!strncmp(str, "3215", 5)) {
		SET_CONSOLE_3215;
	}
#endif
#if defined(CONFIG_TN3270_CONSOLE)
	if (!strncmp(str, "3270", 5)) {
		SET_CONSOLE_3270;
	}
#endif
	set_preferred_console();
	return 1;
}

__setup("conmode=", conmode_setup);

/*
 * Pick the default console mode.
 *
 * When running under VM the console device number, its subchannel and the
 * terminal CONMODE are queried through CP commands and the console mode is
 * chosen from the configured drivers accordingly. In all other cases the
 * SCLP console is selected if it is configured.
 */
static void __init conmode_default(void)
{
	char query_buffer[1024];
	char *ptr;

	if (MACHINE_IS_VM) {
		cpcmd("QUERY CONSOLE", query_buffer, 1024, NULL);
		console_devno = simple_strtoul(query_buffer + 5, NULL, 16);
		ptr = strstr(query_buffer, "SUBCHANNEL =");
		/*
		 * Do not dereference a NULL based pointer if the response
		 * lacks the subchannel token; console_irq then keeps its
		 * previous value.
		 */
		if (ptr != NULL)
			console_irq = simple_strtoul(ptr + 13, NULL, 16);
		cpcmd("QUERY TERM", query_buffer, 1024, NULL);
		ptr = strstr(query_buffer, "CONMODE");
		/*
		 * Set the conmode to 3215 so that the device recognition
		 * will set the cu_type of the console to 3215. If the
		 * conmode is 3270 and we don't set it back then both
		 * 3215 and the 3270 driver will try to access the console
		 * device (3215 as console and 3270 as normal tty).
		 */
		cpcmd("TERM CONMODE 3215", NULL, 0, NULL);
		if (ptr == NULL) {
#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
			SET_CONSOLE_SCLP;
#endif
			return;
		}
		/* Prefer the reported mode, then fall back to what is built in. */
		if (strncmp(ptr + 8, "3270", 4) == 0) {
#if defined(CONFIG_TN3270_CONSOLE)
			SET_CONSOLE_3270;
#elif defined(CONFIG_TN3215_CONSOLE)
			SET_CONSOLE_3215;
#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
			SET_CONSOLE_SCLP;
#endif
		} else if (strncmp(ptr + 8, "3215", 4) == 0) {
#if defined(CONFIG_TN3215_CONSOLE)
			SET_CONSOLE_3215;
#elif defined(CONFIG_TN3270_CONSOLE)
			SET_CONSOLE_3270;
#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
			SET_CONSOLE_SCLP;
#endif
		}
	} else {
#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
		SET_CONSOLE_SCLP;
#endif
	}
}

237
#ifdef CONFIG_ZFCPDUMP
/*
 * Prepare the kernel for running as zfcpdump dumper.
 *
 * @console_devno: device number of the console, or -1 if there is none.
 *
 * Does nothing unless the system was IPLed as FCP dump. Otherwise a
 * "cio_ignore=" option that only leaves the IPL device (and the console,
 * if known) accessible is appended to the boot command line and the
 * console log level is lowered to 2.
 */
static void __init setup_zfcpdump(unsigned int console_devno)
{
	static char str[41];

	if (ipl_info.type != IPL_TYPE_FCP_DUMP)
		return;
	/* Bounded formatting: never write past the end of str. */
	if (console_devno != -1)
		snprintf(str, sizeof(str),
			 " cio_ignore=all,!0.0.%04x,!0.0.%04x",
			 ipl_info.data.fcp.dev_id.devno, console_devno);
	else
		snprintf(str, sizeof(str), " cio_ignore=all,!0.0.%04x",
			 ipl_info.data.fcp.dev_id.devno);
	/* Bounded append: an almost full command line must not overflow. */
	strlcat(boot_command_line, str, COMMAND_LINE_SIZE);
	console_loglevel = 2;
}
#else
static inline void setup_zfcpdump(unsigned int console_devno) {}
#endif /* CONFIG_ZFCPDUMP */

L
Linus Torvalds 已提交
257 258 259 260 261 262 263
/*
 * Reboot, halt and power_off stubs. They unblank the console when that is
 * safe and then call _machine_restart, _machine_halt or _machine_power_off.
 */

void machine_restart(char *command)
{
264
	if ((!in_interrupt() && !in_atomic()) || oops_in_progress)
265 266 267 268 269
		/*
		 * Only unblank the console if we are called in enabled
		 * context or a bust_spinlocks cleared the way for us.
		 */
		console_unblank();
L
Linus Torvalds 已提交
270 271 272 273 274
	_machine_restart(command);
}

void machine_halt(void)
{
275 276 277 278 279 280
	if (!in_interrupt() || oops_in_progress)
		/*
		 * Only unblank the console if we are called in enabled
		 * context or a bust_spinlocks cleared the way for us.
		 */
		console_unblank();
L
Linus Torvalds 已提交
281 282 283 284 285
	_machine_halt();
}

void machine_power_off(void)
{
286 287 288 289 290 291
	if (!in_interrupt() || oops_in_progress)
		/*
		 * Only unblank the console if we are called in enabled
		 * context or a bust_spinlocks cleared the way for us.
		 */
		console_unblank();
L
Linus Torvalds 已提交
292 293 294
	_machine_power_off();
}

295 296 297 298 299
/*
 * Dummy power off function.
 */
void (*pm_power_off)(void) = machine_power_off;

300 301 302
/*
 * Handler for the "mem=" early parameter: stores the parsed size in
 * memory_end and records that a limit was given. Always returns 0.
 */
static int __init early_parse_mem(char *p)
{
	char *rest = p;

	memory_end = memparse(p, &rest);
	memory_end_set = 1;
	return 0;
}
early_param("mem", early_parse_mem);

G
Gerald Schaefer 已提交
308 309 310 311
#ifdef CONFIG_S390_SWITCH_AMODE
unsigned int switch_amode = 0;
EXPORT_SYMBOL_GPL(switch_amode);

312 313
static int set_amode_and_uaccess(unsigned long user_amode,
				 unsigned long user32_amode)
G
Gerald Schaefer 已提交
314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330
{
	psw_user_bits = PSW_BASE_BITS | PSW_MASK_DAT | user_amode |
			PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK |
			PSW_MASK_PSTATE | PSW_DEFAULT_KEY;
#ifdef CONFIG_COMPAT
	psw_user32_bits = PSW_BASE32_BITS | PSW_MASK_DAT | user_amode |
			  PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK |
			  PSW_MASK_PSTATE | PSW_DEFAULT_KEY;
	psw32_user_bits = PSW32_BASE_BITS | PSW32_MASK_DAT | user32_amode |
			  PSW32_MASK_IO | PSW32_MASK_EXT | PSW32_MASK_MCHECK |
			  PSW32_MASK_PSTATE;
#endif
	psw_kernel_bits = PSW_BASE_BITS | PSW_MASK_DAT | PSW_ASC_HOME |
			  PSW_MASK_MCHECK | PSW_DEFAULT_KEY;

	if (MACHINE_HAS_MVCOS) {
		memcpy(&uaccess, &uaccess_mvcos_switch, sizeof(uaccess));
331
		return 1;
G
Gerald Schaefer 已提交
332 333
	} else {
		memcpy(&uaccess, &uaccess_pt, sizeof(uaccess));
334
		return 0;
G
Gerald Schaefer 已提交
335 336 337 338 339 340 341 342 343 344 345 346 347 348
	}
}

/*
 * Handler for the "switch_amode" early parameter: its presence alone
 * requests switched kernel/user addressing modes, the value in @p is not
 * looked at. Always returns 0.
 */
static int __init early_parse_switch_amode(char *p)
{
	switch_amode = 1;
	return 0;
}
early_param("switch_amode", early_parse_switch_amode);

#else /* CONFIG_S390_SWITCH_AMODE */
349 350
/*
 * Stub used without CONFIG_S390_SWITCH_AMODE: nothing is changed and 0
 * is returned.
 */
static inline int set_amode_and_uaccess(unsigned long user_amode,
					unsigned long user32_amode)
{
	return 0;
}
#endif /* CONFIG_S390_SWITCH_AMODE */

#ifdef CONFIG_S390_EXEC_PROTECT
unsigned int s390_noexec = 0;
EXPORT_SYMBOL_GPL(s390_noexec);

/*
 * Handler for the "noexec" early parameter. Unless the value starts with
 * "off", execute protection is requested, which also implies switched
 * address spaces. Always returns 0.
 */
static int __init early_parse_noexec(char *p)
{
	if (strncmp(p, "off", 3) != 0) {
		switch_amode = 1;
		s390_noexec = 1;
	}
	return 0;
}
early_param("noexec", early_parse_noexec);
#endif /* CONFIG_S390_EXEC_PROTECT */

static void setup_addressing_mode(void)
{
	if (s390_noexec) {
377 378 379 380 381 382 383
		if (set_amode_and_uaccess(PSW_ASC_SECONDARY,
					  PSW32_ASC_SECONDARY))
			pr_info("Execute protection active, "
				"mvcos available\n");
		else
			pr_info("Execute protection active, "
				"mvcos not available\n");
384
	} else if (switch_amode) {
385 386 387 388 389 390
		if (set_amode_and_uaccess(PSW_ASC_PRIMARY, PSW32_ASC_PRIMARY))
			pr_info("Address spaces switched, "
				"mvcos available\n");
		else
			pr_info("Address spaces switched, "
				"mvcos not available\n");
G
Gerald Schaefer 已提交
391
	}
392 393 394 395
#ifdef CONFIG_TRACE_IRQFLAGS
	sysc_restore_trace_psw.mask = psw_kernel_bits & ~PSW_MASK_MCHECK;
	io_restore_trace_psw.mask = psw_kernel_bits & ~PSW_MASK_MCHECK;
#endif
G
Gerald Schaefer 已提交
396 397
}

398 399 400 401 402 403 404 405 406 407 408 409 410
/*
 * Allocate and initialize the lowcore of the boot CPU.
 *
 * The new lowcore gets the new-PSWs for all interruption classes, the
 * kernel/async/panic stacks and copies of the timer, machine flag and
 * ftrace values from the current lowcore. Finally it is made the active
 * lowcore through set_prefix() and recorded in lowcore_ptr[0].
 */
static void __init
setup_lowcore(void)
{
	/* Two pages if pointers are 8 bytes wide, one page otherwise. */
	unsigned long lc_size = (sizeof(void *) == 8 ? 2 : 1) * PAGE_SIZE;
	struct _lowcore *lc;

	/*
	 * Setup lowcore for boot cpu
	 */
	lc = (struct _lowcore *) __alloc_bootmem(lc_size, lc_size, 0);
	memset(lc, 0, lc_size);

	/* Restart PSW */
	lc->restart_psw.mask = PSW_BASE_BITS | PSW_DEFAULT_KEY;
	lc->restart_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) restart_int_handler;
	if (switch_amode)
		lc->restart_psw.mask |= PSW_ASC_HOME;

	/* New PSWs for the interruption classes */
	lc->external_new_psw.mask = psw_kernel_bits;
	lc->external_new_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) ext_int_handler;
	lc->svc_new_psw.mask = psw_kernel_bits | PSW_MASK_IO | PSW_MASK_EXT;
	lc->svc_new_psw.addr = PSW_ADDR_AMODE | (unsigned long) system_call;
	lc->program_new_psw.mask = psw_kernel_bits;
	lc->program_new_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) pgm_check_handler;
	lc->mcck_new_psw.mask =
		psw_kernel_bits & ~PSW_MASK_MCHECK & ~PSW_MASK_DAT;
	lc->mcck_new_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) mcck_int_handler;
	lc->io_new_psw.mask = psw_kernel_bits;
	lc->io_new_psw.addr = PSW_ADDR_AMODE | (unsigned long) io_int_handler;

	lc->clock_comparator = -1ULL;

	/* Stacks: each pointer refers to the end of its area. */
	lc->kernel_stack = ((unsigned long) &init_thread_union) + THREAD_SIZE;
	lc->async_stack = (unsigned long)
		__alloc_bootmem(ASYNC_SIZE, ASYNC_SIZE, 0) + ASYNC_SIZE;
	lc->panic_stack = (unsigned long)
		__alloc_bootmem(PAGE_SIZE, PAGE_SIZE, 0) + PAGE_SIZE;

	lc->current_task = (unsigned long) init_thread_union.thread_info.task;
	lc->thread_info = (unsigned long) &init_thread_union;
	lc->machine_flags = S390_lowcore.machine_flags;
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE) {
		lc->extended_save_area_addr = (__u32)
			__alloc_bootmem(PAGE_SIZE, PAGE_SIZE, 0);
		/* enable extended save area */
		__ctl_set_bit(14, 29);
	}
#else
	lc->vdso_per_cpu_data = (unsigned long) &lc->paste[0];
#endif

	/* Carry over the accounting values collected so far. */
	lc->sync_enter_timer = S390_lowcore.sync_enter_timer;
	lc->async_enter_timer = S390_lowcore.async_enter_timer;
	lc->exit_timer = S390_lowcore.exit_timer;
	lc->user_timer = S390_lowcore.user_timer;
	lc->system_timer = S390_lowcore.system_timer;
	lc->steal_timer = S390_lowcore.steal_timer;
	lc->last_update_timer = S390_lowcore.last_update_timer;
	lc->last_update_clock = S390_lowcore.last_update_clock;
	lc->ftrace_func = S390_lowcore.ftrace_func;

	/* Activate the new lowcore. */
	set_prefix((u32)(unsigned long) lc);
	lowcore_ptr[0] = lc;
}

static void __init
setup_resources(void)
{
H
Hongjie Yang 已提交
465
	struct resource *res, *sub_res;
466 467
	int i;

468 469 470 471 472
	code_resource.start = (unsigned long) &_text;
	code_resource.end = (unsigned long) &_etext - 1;
	data_resource.start = (unsigned long) &_etext;
	data_resource.end = (unsigned long) &_edata - 1;

473 474 475
	for (i = 0; i < MEMORY_CHUNKS; i++) {
		if (!memory_chunk[i].size)
			continue;
476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491
		res = alloc_bootmem_low(sizeof(struct resource));
		res->flags = IORESOURCE_BUSY | IORESOURCE_MEM;
		switch (memory_chunk[i].type) {
		case CHUNK_READ_WRITE:
			res->name = "System RAM";
			break;
		case CHUNK_READ_ONLY:
			res->name = "System ROM";
			res->flags |= IORESOURCE_READONLY;
			break;
		default:
			res->name = "reserved";
		}
		res->start = memory_chunk[i].addr;
		res->end = memory_chunk[i].addr +  memory_chunk[i].size - 1;
		request_resource(&iomem_resource, res);
H
Hongjie Yang 已提交
492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523

		if (code_resource.start >= res->start  &&
			code_resource.start <= res->end &&
			code_resource.end > res->end) {
			sub_res = alloc_bootmem_low(sizeof(struct resource));
			memcpy(sub_res, &code_resource,
				sizeof(struct resource));
			sub_res->end = res->end;
			code_resource.start = res->end + 1;
			request_resource(res, sub_res);
		}

		if (code_resource.start >= res->start &&
			code_resource.start <= res->end &&
			code_resource.end <= res->end)
			request_resource(res, &code_resource);

		if (data_resource.start >= res->start &&
			data_resource.start <= res->end &&
			data_resource.end > res->end) {
			sub_res = alloc_bootmem_low(sizeof(struct resource));
			memcpy(sub_res, &data_resource,
				sizeof(struct resource));
			sub_res->end = res->end;
			data_resource.start = res->end + 1;
			request_resource(res, sub_res);
		}

		if (data_resource.start >= res->start &&
			data_resource.start <= res->end &&
			data_resource.end <= res->end)
			request_resource(res, &data_resource);
524 525 526
	}
}

M
Michael Holzheu 已提交
527 528 529
/*
 * Highest end address (addr + size) found over all memory chunks; updated
 * in setup_memory_end() before the chunks are clipped to the memory limit.
 */
unsigned long real_memory_size;
EXPORT_SYMBOL_GPL(real_memory_size);

H
Heiko Carstens 已提交
530 531
/*
 * Determine the usable end of memory and trim the memory chunks.
 *
 * memory_end (from "mem=" or forced for zfcpdump) is page aligned and
 * limited to VMEM_MAX_PHYS. All chunks are shrunk to the alignment used
 * below, chunks above the limit are cleared and chunks crossing it are
 * cut. Without an explicit limit memory_end becomes the end of the
 * highest remaining chunk.
 */
static void __init setup_memory_end(void)
{
	const unsigned long align = 1UL << (MAX_ORDER + PAGE_SHIFT - 1);
	unsigned long memory_size = 0;
	unsigned long max_mem;
	struct mem_chunk *chunk;
	int i;

#ifdef CONFIG_ZFCPDUMP
	if (ipl_info.type == IPL_TYPE_FCP_DUMP) {
		memory_end = ZFCPDUMP_HSA_SIZE;
		memory_end_set = 1;
	}
#endif
	memory_end &= PAGE_MASK;

	if (memory_end)
		max_mem = min(VMEM_MAX_PHYS, memory_end);
	else
		max_mem = VMEM_MAX_PHYS;
	memory_end = min(max_mem, memory_end);

	/*
	 * Make sure all chunks are MAX_ORDER aligned so we don't need the
	 * extra checks that HOLES_IN_ZONE would require.
	 */
	for (i = 0; i < MEMORY_CHUNKS; i++) {
		unsigned long lo, hi;

		chunk = &memory_chunk[i];
		lo = (chunk->addr + align - 1) & ~(align - 1);
		hi = (chunk->addr + chunk->size) & ~(align - 1);
		if (lo >= hi) {
			/* Nothing left after alignment: drop the chunk. */
			memset(chunk, 0, sizeof(*chunk));
			continue;
		}
		chunk->addr = lo;
		chunk->size = hi - lo;
	}

	/* Clip the chunks to max_mem and find the highest used address. */
	for (i = 0; i < MEMORY_CHUNKS; i++) {
		chunk = &memory_chunk[i];

		real_memory_size = max(real_memory_size,
				       chunk->addr + chunk->size);
		if (chunk->addr >= max_mem) {
			memset(chunk, 0, sizeof(*chunk));
			continue;
		}
		if (chunk->addr + chunk->size > max_mem)
			chunk->size = max_mem - chunk->addr;
		memory_size = max(memory_size, chunk->addr + chunk->size);
	}

	if (!memory_end)
		memory_end = memory_size;
}

586 587 588 589
/*
 * Set up the boot-time memory allocator.
 *
 * The bootmem bitmap is placed right behind the kernel image. An initrd
 * that would be overwritten by the bitmap is moved out of the way first
 * (or disabled if it no longer fits below memory_end). All read/write
 * memory chunks are registered as active ranges and get the default
 * storage key, then the lowcore/head area, the kernel image, the bitmap
 * itself and the initrd are reserved.
 */
static void __init
setup_memory(void)
{
	unsigned long bootmap_size;
	unsigned long start_pfn, end_pfn;
	int i;

	/*
	 * partially used pages are not usable - thus
	 * we are rounding upwards:
	 */
	start_pfn = PFN_UP(__pa(&_end));
	end_pfn = max_pfn = PFN_DOWN(memory_end);

#ifdef CONFIG_BLK_DEV_INITRD
	/*
	 * Move the initrd in case the bitmap of the bootmem allocator
	 * would overwrite it.
	 */

	if (INITRD_START && INITRD_SIZE) {
		unsigned long bmap_size;
		unsigned long start;

		bmap_size = bootmem_bootmap_pages(end_pfn - start_pfn + 1);
		bmap_size = PFN_PHYS(bmap_size);

		if (PFN_PHYS(start_pfn) + bmap_size > INITRD_START) {
			/* New location: behind the bitmap plus one page. */
			start = PFN_PHYS(start_pfn) + bmap_size + PAGE_SIZE;

			if (start + INITRD_SIZE > memory_end) {
				pr_err("initrd extends beyond end of "
				       "memory (0x%08lx > 0x%08lx) "
				       "disabling initrd\n",
				       start + INITRD_SIZE, memory_end);
				INITRD_START = INITRD_SIZE = 0;
			} else {
				pr_info("Moving initrd (0x%08lx -> "
					"0x%08lx, size: %ld)\n",
					INITRD_START, start, INITRD_SIZE);
				memmove((void *) start, (void *) INITRD_START,
					INITRD_SIZE);
				INITRD_START = start;
			}
		}
	}
#endif

	/*
	 * Initialize the boot-time allocator
	 */
	bootmap_size = init_bootmem(start_pfn, end_pfn);

	/*
	 * Register RAM areas with the bootmem allocator.
	 */

	for (i = 0; i < MEMORY_CHUNKS && memory_chunk[i].size > 0; i++) {
		unsigned long start_chunk, end_chunk, pfn;

		if (memory_chunk[i].type != CHUNK_READ_WRITE)
			continue;
		start_chunk = PFN_DOWN(memory_chunk[i].addr);
		end_chunk = start_chunk + PFN_DOWN(memory_chunk[i].size);
		end_chunk = min(end_chunk, end_pfn);
		if (start_chunk >= end_chunk)
			continue;
		add_active_range(0, start_chunk, end_chunk);
		/* Storage keys are only set for pages behind the kernel image. */
		pfn = max(start_chunk, start_pfn);
		for (; pfn < end_chunk; pfn++)
			page_set_storage_key(PFN_PHYS(pfn), PAGE_DEFAULT_KEY);
	}

	psw_set_key(PAGE_DEFAULT_KEY);

	free_bootmem_with_active_regions(0, max_pfn);

	/*
	 * Reserve memory used for lowcore/command line/kernel image.
	 */
	reserve_bootmem(0, (unsigned long)_ehead, BOOTMEM_DEFAULT);
	reserve_bootmem((unsigned long)_stext,
			PFN_PHYS(start_pfn) - (unsigned long)_stext,
			BOOTMEM_DEFAULT);
	/*
	 * Reserve the bootmem bitmap itself as well. We do this in two
	 * steps (first step was init_bootmem()) because this catches
	 * the (very unlikely) case of us accidentally initializing the
	 * bootmem allocator with an invalid RAM area.
	 */
	reserve_bootmem(start_pfn << PAGE_SHIFT, bootmap_size,
			BOOTMEM_DEFAULT);

#ifdef CONFIG_BLK_DEV_INITRD
	if (INITRD_START && INITRD_SIZE) {
		if (INITRD_START + INITRD_SIZE <= memory_end) {
			reserve_bootmem(INITRD_START, INITRD_SIZE,
					BOOTMEM_DEFAULT);
			initrd_start = INITRD_START;
			initrd_end = initrd_start + INITRD_SIZE;
		} else {
			/*
			 * Report the real end of the initrd: initrd_start
			 * has not been assigned on this path, so the
			 * address must be derived from INITRD_START.
			 */
			pr_err("initrd extends beyond end of "
			       "memory (0x%08lx > 0x%08lx) "
			       "disabling initrd\n",
			       INITRD_START + INITRD_SIZE, memory_end);
			initrd_start = initrd_end = 0;
		}
	}
#endif
}
L
Linus Torvalds 已提交
696

697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717
/*
 * Setup hardware capabilities: derive elf_hwcap from the facility lists
 * and machine flags, and elf_platform from the machine type in the CPU id.
 */
static void __init setup_hwcaps(void)
{
	static const int stfl_bits[6] = { 0, 2, 7, 17, 19, 21 };
	unsigned long long stfle_word;
	unsigned int stfl_word;
	int bit;

	stfl_word = stfl();
	/*
	 * The store facility list bits numbers as found in the principles
	 * of operation are numbered with bit 1UL<<31 as number 0 to
	 * bit 1UL<<0 as number 31.
	 *   Bit 0: instructions named N3, "backported" to esa-mode
	 *   Bit 2: z/Architecture mode is active
	 *   Bit 7: the store-facility-list-extended facility is installed
	 *   Bit 17: the message-security assist is installed
	 *   Bit 19: the long-displacement facility is installed
	 *   Bit 21: the extended-immediate facility is installed
	 *   Bit 22: extended-translation facility 3 is installed
	 *   Bit 30: extended-translation facility 3 enhancement facility
	 * These get translated to:
	 *   HWCAP_S390_ESAN3 bit 0, HWCAP_S390_ZARCH bit 1,
	 *   HWCAP_S390_STFLE bit 2, HWCAP_S390_MSA bit 3,
	 *   HWCAP_S390_LDISP bit 4, HWCAP_S390_EIMM bit 5 and
	 *   HWCAP_S390_ETF3EH bit 8 (22 && 30).
	 */
	for (bit = 0; bit < 6; bit++) {
		if (stfl_word & (1UL << (31 - stfl_bits[bit])))
			elf_hwcap |= 1UL << bit;
	}

	if (stfl_word & (1UL << (31 - 22))) {
		if (stfl_word & (1UL << (31 - 30)))
			elf_hwcap |= HWCAP_S390_ETF3EH;
	}

	/*
	 * Check for additional facilities with store-facility-list-extended.
	 * stfle stores doublewords (8 byte) with bit 1ULL<<63 as bit 0
	 * and 1ULL<<0 as bit 63. Bits 0-31 contain the same information
	 * as stored by stfl, bits 32-xxx contain additional facilities.
	 * How many facility words are stored depends on the number of
	 * doublewords passed to the instruction. The additional facilities
	 * are:
	 *   Bit 42: decimal floating point facility is installed
	 *   Bit 44: perform floating point operation facility is installed
	 * translated to:
	 *   HWCAP_S390_DFP bit 6 (42 && 44).
	 */
	if (elf_hwcap & (1UL << 2)) {
		if (__stfle(&stfle_word, 1) > 0) {
			if ((stfle_word & (1ULL << (63 - 42))) &&
			    (stfle_word & (1ULL << (63 - 44))))
				elf_hwcap |= HWCAP_S390_DFP;
		}
	}

	/*
	 * Huge page support HWCAP_S390_HPAGE is bit 7.
	 */
	if (MACHINE_HAS_HPAGE)
		elf_hwcap |= HWCAP_S390_HPAGE;

	/*
	 * 64-bit register support for 31-bit processes
	 * HWCAP_S390_HIGH_GPRS is bit 9.
	 */
	elf_hwcap |= HWCAP_S390_HIGH_GPRS;

	/* Map the machine type to the ELF platform name. */
	switch (S390_lowcore.cpu_id.machine) {
	case 0x9672:
#if !defined(CONFIG_64BIT)
	default:	/* Use "g5" as default for 31 bit kernels. */
#endif
		strcpy(elf_platform, "g5");
		break;
	case 0x2064:
	case 0x2066:
#if defined(CONFIG_64BIT)
	default:	/* Use "z900" as default for 64 bit kernels. */
#endif
		strcpy(elf_platform, "z900");
		break;
	case 0x2084:
	case 0x2086:
		strcpy(elf_platform, "z990");
		break;
	case 0x2094:
	case 0x2096:
		strcpy(elf_platform, "z9-109");
		break;
	case 0x2097:
	case 0x2098:
		strcpy(elf_platform, "z10");
		break;
	}
}

795 796 797 798
/*
 * Setup function called from init/main.c just after the banner
 * was printed.
 */
L
Linus Torvalds 已提交
799

800 801 802
void __init
setup_arch(char **cmdline_p)
{
L
Linus Torvalds 已提交
803
        /*
804
         * print what head.S has found out about the machine
L
Linus Torvalds 已提交
805
         */
806
#ifndef CONFIG_64BIT
807 808 809 810 811 812 813 814 815 816 817
	if (MACHINE_IS_VM)
		pr_info("Linux is running as a z/VM "
			"guest operating system in 31-bit mode\n");
	else
		pr_info("Linux is running natively in 31-bit mode\n");
	if (MACHINE_HAS_IEEE)
		pr_info("The hardware system has IEEE compatible "
			"floating point units\n");
	else
		pr_info("The hardware system has no IEEE compatible "
			"floating point units\n");
818
#else /* CONFIG_64BIT */
819
	if (MACHINE_IS_VM)
820 821
		pr_info("Linux is running as a z/VM "
			"guest operating system in 64-bit mode\n");
822
	else if (MACHINE_IS_KVM)
823
		pr_info("Linux is running under KVM in 64-bit mode\n");
824
	else
825
		pr_info("Linux is running natively in 64-bit mode\n");
826
#endif /* CONFIG_64BIT */
827

828 829 830
	/* Have one command line that is parsed and saved in /proc/cmdline */
	/* boot_command_line has been already set up in early.c */
	*cmdline_p = boot_command_line;
831

832
        ROOT_DEV = Root_RAM0;
833 834 835 836 837 838

	init_mm.start_code = PAGE_OFFSET;
	init_mm.end_code = (unsigned long) &_etext;
	init_mm.end_data = (unsigned long) &_edata;
	init_mm.brk = (unsigned long) &_end;

839 840 841 842 843
	if (MACHINE_HAS_MVCOS)
		memcpy(&uaccess, &uaccess_mvcos, sizeof(uaccess));
	else
		memcpy(&uaccess, &uaccess_std, sizeof(uaccess));

844 845
	parse_early_param();

846
	setup_ipl();
H
Heiko Carstens 已提交
847
	setup_memory_end();
G
Gerald Schaefer 已提交
848
	setup_addressing_mode();
849 850 851 852
	setup_memory();
	setup_resources();
	setup_lowcore();

L
Linus Torvalds 已提交
853
        cpu_init();
854
	__cpu_logical_map[0] = stap();
855
	s390_init_cpu_topology();
L
Linus Torvalds 已提交
856

857 858 859 860 861
	/*
	 * Setup capabilities (ELF_HWCAP & ELF_PLATFORM).
	 */
	setup_hwcaps();

L
Linus Torvalds 已提交
862 863 864 865 866 867 868
	/*
	 * Create kernel page tables and switch to virtual addressing.
	 */
        paging_init();

        /* Setup default console */
	conmode_default();
869
	set_preferred_console();
M
Michael Holzheu 已提交
870 871 872

	/* Setup zfcpdump support */
	setup_zfcpdump(console_devno);
L
Linus Torvalds 已提交
873
}