setup.c 23.0 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 *  arch/s390/kernel/setup.c
 *
 *  S390 version
 *    Copyright (C) 1999,2000 IBM Deutschland Entwicklung GmbH, IBM Corporation
 *    Author(s): Hartmut Penner (hp@de.ibm.com),
 *               Martin Schwidefsky (schwidefsky@de.ibm.com)
 *
 *  Derived from "arch/i386/kernel/setup.c"
 *    Copyright (C) 1995, Linus Torvalds
 */

/*
 * This file handles the architecture-dependent parts of initialization
 */

17 18 19
#define KMSG_COMPONENT "setup"
#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt

L
Linus Torvalds 已提交
20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37
#include <linux/errno.h>
#include <linux/module.h>
#include <linux/sched.h>
#include <linux/kernel.h>
#include <linux/mm.h>
#include <linux/stddef.h>
#include <linux/unistd.h>
#include <linux/ptrace.h>
#include <linux/user.h>
#include <linux/tty.h>
#include <linux/ioport.h>
#include <linux/delay.h>
#include <linux/init.h>
#include <linux/initrd.h>
#include <linux/bootmem.h>
#include <linux/root_dev.h>
#include <linux/console.h>
#include <linux/kernel_stat.h>
38
#include <linux/device.h>
39
#include <linux/notifier.h>
40
#include <linux/pfn.h>
H
Hongjie Yang 已提交
41
#include <linux/ctype.h>
42
#include <linux/reboot.h>
43
#include <linux/topology.h>
44
#include <linux/ftrace.h>
L
Linus Torvalds 已提交
45

M
Michael Holzheu 已提交
46
#include <asm/ipl.h>
L
Linus Torvalds 已提交
47 48 49 50 51 52 53
#include <asm/uaccess.h>
#include <asm/system.h>
#include <asm/smp.h>
#include <asm/mmu_context.h>
#include <asm/cpcmd.h>
#include <asm/lowcore.h>
#include <asm/irq.h>
54 55
#include <asm/page.h>
#include <asm/ptrace.h>
56
#include <asm/sections.h>
H
Hongjie Yang 已提交
57
#include <asm/ebcdic.h>
G
Gerald Schaefer 已提交
58
#include <asm/compat.h>
59
#include <asm/kvm_virtio.h>
G
Gerald Schaefer 已提交
60 61 62 63 64 65

/*
 * Boot-time defaults for the PSW mask bits used in kernel and user mode.
 * set_amode_and_uaccess() overwrites both values when it is called.
 * The kernel mask uses PSW_ASC_PRIMARY; the user mask uses PSW_ASC_HOME and
 * additionally sets PSW_MASK_IO, PSW_MASK_EXT and PSW_MASK_PSTATE.
 */
long psw_kernel_bits	= (PSW_BASE_BITS | PSW_MASK_DAT | PSW_ASC_PRIMARY |
			   PSW_MASK_MCHECK | PSW_DEFAULT_KEY);
long psw_user_bits	= (PSW_BASE_BITS | PSW_MASK_DAT | PSW_ASC_HOME |
			   PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK |
			   PSW_MASK_PSTATE | PSW_DEFAULT_KEY);
L
Linus Torvalds 已提交
66

67 68 69 70
/*
 * User copy operations.
 */
struct uaccess_ops uaccess;
71
EXPORT_SYMBOL(uaccess);
72

L
Linus Torvalds 已提交
73 74 75 76
/*
 * Machine setup..
 */
unsigned int console_mode = 0;
77 78
EXPORT_SYMBOL(console_mode);

L
Linus Torvalds 已提交
79
unsigned int console_devno = -1;
80 81
EXPORT_SYMBOL(console_devno);

L
Linus Torvalds 已提交
82
unsigned int console_irq = -1;
83 84
EXPORT_SYMBOL(console_irq);

85 86
unsigned long elf_hwcap = 0;
char elf_platform[ELF_PLATFORM_SIZE];
87

88
struct mem_chunk __initdata memory_chunk[MEMORY_CHUNKS];
89 90 91

int __initdata memory_end_set;
unsigned long __initdata memory_end;
L
Linus Torvalds 已提交
92

F
Frank Munzert 已提交
93 94 95 96
/* An array with a pointer to the lowcore of every CPU. */
struct _lowcore *lowcore_ptr[NR_CPUS];
EXPORT_SYMBOL(lowcore_ptr);

L
Linus Torvalds 已提交
97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117
/*
 * The parameters used below are set up by the setup routine at boot time.
 * On S390 we find out what we have to set up by looking at
 * address 0x10400 ...
 */

#include <asm/setup.h>

/*
 * Resource descriptors for the kernel image. Only name and flags are set
 * here; setup_resources() fills in start/end from the _text/_etext/_edata
 * symbols and requests them below the memory chunk resource they fall into.
 */
static struct resource code_resource = {
	.name  = "Kernel code",
	.flags = IORESOURCE_BUSY | IORESOURCE_MEM,
};

static struct resource data_resource = {
	.name = "Kernel data",
	.flags = IORESOURCE_BUSY | IORESOURCE_MEM,
};

/*
 * cpu_init() initializes state that is per-CPU.
 */
H
Heiko Carstens 已提交
118
void __cpuinit cpu_init(void)
L
Linus Torvalds 已提交
119 120 121 122
{
        /*
         * Store processor id in lowcore (used e.g. in timer_interrupt)
         */
123
	get_cpu_id(&S390_lowcore.cpu_id);
L
Linus Torvalds 已提交
124 125 126

	atomic_inc(&init_mm.mm_count);
	current->active_mm = &init_mm;
S
Stoyan Gaydarov 已提交
127
	BUG_ON(current->mm);
L
Linus Torvalds 已提交
128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148
        enter_lazy_tlb(&init_mm, current);
}

/*
 * condev= and conmode= setup parameter.
 */

/*
 * condev_setup() - handle the "condev=" setup parameter.
 * @str: text following "condev=", parsed as a number (base auto-detected)
 *
 * A value in the range 0..65535 becomes the console device number and
 * console_irq is reset to -1. Any other value is ignored.
 *
 * The parsed value is kept as unsigned long: squeezing it into an int
 * first would truncate it, so that e.g. 0x100000001 would pass the range
 * check as device number 1.
 *
 * Returns 1 in all cases.
 */
static int __init condev_setup(char *str)
{
	unsigned long vdev;

	vdev = simple_strtoul(str, NULL, 0);
	if (vdev < 65536) {
		console_devno = vdev;
		console_irq = -1;
	}
	return 1;
}

__setup("condev=", condev_setup);

149 150
/*
 * set_preferred_console() - register the preferred console device.
 *
 * "hvc" is used under KVM, "ttyS" for the 3215 and SCLP console modes and
 * "tty3270" for the 3270 console mode. If none of these applies, nothing
 * is registered.
 */
static void __init set_preferred_console(void)
{
	char *name = NULL;

	if (MACHINE_IS_KVM)
		name = "hvc";
	else if (CONSOLE_IS_3215 || CONSOLE_IS_SCLP)
		name = "ttyS";
	else if (CONSOLE_IS_3270)
		name = "tty3270";

	if (name)
		add_preferred_console(name, 0, NULL);
}

L
Linus Torvalds 已提交
159 160
/*
 * conmode_setup() - handle the "conmode=" setup parameter.
 * @str: text following "conmode="
 *
 * Recognizes exactly "hwc" or "sclp", "3215" and "3270", each only if the
 * matching console driver is configured, and then registers the preferred
 * console. Returns 1 in all cases.
 */
static int __init conmode_setup(char *str)
{
#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
	if (!strcmp(str, "hwc") || !strcmp(str, "sclp"))
		SET_CONSOLE_SCLP;
#endif
#if defined(CONFIG_TN3215_CONSOLE)
	if (!strcmp(str, "3215"))
		SET_CONSOLE_3215;
#endif
#if defined(CONFIG_TN3270_CONSOLE)
	if (!strcmp(str, "3270"))
		SET_CONSOLE_3270;
#endif
	set_preferred_console();
	return 1;
}

__setup("conmode=", conmode_setup);

/*
 * conmode_default() - select the default console mode.
 *
 * Under z/VM the console device number and subchannel are read from the
 * "QUERY CONSOLE" response and the console mode from the CONMODE field of
 * the "QUERY TERM" response. The driver matching that mode is selected if
 * it is configured, otherwise the next configured one is used as fallback.
 * When not running under z/VM the SCLP console is selected if configured.
 */
static void __init conmode_default(void)
{
	char query_buffer[1024];
	char *ptr;

	if (!MACHINE_IS_VM) {
#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
		SET_CONSOLE_SCLP;
#endif
		return;
	}

	cpcmd("QUERY CONSOLE", query_buffer, sizeof(query_buffer), NULL);
	console_devno = simple_strtoul(query_buffer + 5, NULL, 16);
	ptr = strstr(query_buffer, "SUBCHANNEL =");
	/*
	 * Do not dereference a failed lookup: if the response carries no
	 * subchannel field, console_irq keeps its current value.
	 */
	if (ptr != NULL)
		console_irq = simple_strtoul(ptr + 13, NULL, 16);

	cpcmd("QUERY TERM", query_buffer, sizeof(query_buffer), NULL);
	ptr = strstr(query_buffer, "CONMODE");
	/*
	 * Set the conmode to 3215 so that the device recognition
	 * will set the cu_type of the console to 3215. If the
	 * conmode is 3270 and we don't set it back then both
	 * 3215 and the 3270 driver will try to access the console
	 * device (3215 as console and 3270 as normal tty).
	 */
	cpcmd("TERM CONMODE 3215", NULL, 0, NULL);
	if (ptr == NULL) {
#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
		SET_CONSOLE_SCLP;
#endif
		return;
	}

	if (strncmp(ptr + 8, "3270", 4) == 0) {
#if defined(CONFIG_TN3270_CONSOLE)
		SET_CONSOLE_3270;
#elif defined(CONFIG_TN3215_CONSOLE)
		SET_CONSOLE_3215;
#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
		SET_CONSOLE_SCLP;
#endif
	} else if (strncmp(ptr + 8, "3215", 4) == 0) {
#if defined(CONFIG_TN3215_CONSOLE)
		SET_CONSOLE_3215;
#elif defined(CONFIG_TN3270_CONSOLE)
		SET_CONSOLE_3270;
#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
		SET_CONSOLE_SCLP;
#endif
	}
}

229
#ifdef CONFIG_ZFCPDUMP
/*
 * setup_zfcpdump() - adjust the command line for an FCP dump IPL.
 * @console_devno: console device number, or -1 if there is none
 *
 * Does nothing unless ipl_info.type is IPL_TYPE_FCP_DUMP. Otherwise a
 * " cio_ignore=all,!<ipl device>[,!<console device>]" option is appended
 * to boot_command_line and console_loglevel is set to 2.
 *
 * Both the formatting and the append are bounded so that neither the
 * local buffer nor boot_command_line can be overrun.
 */
static void __init setup_zfcpdump(unsigned int console_devno)
{
	static char str[41];

	if (ipl_info.type != IPL_TYPE_FCP_DUMP)
		return;
	if (console_devno != -1)
		snprintf(str, sizeof(str),
			 " cio_ignore=all,!0.0.%04x,!0.0.%04x",
			 ipl_info.data.fcp.dev_id.devno, console_devno);
	else
		snprintf(str, sizeof(str), " cio_ignore=all,!0.0.%04x",
			 ipl_info.data.fcp.dev_id.devno);
	/* The command line may already be nearly full. */
	strlcat(boot_command_line, str, COMMAND_LINE_SIZE);
	console_loglevel = 2;
}
#else
static inline void setup_zfcpdump(unsigned int console_devno) {}
#endif /* CONFIG_ZFCPDUMP */

L
Linus Torvalds 已提交
249 250 251 252 253 254 255
/*
 * Reboot, halt and power_off stubs. They unblank the console when it is
 * safe to do so and then call _machine_restart, _machine_halt or
 * _machine_power_off.
 */

void machine_restart(char *command)
{
256
	if ((!in_interrupt() && !in_atomic()) || oops_in_progress)
257 258 259 260 261
		/*
		 * Only unblank the console if we are called in enabled
		 * context or a bust_spinlocks cleared the way for us.
		 */
		console_unblank();
L
Linus Torvalds 已提交
262 263 264 265 266
	_machine_restart(command);
}

void machine_halt(void)
{
267 268 269 270 271 272
	if (!in_interrupt() || oops_in_progress)
		/*
		 * Only unblank the console if we are called in enabled
		 * context or a bust_spinlocks cleared the way for us.
		 */
		console_unblank();
L
Linus Torvalds 已提交
273 274 275 276 277
	_machine_halt();
}

void machine_power_off(void)
{
278 279 280 281 282 283
	if (!in_interrupt() || oops_in_progress)
		/*
		 * Only unblank the console if we are called in enabled
		 * context or a bust_spinlocks cleared the way for us.
		 */
		console_unblank();
L
Linus Torvalds 已提交
284 285 286
	_machine_power_off();
}

287 288 289 290 291
/*
 * Power off hook. It is initialized to machine_power_off(), so calling
 * through the pointer ends up in the stub defined in this file.
 */
void (*pm_power_off)(void) = machine_power_off;

292 293 294
/*
 * early_parse_mem() - handle the "mem" early parameter.
 * @p: size string that is parsed with memparse(), or NULL if the option
 *     was given without a value
 *
 * Stores the parsed size in memory_end and sets memory_end_set.
 *
 * Returns 0 on success and 1 if no value was supplied.
 */
static int __init early_parse_mem(char *p)
{
	/*
	 * Early parameter handlers can be called with a NULL argument
	 * (early_parse_user_mode() checks for it as well); do not hand
	 * that to memparse().
	 */
	if (!p)
		return 1;
	memory_end = memparse(p, &p);
	memory_end_set = 1;
	return 0;
}
early_param("mem", early_parse_mem);

300 301
/*
 * Address space mode selected for user space. Defaults to home space; the
 * "switch_amode", "user_mode" and "noexec" early parameters change it.
 */
unsigned int user_mode = HOME_SPACE_MODE;
EXPORT_SYMBOL_GPL(user_mode);
G
Gerald Schaefer 已提交
302

303 304
static int set_amode_and_uaccess(unsigned long user_amode,
				 unsigned long user32_amode)
G
Gerald Schaefer 已提交
305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321
{
	psw_user_bits = PSW_BASE_BITS | PSW_MASK_DAT | user_amode |
			PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK |
			PSW_MASK_PSTATE | PSW_DEFAULT_KEY;
#ifdef CONFIG_COMPAT
	psw_user32_bits = PSW_BASE32_BITS | PSW_MASK_DAT | user_amode |
			  PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK |
			  PSW_MASK_PSTATE | PSW_DEFAULT_KEY;
	psw32_user_bits = PSW32_BASE_BITS | PSW32_MASK_DAT | user32_amode |
			  PSW32_MASK_IO | PSW32_MASK_EXT | PSW32_MASK_MCHECK |
			  PSW32_MASK_PSTATE;
#endif
	psw_kernel_bits = PSW_BASE_BITS | PSW_MASK_DAT | PSW_ASC_HOME |
			  PSW_MASK_MCHECK | PSW_DEFAULT_KEY;

	if (MACHINE_HAS_MVCOS) {
		memcpy(&uaccess, &uaccess_mvcos_switch, sizeof(uaccess));
322
		return 1;
G
Gerald Schaefer 已提交
323 324
	} else {
		memcpy(&uaccess, &uaccess_pt, sizeof(uaccess));
325
		return 0;
G
Gerald Schaefer 已提交
326 327 328 329 330 331 332 333
	}
}

/*
 * Switch kernel/user addressing modes?
 */
/*
 * early_parse_switch_amode() - handle the "switch_amode" early parameter.
 * @p: unused
 *
 * Selects PRIMARY_SPACE_MODE unless SECONDARY_SPACE_MODE has already been
 * selected. Returns 0 in all cases.
 */
static int __init early_parse_switch_amode(char *p)
{
	if (user_mode == SECONDARY_SPACE_MODE)
		return 0;

	user_mode = PRIMARY_SPACE_MODE;
	return 0;
}
early_param("switch_amode", early_parse_switch_amode);

340
/*
 * early_parse_user_mode() - handle the "user_mode" early parameter.
 * @p: "primary", "home", or (with CONFIG_S390_EXEC_PROTECT) "secondary";
 *     NULL is treated like "home"
 *
 * Returns 0 if user_mode was set and 1 for an unrecognized value.
 */
static int __init early_parse_user_mode(char *p)
{
	if (!p) {
		user_mode = HOME_SPACE_MODE;
		return 0;
	}
	if (!strcmp(p, "primary")) {
		user_mode = PRIMARY_SPACE_MODE;
		return 0;
	}
#ifdef CONFIG_S390_EXEC_PROTECT
	if (!strcmp(p, "secondary")) {
		user_mode = SECONDARY_SPACE_MODE;
		return 0;
	}
#endif
	if (!strcmp(p, "home")) {
		user_mode = HOME_SPACE_MODE;
		return 0;
	}
	return 1;
}
354
early_param("user_mode", early_parse_user_mode);
G
Gerald Schaefer 已提交
355 356 357 358 359 360 361 362 363

#ifdef CONFIG_S390_EXEC_PROTECT
/*
 * Enable execute protection?
 *
 * early_parse_noexec() - handle the "noexec" early parameter.
 * @p: option value, may be NULL if the option was given without one
 *
 * A value starting with "off" leaves user_mode untouched. Everything
 * else, including a missing value, selects SECONDARY_SPACE_MODE.
 * Returns 0 in all cases.
 */
static int __init early_parse_noexec(char *p)
{
	/*
	 * Guard against a NULL argument before comparing, like
	 * early_parse_user_mode() does.
	 */
	if (p && !strncmp(p, "off", 3))
		return 0;
	user_mode = SECONDARY_SPACE_MODE;
	return 0;
}
early_param("noexec", early_parse_noexec);
#endif /* CONFIG_S390_EXEC_PROTECT */

static void setup_addressing_mode(void)
{
372
	if (user_mode == SECONDARY_SPACE_MODE) {
373 374 375 376 377 378 379
		if (set_amode_and_uaccess(PSW_ASC_SECONDARY,
					  PSW32_ASC_SECONDARY))
			pr_info("Execute protection active, "
				"mvcos available\n");
		else
			pr_info("Execute protection active, "
				"mvcos not available\n");
380
	} else if (user_mode == PRIMARY_SPACE_MODE) {
381 382 383 384 385 386
		if (set_amode_and_uaccess(PSW_ASC_PRIMARY, PSW32_ASC_PRIMARY))
			pr_info("Address spaces switched, "
				"mvcos available\n");
		else
			pr_info("Address spaces switched, "
				"mvcos not available\n");
G
Gerald Schaefer 已提交
387
	}
388 389 390 391
#ifdef CONFIG_TRACE_IRQFLAGS
	sysc_restore_trace_psw.mask = psw_kernel_bits & ~PSW_MASK_MCHECK;
	io_restore_trace_psw.mask = psw_kernel_bits & ~PSW_MASK_MCHECK;
#endif
G
Gerald Schaefer 已提交
392 393
}

394 395 396 397 398 399 400 401
/*
 * setup_lowcore() - allocate and fill in the lowcore of the boot cpu.
 *
 * The new lowcore gets the new-PSW entries for all interrupt classes, the
 * kernel/async/panic stacks and a copy of the machine flags, timer values
 * and ftrace function of the current lowcore. It is then installed with
 * set_prefix() and recorded in lowcore_ptr[0].
 */
static void __init
setup_lowcore(void)
{
	struct _lowcore *boot_lc;

	BUILD_BUG_ON(sizeof(struct _lowcore) != LC_PAGES * 4096);
	boot_lc = __alloc_bootmem_low(LC_PAGES * PAGE_SIZE,
				      LC_PAGES * PAGE_SIZE, 0);

	/* New PSWs: restart, external, svc, program, machine check, I/O. */
	boot_lc->restart_psw.mask = PSW_BASE_BITS | PSW_DEFAULT_KEY;
	if (user_mode != HOME_SPACE_MODE)
		boot_lc->restart_psw.mask |= PSW_ASC_HOME;
	boot_lc->restart_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) restart_int_handler;

	boot_lc->external_new_psw.mask = psw_kernel_bits;
	boot_lc->external_new_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) ext_int_handler;

	boot_lc->svc_new_psw.mask =
		psw_kernel_bits | PSW_MASK_IO | PSW_MASK_EXT;
	boot_lc->svc_new_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) system_call;

	boot_lc->program_new_psw.mask = psw_kernel_bits;
	boot_lc->program_new_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) pgm_check_handler;

	boot_lc->mcck_new_psw.mask =
		psw_kernel_bits & ~(PSW_MASK_MCHECK | PSW_MASK_DAT);
	boot_lc->mcck_new_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) mcck_int_handler;

	boot_lc->io_new_psw.mask = psw_kernel_bits;
	boot_lc->io_new_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) io_int_handler;

	boot_lc->clock_comparator = -1ULL;

	/* Stacks; each pointer is set to the end of its area. */
	boot_lc->kernel_stack =
		((unsigned long) &init_thread_union) + THREAD_SIZE;
	boot_lc->async_stack = (unsigned long)
		__alloc_bootmem(ASYNC_SIZE, ASYNC_SIZE, 0) + ASYNC_SIZE;
	boot_lc->panic_stack = (unsigned long)
		__alloc_bootmem(PAGE_SIZE, PAGE_SIZE, 0) + PAGE_SIZE;

	boot_lc->current_task =
		(unsigned long) init_thread_union.thread_info.task;
	boot_lc->thread_info = (unsigned long) &init_thread_union;
	boot_lc->machine_flags = S390_lowcore.machine_flags;
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE) {
		boot_lc->extended_save_area_addr = (__u32)
			__alloc_bootmem_low(PAGE_SIZE, PAGE_SIZE, 0);
		/* enable extended save area */
		__ctl_set_bit(14, 29);
	}
#else
	boot_lc->vdso_per_cpu_data = (unsigned long) &boot_lc->paste[0];
#endif

	/* Carry over the accounting state of the lowcore in use so far. */
	boot_lc->sync_enter_timer = S390_lowcore.sync_enter_timer;
	boot_lc->async_enter_timer = S390_lowcore.async_enter_timer;
	boot_lc->exit_timer = S390_lowcore.exit_timer;
	boot_lc->user_timer = S390_lowcore.user_timer;
	boot_lc->system_timer = S390_lowcore.system_timer;
	boot_lc->steal_timer = S390_lowcore.steal_timer;
	boot_lc->last_update_timer = S390_lowcore.last_update_timer;
	boot_lc->last_update_clock = S390_lowcore.last_update_clock;
	boot_lc->ftrace_func = S390_lowcore.ftrace_func;

	set_prefix((u32)(unsigned long) boot_lc);
	lowcore_ptr[0] = boot_lc;
}

static void __init
setup_resources(void)
{
H
Hongjie Yang 已提交
458
	struct resource *res, *sub_res;
459 460
	int i;

461 462 463 464 465
	code_resource.start = (unsigned long) &_text;
	code_resource.end = (unsigned long) &_etext - 1;
	data_resource.start = (unsigned long) &_etext;
	data_resource.end = (unsigned long) &_edata - 1;

466 467 468
	for (i = 0; i < MEMORY_CHUNKS; i++) {
		if (!memory_chunk[i].size)
			continue;
469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484
		res = alloc_bootmem_low(sizeof(struct resource));
		res->flags = IORESOURCE_BUSY | IORESOURCE_MEM;
		switch (memory_chunk[i].type) {
		case CHUNK_READ_WRITE:
			res->name = "System RAM";
			break;
		case CHUNK_READ_ONLY:
			res->name = "System ROM";
			res->flags |= IORESOURCE_READONLY;
			break;
		default:
			res->name = "reserved";
		}
		res->start = memory_chunk[i].addr;
		res->end = memory_chunk[i].addr +  memory_chunk[i].size - 1;
		request_resource(&iomem_resource, res);
H
Hongjie Yang 已提交
485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516

		if (code_resource.start >= res->start  &&
			code_resource.start <= res->end &&
			code_resource.end > res->end) {
			sub_res = alloc_bootmem_low(sizeof(struct resource));
			memcpy(sub_res, &code_resource,
				sizeof(struct resource));
			sub_res->end = res->end;
			code_resource.start = res->end + 1;
			request_resource(res, sub_res);
		}

		if (code_resource.start >= res->start &&
			code_resource.start <= res->end &&
			code_resource.end <= res->end)
			request_resource(res, &code_resource);

		if (data_resource.start >= res->start &&
			data_resource.start <= res->end &&
			data_resource.end > res->end) {
			sub_res = alloc_bootmem_low(sizeof(struct resource));
			memcpy(sub_res, &data_resource,
				sizeof(struct resource));
			sub_res->end = res->end;
			data_resource.start = res->end + 1;
			request_resource(res, sub_res);
		}

		if (data_resource.start >= res->start &&
			data_resource.start <= res->end &&
			data_resource.end <= res->end)
			request_resource(res, &data_resource);
517 518 519
	}
}

M
Michael Holzheu 已提交
520 521 522
/*
 * Highest end address of any memory chunk; computed in setup_memory_end()
 * before the chunks are clipped to the memory limit.
 */
unsigned long real_memory_size;
EXPORT_SYMBOL_GPL(real_memory_size);

H
Heiko Carstens 已提交
523 524
/*
 * setup_memory_end() - determine memory_end and trim the memory chunks.
 *
 * For an FCP dump IPL (CONFIG_ZFCPDUMP) memory_end is forced to
 * ZFCPDUMP_HSA_SIZE. memory_end is page aligned and limited to
 * VMEM_MAX_PHYS. All chunks are aligned, then clipped to that limit;
 * chunks that become empty or lie above the limit are zeroed. If
 * memory_end is still 0 afterwards it is set to the highest chunk end
 * that remains.
 */
static void __init setup_memory_end(void)
{
	const unsigned long align = 1UL << (MAX_ORDER + PAGE_SHIFT - 1);
	unsigned long memory_size = 0;
	unsigned long max_mem;
	struct mem_chunk *chunk;
	int i;

#ifdef CONFIG_ZFCPDUMP
	if (ipl_info.type == IPL_TYPE_FCP_DUMP) {
		memory_end = ZFCPDUMP_HSA_SIZE;
		memory_end_set = 1;
	}
#endif
	memory_end &= PAGE_MASK;

	if (memory_end)
		max_mem = min(VMEM_MAX_PHYS, memory_end);
	else
		max_mem = VMEM_MAX_PHYS;
	memory_end = min(max_mem, memory_end);

	/*
	 * Make sure all chunks are MAX_ORDER aligned so we don't need the
	 * extra checks that HOLES_IN_ZONE would require.
	 */
	for (i = 0; i < MEMORY_CHUNKS; i++) {
		unsigned long first, last;

		chunk = &memory_chunk[i];
		first = (chunk->addr + align - 1) & ~(align - 1);
		last = (chunk->addr + chunk->size) & ~(align - 1);
		if (first < last) {
			chunk->addr = first;
			chunk->size = last - first;
		} else {
			memset(chunk, 0, sizeof(*chunk));
		}
	}

	/* Record the real memory size, then clip every chunk to max_mem. */
	for (i = 0; i < MEMORY_CHUNKS; i++) {
		chunk = &memory_chunk[i];

		real_memory_size = max(real_memory_size,
				       chunk->addr + chunk->size);
		if (chunk->addr >= max_mem) {
			memset(chunk, 0, sizeof(*chunk));
			continue;
		}
		if (chunk->addr + chunk->size > max_mem)
			chunk->size = max_mem - chunk->addr;
		memory_size = max(memory_size, chunk->addr + chunk->size);
	}

	if (!memory_end)
		memory_end = memory_size;
}

579 580 581 582
/*
 * setup_memory() - set up the bootmem allocator.
 *
 * Steps, in order:
 *  - compute the first free pfn behind the kernel image and the last pfn
 *    below memory_end,
 *  - move the initrd out of the way if the bootmem bitmap would overlap it,
 *  - initialize bootmem, register all read/write memory chunks and set
 *    their storage keys,
 *  - reserve the low memory area up to _ehead, the kernel image, the
 *    bootmem bitmap and the initrd.
 */
static void __init
setup_memory(void)
{
	unsigned long bootmap_size;
	unsigned long start_pfn, end_pfn;
	int i;

	/*
	 * partially used pages are not usable - thus
	 * we are rounding upwards:
	 */
	start_pfn = PFN_UP(__pa(&_end));
	end_pfn = max_pfn = PFN_DOWN(memory_end);

#ifdef CONFIG_BLK_DEV_INITRD
	/*
	 * Move the initrd in case the bitmap of the bootmem allocator
	 * would overwrite it.
	 */

	if (INITRD_START && INITRD_SIZE) {
		unsigned long bmap_size;
		unsigned long start;

		bmap_size = bootmem_bootmap_pages(end_pfn - start_pfn + 1);
		bmap_size = PFN_PHYS(bmap_size);

		if (PFN_PHYS(start_pfn) + bmap_size > INITRD_START) {
			start = PFN_PHYS(start_pfn) + bmap_size + PAGE_SIZE;

			if (start + INITRD_SIZE > memory_end) {
				pr_err("initrd extends beyond end of "
				       "memory (0x%08lx > 0x%08lx) "
				       "disabling initrd\n",
				       start + INITRD_SIZE, memory_end);
				INITRD_START = INITRD_SIZE = 0;
			} else {
				pr_info("Moving initrd (0x%08lx -> "
					"0x%08lx, size: %ld)\n",
					INITRD_START, start, INITRD_SIZE);
				memmove((void *) start, (void *) INITRD_START,
					INITRD_SIZE);
				INITRD_START = start;
			}
		}
	}
#endif

	/*
	 * Initialize the boot-time allocator
	 */
	bootmap_size = init_bootmem(start_pfn, end_pfn);

	/*
	 * Register RAM areas with the bootmem allocator.
	 *
	 * NOTE(review): this loop stops at the first empty chunk, whereas
	 * setup_resources() skips empty chunks and continues. Confirm that
	 * stopping early is intended.
	 */
	for (i = 0; i < MEMORY_CHUNKS && memory_chunk[i].size > 0; i++) {
		unsigned long start_chunk, end_chunk, pfn;

		if (memory_chunk[i].type != CHUNK_READ_WRITE)
			continue;
		start_chunk = PFN_DOWN(memory_chunk[i].addr);
		end_chunk = start_chunk + PFN_DOWN(memory_chunk[i].size);
		end_chunk = min(end_chunk, end_pfn);
		if (start_chunk >= end_chunk)
			continue;
		add_active_range(0, start_chunk, end_chunk);
		/* Storage keys are only set for pages behind the kernel. */
		pfn = max(start_chunk, start_pfn);
		for (; pfn < end_chunk; pfn++)
			page_set_storage_key(PFN_PHYS(pfn), PAGE_DEFAULT_KEY);
	}

	psw_set_key(PAGE_DEFAULT_KEY);

	free_bootmem_with_active_regions(0, max_pfn);

	/*
	 * Reserve memory used for lowcore/command line/kernel image.
	 */
	reserve_bootmem(0, (unsigned long)_ehead, BOOTMEM_DEFAULT);
	reserve_bootmem((unsigned long)_stext,
			PFN_PHYS(start_pfn) - (unsigned long)_stext,
			BOOTMEM_DEFAULT);
	/*
	 * Reserve the bootmem bitmap itself as well. We do this in two
	 * steps (first step was init_bootmem()) because this catches
	 * the (very unlikely) case of us accidentally initializing the
	 * bootmem allocator with an invalid RAM area.
	 */
	reserve_bootmem(start_pfn << PAGE_SHIFT, bootmap_size,
			BOOTMEM_DEFAULT);

#ifdef CONFIG_BLK_DEV_INITRD
	if (INITRD_START && INITRD_SIZE) {
		if (INITRD_START + INITRD_SIZE <= memory_end) {
			reserve_bootmem(INITRD_START, INITRD_SIZE,
					BOOTMEM_DEFAULT);
			initrd_start = INITRD_START;
			initrd_end = initrd_start + INITRD_SIZE;
		} else {
			/*
			 * Report the end address that failed the check
			 * above. initrd_start has not been assigned on
			 * this path, so it must not be used here.
			 */
			pr_err("initrd extends beyond end of "
			       "memory (0x%08lx > 0x%08lx) "
			       "disabling initrd\n",
			       INITRD_START + INITRD_SIZE, memory_end);
			initrd_start = initrd_end = 0;
		}
	}
#endif
}
L
Linus Torvalds 已提交
689

690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710
/*
 * Setup hardware capabilities.
 */
static void __init setup_hwcaps(void)
{
	static const int stfl_bits[6] = { 0, 2, 7, 17, 19, 21 };
	/* Both facility bits of a pair must be set for the capability. */
	const unsigned long etf3eh_mask =
		(1UL << (31 - 22)) | (1UL << (31 - 30));
	const unsigned long long dfp_mask =
		(1ULL << (63 - 42)) | (1ULL << (63 - 44));
	unsigned long long stfle_dword;
	unsigned int stfl_word;
	int i;

	stfl_word = stfl();
	/*
	 * The store facility list bits numbers as found in the principles
	 * of operation are numbered with bit 1UL<<31 as number 0 to
	 * bit 1UL<<0 as number 31.
	 *   Bit 0: instructions named N3, "backported" to esa-mode
	 *   Bit 2: z/Architecture mode is active
	 *   Bit 7: the store-facility-list-extended facility is installed
	 *   Bit 17: the message-security assist is installed
	 *   Bit 19: the long-displacement facility is installed
	 *   Bit 21: the extended-immediate facility is installed
	 *   Bit 22: extended-translation facility 3 is installed
	 *   Bit 30: extended-translation facility 3 enhancement facility
	 * These get translated to:
	 *   HWCAP_S390_ESAN3 bit 0, HWCAP_S390_ZARCH bit 1,
	 *   HWCAP_S390_STFLE bit 2, HWCAP_S390_MSA bit 3,
	 *   HWCAP_S390_LDISP bit 4, HWCAP_S390_EIMM bit 5 and
	 *   HWCAP_S390_ETF3EH bit 8 (22 && 30).
	 */
	for (i = 0; i < 6; i++) {
		if (stfl_word & (1UL << (31 - stfl_bits[i])))
			elf_hwcap |= 1UL << i;
	}

	if ((stfl_word & etf3eh_mask) == etf3eh_mask)
		elf_hwcap |= HWCAP_S390_ETF3EH;

	/*
	 * Check for additional facilities with store-facility-list-extended.
	 * stfle stores doublewords (8 byte) with bit 1ULL<<63 as bit 0
	 * and 1ULL<<0 as bit 63. Bits 0-31 contain the same information
	 * as stored by stfl, bits 32-xxx contain additional facilities.
	 * How many facility words are stored depends on the number of
	 * doublewords passed to the instruction. The additional facilities
	 * are:
	 *   Bit 42: decimal floating point facility is installed
	 *   Bit 44: perform floating point operation facility is installed
	 * translated to:
	 *   HWCAP_S390_DFP bit 6 (42 && 44).
	 */
	if ((elf_hwcap & (1UL << 2)) && __stfle(&stfle_dword, 1) > 0) {
		if ((stfle_dword & dfp_mask) == dfp_mask)
			elf_hwcap |= HWCAP_S390_DFP;
	}

	/*
	 * Huge page support HWCAP_S390_HPAGE is bit 7.
	 */
	if (MACHINE_HAS_HPAGE)
		elf_hwcap |= HWCAP_S390_HPAGE;

	/*
	 * 64-bit register support for 31-bit processes
	 * HWCAP_S390_HIGH_GPRS is bit 9.
	 */
	elf_hwcap |= HWCAP_S390_HIGH_GPRS;

	/* Derive the ELF platform string from the machine type. */
	switch (S390_lowcore.cpu_id.machine) {
	case 0x9672:
#if !defined(CONFIG_64BIT)
	default:	/* Use "g5" as default for 31 bit kernels. */
#endif
		strcpy(elf_platform, "g5");
		break;
	case 0x2064:
	case 0x2066:
#if defined(CONFIG_64BIT)
	default:	/* Use "z900" as default for 64 bit kernels. */
#endif
		strcpy(elf_platform, "z900");
		break;
	case 0x2084:
	case 0x2086:
		strcpy(elf_platform, "z990");
		break;
	case 0x2094:
	case 0x2096:
		strcpy(elf_platform, "z9-109");
		break;
	case 0x2097:
	case 0x2098:
		strcpy(elf_platform, "z10");
		break;
	}
}

788 789 790 791
/*
 * Setup function called from init/main.c just after the banner
 * was printed.
 */
L
Linus Torvalds 已提交
792

793 794 795
void __init
setup_arch(char **cmdline_p)
{
	/*
	 * Report what head.S has found out about the machine.
	 */
#ifndef CONFIG_64BIT
	if (MACHINE_IS_VM) {
		pr_info("Linux is running as a z/VM guest operating system in 31-bit mode\n");
	} else if (MACHINE_IS_LPAR) {
		pr_info("Linux is running natively in 31-bit mode\n");
	}
	if (MACHINE_HAS_IEEE) {
		pr_info("The hardware system has IEEE compatible floating point units\n");
	} else {
		pr_info("The hardware system has no IEEE compatible floating point units\n");
	}
#else /* CONFIG_64BIT */
	if (MACHINE_IS_VM) {
		pr_info("Linux is running as a z/VM guest operating system in 64-bit mode\n");
	} else if (MACHINE_IS_KVM) {
		pr_info("Linux is running under KVM in 64-bit mode\n");
	} else if (MACHINE_IS_LPAR) {
		pr_info("Linux is running natively in 64-bit mode\n");
	}
#endif /* CONFIG_64BIT */

	/*
	 * Have one command line that is parsed and saved in /proc/cmdline.
	 * boot_command_line has been already set up in early.c.
	 */
	*cmdline_p = boot_command_line;

	ROOT_DEV = Root_RAM0;

	init_mm.start_code = PAGE_OFFSET;
	init_mm.end_code = (unsigned long) &_etext;
	init_mm.end_data = (unsigned long) &_edata;
	init_mm.brk = (unsigned long) &_end;

	/* Default user copy operations; may be replaced further down. */
	memcpy(&uaccess,
	       MACHINE_HAS_MVCOS ? &uaccess_mvcos : &uaccess_std,
	       sizeof(uaccess));

	parse_early_param();

	setup_ipl();
	setup_memory_end();
	setup_addressing_mode();
	setup_memory();
	setup_resources();
	setup_lowcore();

	cpu_init();
	s390_init_cpu_topology();

	/*
	 * Setup capabilities (ELF_HWCAP & ELF_PLATFORM).
	 */
	setup_hwcaps();

	/*
	 * Create kernel page tables and switch to virtual addressing.
	 */
	paging_init();

	/* Setup default console */
	conmode_default();
	set_preferred_console();

	/* Setup zfcpdump support */
	setup_zfcpdump(console_devno);
}