setup.c 22.1 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 *  arch/s390/kernel/setup.c
 *
 *  S390 version
 *    Copyright (C) 1999,2000 IBM Deutschland Entwicklung GmbH, IBM Corporation
 *    Author(s): Hartmut Penner (hp@de.ibm.com),
 *               Martin Schwidefsky (schwidefsky@de.ibm.com)
 *
 *  Derived from "arch/i386/kernel/setup.c"
 *    Copyright (C) 1995, Linus Torvalds
 */

/*
 * This file handles the architecture-dependent parts of initialization
 */

17 18 19
#define KMSG_COMPONENT "setup"
#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt

L
Linus Torvalds 已提交
20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38
#include <linux/errno.h>
#include <linux/module.h>
#include <linux/sched.h>
#include <linux/kernel.h>
#include <linux/mm.h>
#include <linux/stddef.h>
#include <linux/unistd.h>
#include <linux/ptrace.h>
#include <linux/slab.h>
#include <linux/user.h>
#include <linux/tty.h>
#include <linux/ioport.h>
#include <linux/delay.h>
#include <linux/init.h>
#include <linux/initrd.h>
#include <linux/bootmem.h>
#include <linux/root_dev.h>
#include <linux/console.h>
#include <linux/kernel_stat.h>
39
#include <linux/device.h>
40
#include <linux/notifier.h>
41
#include <linux/pfn.h>
H
Hongjie Yang 已提交
42
#include <linux/ctype.h>
43
#include <linux/reboot.h>
44
#include <linux/topology.h>
L
Linus Torvalds 已提交
45

M
Michael Holzheu 已提交
46
#include <asm/ipl.h>
L
Linus Torvalds 已提交
47 48 49 50 51 52 53
#include <asm/uaccess.h>
#include <asm/system.h>
#include <asm/smp.h>
#include <asm/mmu_context.h>
#include <asm/cpcmd.h>
#include <asm/lowcore.h>
#include <asm/irq.h>
54 55
#include <asm/page.h>
#include <asm/ptrace.h>
56
#include <asm/sections.h>
H
Hongjie Yang 已提交
57
#include <asm/ebcdic.h>
G
Gerald Schaefer 已提交
58
#include <asm/compat.h>
59
#include <asm/kvm_virtio.h>
G
Gerald Schaefer 已提交
60 61 62 63 64 65

/*
 * Default PSW mask bits for kernel and user context. Both variables are
 * reassigned by set_amode_and_uaccess() when the address space modes are
 * switched.
 */
long psw_kernel_bits	= (PSW_BASE_BITS | PSW_MASK_DAT | PSW_ASC_PRIMARY |
			   PSW_MASK_MCHECK | PSW_DEFAULT_KEY);
long psw_user_bits	= (PSW_BASE_BITS | PSW_MASK_DAT | PSW_ASC_HOME |
			   PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK |
			   PSW_MASK_PSTATE | PSW_DEFAULT_KEY);
L
Linus Torvalds 已提交
66

67 68 69 70
/*
 * User copy operations.
 *
 * setup_arch() copies either uaccess_mvcos or uaccess_std into this
 * table; set_amode_and_uaccess() may replace it afterwards with
 * uaccess_mvcos_switch or uaccess_pt.
 */
struct uaccess_ops uaccess;
71
EXPORT_SYMBOL(uaccess);
72

L
Linus Torvalds 已提交
73 74 75 76 77 78
/*
 * Machine setup..
 *
 * Console selection state. console_devno and console_irq start out as -1
 * (all bits set, since both are unsigned); setup_zfcpdump() treats a
 * console_devno of -1 as "no console device known".
 */
unsigned int console_mode = 0;
unsigned int console_devno = -1;
unsigned int console_irq = -1;
79
unsigned long machine_flags;
80 81
unsigned long elf_hwcap = 0;
char elf_platform[ELF_PLATFORM_SIZE];
82

83
struct mem_chunk __initdata memory_chunk[MEMORY_CHUNKS];
L
Linus Torvalds 已提交
84
volatile int __cpu_logical_map[NR_CPUS]; /* logical cpu to cpu address */
85 86 87

int __initdata memory_end_set;
unsigned long __initdata memory_end;
L
Linus Torvalds 已提交
88

F
Frank Munzert 已提交
89 90 91 92
/* An array with a pointer to the lowcore of every CPU. */
struct _lowcore *lowcore_ptr[NR_CPUS];
EXPORT_SYMBOL(lowcore_ptr);

L
Linus Torvalds 已提交
93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113
/*
 * This is set up by the setup routine at boot time.
 * For S390 we need to find out what we have to set up
 * using address 0x10400 ...
 */

#include <asm/setup.h>

/*
 * Resource descriptors for the kernel image. The start and end addresses
 * are filled in by setup_resources() from _text, _etext and _edata.
 */
static struct resource code_resource = {
	.name  = "Kernel code",
	.flags = IORESOURCE_BUSY | IORESOURCE_MEM,
};

static struct resource data_resource = {
	.name = "Kernel data",
	.flags = IORESOURCE_BUSY | IORESOURCE_MEM,
};

/*
 * cpu_init() initializes state that is per-CPU.
 */
H
Heiko Carstens 已提交
114
void __cpuinit cpu_init(void)
L
Linus Torvalds 已提交
115 116 117 118 119 120
{
        int addr = hard_smp_processor_id();

        /*
         * Store processor id in lowcore (used e.g. in timer_interrupt)
         */
121
	get_cpu_id(&S390_lowcore.cpu_data.cpu_id);
L
Linus Torvalds 已提交
122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156
        S390_lowcore.cpu_data.cpu_addr = addr;

        /*
         * Force FPU initialization:
         */
        clear_thread_flag(TIF_USEDFPU);
        clear_used_math();

	atomic_inc(&init_mm.mm_count);
	current->active_mm = &init_mm;
        if (current->mm)
                BUG();
        enter_lazy_tlb(&init_mm, current);
}

/*
 * condev= and conmode= setup parameter.
 */

/*
 * Parse "condev=": take the console device number from the command line.
 * Values outside 0..65535 are ignored. An accepted value also resets
 * console_irq to -1. Always returns 1.
 */
static int __init condev_setup(char *str)
{
	int devno = simple_strtoul(str, &str, 0);

	if (devno < 0 || devno >= 65536)
		return 1;

	console_devno = devno;
	console_irq = -1;
	return 1;
}

__setup("condev=", condev_setup);

/*
 * Parse "conmode=": select the console type named on the command line.
 * Only exact names of console types that are configured in have an
 * effect. Always returns 1.
 */
static int __init conmode_setup(char *str)
{
#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
	if (!strcmp(str, "hwc") || !strcmp(str, "sclp")) {
		SET_CONSOLE_SCLP;
	}
#endif
#if defined(CONFIG_TN3215_CONSOLE)
	if (!strcmp(str, "3215")) {
		SET_CONSOLE_3215;
	}
#endif
#if defined(CONFIG_TN3270_CONSOLE)
	if (!strcmp(str, "3270")) {
		SET_CONSOLE_3270;
	}
#endif
	return 1;
}

__setup("conmode=", conmode_setup);

/*
 * Choose the default console type.
 *
 * When running under VM (MACHINE_IS_VM) the CP commands "QUERY CONSOLE"
 * and "QUERY TERM" are issued through cpcmd() to obtain the console device
 * number, its subchannel and the CONMODE setting, and the console type is
 * picked from the CONMODE value, falling back to whichever console driver
 * is configured. Otherwise the SCLP console is selected if configured.
 */
static void __init conmode_default(void)
{
	char query_buffer[1024];
	char *ptr;

	if (MACHINE_IS_VM) {
		cpcmd("QUERY CONSOLE", query_buffer, 1024, NULL);
		console_devno = simple_strtoul(query_buffer + 5, NULL, 16);
		ptr = strstr(query_buffer, "SUBCHANNEL =");
		/*
		 * strstr() returns NULL when the response does not contain
		 * the subchannel field. Leave console_irq untouched in that
		 * case instead of parsing from NULL + 13.
		 */
		if (ptr != NULL)
			console_irq = simple_strtoul(ptr + 13, NULL, 16);
		cpcmd("QUERY TERM", query_buffer, 1024, NULL);
		ptr = strstr(query_buffer, "CONMODE");
		/*
		 * Set the conmode to 3215 so that the device recognition
		 * will set the cu_type of the console to 3215. If the
		 * conmode is 3270 and we don't set it back then both
		 * 3215 and the 3270 driver will try to access the console
		 * device (3215 as console and 3270 as normal tty).
		 */
		cpcmd("TERM CONMODE 3215", NULL, 0, NULL);
		if (ptr == NULL) {
			/* No CONMODE in the response: use SCLP if present. */
#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
			SET_CONSOLE_SCLP;
#endif
			return;
		}
		/* The mode name is read 8 characters after "CONMODE". */
		if (strncmp(ptr + 8, "3270", 4) == 0) {
#if defined(CONFIG_TN3270_CONSOLE)
			SET_CONSOLE_3270;
#elif defined(CONFIG_TN3215_CONSOLE)
			SET_CONSOLE_3215;
#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
			SET_CONSOLE_SCLP;
#endif
		} else if (strncmp(ptr + 8, "3215", 4) == 0) {
#if defined(CONFIG_TN3215_CONSOLE)
			SET_CONSOLE_3215;
#elif defined(CONFIG_TN3270_CONSOLE)
			SET_CONSOLE_3270;
#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
			SET_CONSOLE_SCLP;
#endif
		}
	} else {
#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
		SET_CONSOLE_SCLP;
#endif
	}
}

M
Michael Holzheu 已提交
224 225 226
#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_ZFCPDUMP_MODULE)
/*
 * For an IPL of type IPL_TYPE_FCP_DUMP, append a " cio_ignore=all,..."
 * parameter to boot_command_line that lists the FCP dump device and, if
 * console_devno is not -1, the console device as exceptions. Also sets
 * console_loglevel to 2. Does nothing for any other IPL type.
 */
static void __init setup_zfcpdump(unsigned int console_devno)
{
	static char cio_ignore_arg[41];

	if (ipl_info.type != IPL_TYPE_FCP_DUMP)
		return;

	if (console_devno == -1) {
		sprintf(cio_ignore_arg, " cio_ignore=all,!0.0.%04x",
			ipl_info.data.fcp.dev_id.devno);
	} else {
		sprintf(cio_ignore_arg, " cio_ignore=all,!0.0.%04x,!0.0.%04x",
			ipl_info.data.fcp.dev_id.devno, console_devno);
	}
	/*
	 * NOTE(review): strcat() does not check the remaining space in
	 * boot_command_line - confirm the buffer cannot already be full.
	 */
	strcat(boot_command_line, cio_ignore_arg);
	console_loglevel = 2;
}
#else
static inline void setup_zfcpdump(unsigned int console_devno) {}
#endif /* CONFIG_ZFCPDUMP */

L
Linus Torvalds 已提交
244 245 246 247 248 249 250
 /*
 * Reboot, halt and power_off stubs. They just call _machine_restart,
 * _machine_halt or _machine_power_off. 
 */

void machine_restart(char *command)
{
251
	if ((!in_interrupt() && !in_atomic()) || oops_in_progress)
252 253 254 255 256
		/*
		 * Only unblank the console if we are called in enabled
		 * context or a bust_spinlocks cleared the way for us.
		 */
		console_unblank();
L
Linus Torvalds 已提交
257 258 259 260 261
	_machine_restart(command);
}

void machine_halt(void)
{
262 263 264 265 266 267
	if (!in_interrupt() || oops_in_progress)
		/*
		 * Only unblank the console if we are called in enabled
		 * context or a bust_spinlocks cleared the way for us.
		 */
		console_unblank();
L
Linus Torvalds 已提交
268 269 270 271 272
	_machine_halt();
}

void machine_power_off(void)
{
273 274 275 276 277 278
	if (!in_interrupt() || oops_in_progress)
		/*
		 * Only unblank the console if we are called in enabled
		 * context or a bust_spinlocks cleared the way for us.
		 */
		console_unblank();
L
Linus Torvalds 已提交
279 280 281
	_machine_power_off();
}

282 283 284 285 286
/*
 * Dummy power off function: the pm_power_off hook simply points at
 * machine_power_off().
 */
void (*pm_power_off)(void) = machine_power_off;

287 288 289
/*
 * Parse the "mem" early parameter: store the size returned by memparse()
 * in memory_end and record in memory_end_set that a limit was given.
 * Always returns 0.
 */
static int __init early_parse_mem(char *p)
{
	char *rest = p;

	memory_end = memparse(rest, &rest);
	memory_end_set = 1;

	return 0;
}
early_param("mem", early_parse_mem);

G
Gerald Schaefer 已提交
295
#ifdef CONFIG_S390_SWITCH_AMODE
296 297 298
/*
 * Non-zero if the kernel/user address space modes are to be switched.
 * Defaults to 1 when CONFIG_PGSTE is set, 0 otherwise; the "switch_amode"
 * and "noexec" early parameters can set it to 1.
 */
#ifndef CONFIG_PGSTE
unsigned int switch_amode = 0;
#else
unsigned int switch_amode = 1;
#endif
EXPORT_SYMBOL_GPL(switch_amode);

303 304
static int set_amode_and_uaccess(unsigned long user_amode,
				 unsigned long user32_amode)
G
Gerald Schaefer 已提交
305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321
{
	psw_user_bits = PSW_BASE_BITS | PSW_MASK_DAT | user_amode |
			PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK |
			PSW_MASK_PSTATE | PSW_DEFAULT_KEY;
#ifdef CONFIG_COMPAT
	psw_user32_bits = PSW_BASE32_BITS | PSW_MASK_DAT | user_amode |
			  PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK |
			  PSW_MASK_PSTATE | PSW_DEFAULT_KEY;
	psw32_user_bits = PSW32_BASE_BITS | PSW32_MASK_DAT | user32_amode |
			  PSW32_MASK_IO | PSW32_MASK_EXT | PSW32_MASK_MCHECK |
			  PSW32_MASK_PSTATE;
#endif
	psw_kernel_bits = PSW_BASE_BITS | PSW_MASK_DAT | PSW_ASC_HOME |
			  PSW_MASK_MCHECK | PSW_DEFAULT_KEY;

	if (MACHINE_HAS_MVCOS) {
		memcpy(&uaccess, &uaccess_mvcos_switch, sizeof(uaccess));
322
		return 1;
G
Gerald Schaefer 已提交
323 324
	} else {
		memcpy(&uaccess, &uaccess_pt, sizeof(uaccess));
325
		return 0;
G
Gerald Schaefer 已提交
326 327 328 329 330 331 332 333 334 335 336 337 338 339
	}
}

/*
 * Switch kernel/user addressing modes?
 *
 * Handler for the "switch_amode" early parameter: its mere presence sets
 * switch_amode to 1; the argument string is not looked at. Returns 0.
 */
static int __init early_parse_switch_amode(char *p)
{
	switch_amode = 1;

	return 0;
}
early_param("switch_amode", early_parse_switch_amode);

#else /* CONFIG_S390_SWITCH_AMODE */
340 341
/*
 * Stub used without CONFIG_S390_SWITCH_AMODE: changes nothing and
 * returns 0.
 */
static inline int set_amode_and_uaccess(unsigned long user_amode,
					unsigned long user32_amode)
{
	return 0;
}
#endif /* CONFIG_S390_SWITCH_AMODE */

#ifdef CONFIG_S390_EXEC_PROTECT
unsigned int s390_noexec = 0;
EXPORT_SYMBOL_GPL(s390_noexec);

/*
 * Enable execute protection?
 *
 * Handler for the "noexec" early parameter. An argument starting with
 * "off" changes nothing; any other argument sets both switch_amode and
 * s390_noexec to 1. Always returns 0.
 */
static int __init early_parse_noexec(char *p)
{
	if (strncmp(p, "off", 3) != 0) {
		switch_amode = 1;
		s390_noexec = 1;
	}
	return 0;
}
early_param("noexec", early_parse_noexec);
#endif /* CONFIG_S390_EXEC_PROTECT */

static void setup_addressing_mode(void)
{
	if (s390_noexec) {
368 369 370 371 372 373 374
		if (set_amode_and_uaccess(PSW_ASC_SECONDARY,
					  PSW32_ASC_SECONDARY))
			pr_info("Execute protection active, "
				"mvcos available\n");
		else
			pr_info("Execute protection active, "
				"mvcos not available\n");
375
	} else if (switch_amode) {
376 377 378 379 380 381
		if (set_amode_and_uaccess(PSW_ASC_PRIMARY, PSW32_ASC_PRIMARY))
			pr_info("Address spaces switched, "
				"mvcos available\n");
		else
			pr_info("Address spaces switched, "
				"mvcos not available\n");
G
Gerald Schaefer 已提交
382
	}
383 384 385 386
#ifdef CONFIG_TRACE_IRQFLAGS
	sysc_restore_trace_psw.mask = psw_kernel_bits & ~PSW_MASK_MCHECK;
	io_restore_trace_psw.mask = psw_kernel_bits & ~PSW_MASK_MCHECK;
#endif
G
Gerald Schaefer 已提交
387 388
}

389 390 391 392 393 394 395 396 397 398 399 400 401
/*
 * Setup lowcore for boot cpu.
 *
 * Allocates a zeroed lowcore from bootmem, fills in the new PSWs for the
 * restart, external, svc, program check, machine check and I/O handlers,
 * allocates the async and panic stacks, then passes the lowcore address
 * to set_prefix() and records it in lowcore_ptr[0].
 */
static void __init
setup_lowcore(void)
{
	unsigned long lc_size;
	struct _lowcore *lc;

	/* Two pages when pointers are 8 bytes wide, one page otherwise. */
	lc_size = (sizeof(void *) == 8 ? 2 : 1) * PAGE_SIZE;
	lc = (struct _lowcore *) __alloc_bootmem(lc_size, lc_size, 0);
	memset(lc, 0, lc_size);

	/* Restart PSW; uses the home space if the modes are switched. */
	lc->restart_psw.mask = PSW_BASE_BITS | PSW_DEFAULT_KEY;
	if (switch_amode)
		lc->restart_psw.mask |= PSW_ASC_HOME;
	lc->restart_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) restart_int_handler;

	/* New PSWs for the interruption classes. */
	lc->external_new_psw.mask = psw_kernel_bits;
	lc->external_new_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) ext_int_handler;

	lc->svc_new_psw.mask = psw_kernel_bits | PSW_MASK_IO | PSW_MASK_EXT;
	lc->svc_new_psw.addr = PSW_ADDR_AMODE | (unsigned long) system_call;

	lc->program_new_psw.mask = psw_kernel_bits;
	lc->program_new_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) pgm_check_handler;

	/* The machine check PSW has both MCHECK and DAT masked out. */
	lc->mcck_new_psw.mask =
		psw_kernel_bits & ~(PSW_MASK_MCHECK | PSW_MASK_DAT);
	lc->mcck_new_psw.addr =
		PSW_ADDR_AMODE | (unsigned long) mcck_int_handler;

	lc->io_new_psw.mask = psw_kernel_bits;
	lc->io_new_psw.addr = PSW_ADDR_AMODE | (unsigned long) io_int_handler;

	/* Carry the IPL device over from the currently active lowcore. */
	lc->ipl_device = S390_lowcore.ipl_device;
	lc->clock_comparator = -1ULL;

	/* Stack pointers are set to the end of their areas. */
	lc->kernel_stack = ((unsigned long) &init_thread_union) + THREAD_SIZE;
	lc->async_stack = (unsigned long)
		__alloc_bootmem(ASYNC_SIZE, ASYNC_SIZE, 0) + ASYNC_SIZE;
	lc->panic_stack = (unsigned long)
		__alloc_bootmem(PAGE_SIZE, PAGE_SIZE, 0) + PAGE_SIZE;

	lc->current_task = (unsigned long) init_thread_union.thread_info.task;
	lc->thread_info = (unsigned long) &init_thread_union;
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE) {
		lc->extended_save_area_addr = (__u32)
			__alloc_bootmem(PAGE_SIZE, PAGE_SIZE, 0);
		/* enable extended save area */
		__ctl_set_bit(14, 29);
	}
#else
	lc->vdso_per_cpu_data = (unsigned long) &lc->paste[0];
#endif
	set_prefix((u32)(unsigned long) lc);
	lowcore_ptr[0] = lc;
}

static void __init
setup_resources(void)
{
H
Hongjie Yang 已提交
447
	struct resource *res, *sub_res;
448 449
	int i;

450 451 452 453 454
	code_resource.start = (unsigned long) &_text;
	code_resource.end = (unsigned long) &_etext - 1;
	data_resource.start = (unsigned long) &_etext;
	data_resource.end = (unsigned long) &_edata - 1;

455 456 457
	for (i = 0; i < MEMORY_CHUNKS; i++) {
		if (!memory_chunk[i].size)
			continue;
458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473
		res = alloc_bootmem_low(sizeof(struct resource));
		res->flags = IORESOURCE_BUSY | IORESOURCE_MEM;
		switch (memory_chunk[i].type) {
		case CHUNK_READ_WRITE:
			res->name = "System RAM";
			break;
		case CHUNK_READ_ONLY:
			res->name = "System ROM";
			res->flags |= IORESOURCE_READONLY;
			break;
		default:
			res->name = "reserved";
		}
		res->start = memory_chunk[i].addr;
		res->end = memory_chunk[i].addr +  memory_chunk[i].size - 1;
		request_resource(&iomem_resource, res);
H
Hongjie Yang 已提交
474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505

		if (code_resource.start >= res->start  &&
			code_resource.start <= res->end &&
			code_resource.end > res->end) {
			sub_res = alloc_bootmem_low(sizeof(struct resource));
			memcpy(sub_res, &code_resource,
				sizeof(struct resource));
			sub_res->end = res->end;
			code_resource.start = res->end + 1;
			request_resource(res, sub_res);
		}

		if (code_resource.start >= res->start &&
			code_resource.start <= res->end &&
			code_resource.end <= res->end)
			request_resource(res, &code_resource);

		if (data_resource.start >= res->start &&
			data_resource.start <= res->end &&
			data_resource.end > res->end) {
			sub_res = alloc_bootmem_low(sizeof(struct resource));
			memcpy(sub_res, &data_resource,
				sizeof(struct resource));
			sub_res->end = res->end;
			data_resource.start = res->end + 1;
			request_resource(res, sub_res);
		}

		if (data_resource.start >= res->start &&
			data_resource.start <= res->end &&
			data_resource.end <= res->end)
			request_resource(res, &data_resource);
506 507 508
	}
}

M
Michael Holzheu 已提交
509 510 511
/*
 * Highest end address (addr + size) of any memory chunk, as computed by
 * setup_memory_end() before the chunks are cut down to the memory limit.
 */
unsigned long real_memory_size;
EXPORT_SYMBOL_GPL(real_memory_size);

H
Heiko Carstens 已提交
512 513
/*
 * Determine the end of usable memory.
 *
 * The limit is the page-aligned memory_end if one was set, capped at
 * VMEM_MAX_PHYS (for an FCP dump IPL memory_end is forced to
 * ZFCPDUMP_HSA_SIZE first). All memory chunks are aligned, real_memory_size
 * is updated, and chunks are truncated or cleared at the limit. If no
 * memory_end was set it becomes the highest remaining chunk end.
 */
static void __init setup_memory_end(void)
{
	const unsigned long align = 1UL << (MAX_ORDER + PAGE_SHIFT - 1);
	unsigned long highest_end = 0;
	unsigned long limit;
	struct mem_chunk *chunk;
	int i;

#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_ZFCPDUMP_MODULE)
	if (ipl_info.type == IPL_TYPE_FCP_DUMP) {
		memory_end = ZFCPDUMP_HSA_SIZE;
		memory_end_set = 1;
	}
#endif
	memory_end &= PAGE_MASK;

	limit = memory_end ? min(VMEM_MAX_PHYS, memory_end) : VMEM_MAX_PHYS;
	memory_end = min(limit, memory_end);

	/*
	 * Make sure all chunks are MAX_ORDER aligned so we don't need the
	 * extra checks that HOLES_IN_ZONE would require.
	 */
	for (i = 0; i < MEMORY_CHUNKS; i++) {
		unsigned long first, last;

		chunk = &memory_chunk[i];
		first = (chunk->addr + align - 1) & ~(align - 1);
		last = (chunk->addr + chunk->size) & ~(align - 1);
		if (first < last) {
			chunk->addr = first;
			chunk->size = last - first;
		} else {
			/* Nothing is left of this chunk after alignment. */
			memset(chunk, 0, sizeof(*chunk));
		}
	}

	/* Cut the chunks off at the limit and find the highest end. */
	for (i = 0; i < MEMORY_CHUNKS; i++) {
		chunk = &memory_chunk[i];

		real_memory_size = max(real_memory_size,
				       chunk->addr + chunk->size);
		if (chunk->addr >= limit) {
			memset(chunk, 0, sizeof(*chunk));
			continue;
		}
		if (chunk->addr + chunk->size > limit)
			chunk->size = limit - chunk->addr;
		highest_end = max(highest_end, chunk->addr + chunk->size);
	}

	if (!memory_end)
		memory_end = highest_end;
}

568 569 570 571
/*
 * Set up the boot-time memory allocator.
 *
 * Moves the initrd out of the way of the bootmem bitmap if necessary,
 * initializes bootmem for the page frames between the end of the kernel
 * image and memory_end, registers all read-write memory chunks, and
 * reserves the areas that are already in use (lowcore/command line/kernel
 * image, the bootmem bitmap and the initrd).
 */
static void __init
setup_memory(void)
{
	unsigned long bootmap_size;
	unsigned long start_pfn, end_pfn;
	int i;

	/*
	 * partially used pages are not usable - thus
	 * we are rounding upwards:
	 */
	start_pfn = PFN_UP(__pa(&_end));
	end_pfn = max_pfn = PFN_DOWN(memory_end);

#ifdef CONFIG_BLK_DEV_INITRD
	/*
	 * Move the initrd in case the bitmap of the bootmem allocator
	 * would overwrite it.
	 */

	if (INITRD_START && INITRD_SIZE) {
		unsigned long bmap_size;
		unsigned long start;

		bmap_size = bootmem_bootmap_pages(end_pfn - start_pfn + 1);
		bmap_size = PFN_PHYS(bmap_size);

		if (PFN_PHYS(start_pfn) + bmap_size > INITRD_START) {
			start = PFN_PHYS(start_pfn) + bmap_size + PAGE_SIZE;

			if (start + INITRD_SIZE > memory_end) {
				pr_err("initrd extends beyond end of "
				       "memory (0x%08lx > 0x%08lx) "
				       "disabling initrd\n",
				       start + INITRD_SIZE, memory_end);
				INITRD_START = INITRD_SIZE = 0;
			} else {
				pr_info("Moving initrd (0x%08lx -> "
					"0x%08lx, size: %ld)\n",
					INITRD_START, start, INITRD_SIZE);
				memmove((void *) start, (void *) INITRD_START,
					INITRD_SIZE);
				INITRD_START = start;
			}
		}
	}
#endif

	/*
	 * Initialize the boot-time allocator
	 */
	bootmap_size = init_bootmem(start_pfn, end_pfn);

	/*
	 * Register RAM areas with the bootmem allocator.
	 *
	 * setup_memory_end() may have cleared entries in the middle of
	 * memory_chunk[], so empty entries are skipped rather than treated
	 * as the end of the array (same as in setup_resources()).
	 */
	for (i = 0; i < MEMORY_CHUNKS; i++) {
		unsigned long start_chunk, end_chunk, pfn;

		if (!memory_chunk[i].size)
			continue;
		if (memory_chunk[i].type != CHUNK_READ_WRITE)
			continue;
		start_chunk = PFN_DOWN(memory_chunk[i].addr);
		end_chunk = start_chunk + PFN_DOWN(memory_chunk[i].size);
		end_chunk = min(end_chunk, end_pfn);
		if (start_chunk >= end_chunk)
			continue;
		add_active_range(0, start_chunk, end_chunk);
		/* Storage keys are only set for pages behind the kernel. */
		pfn = max(start_chunk, start_pfn);
		for (; pfn < end_chunk; pfn++)
			page_set_storage_key(PFN_PHYS(pfn), PAGE_DEFAULT_KEY);
	}

	psw_set_key(PAGE_DEFAULT_KEY);

	free_bootmem_with_active_regions(0, max_pfn);

	/*
	 * Reserve memory used for lowcore/command line/kernel image.
	 */
	reserve_bootmem(0, (unsigned long)_ehead, BOOTMEM_DEFAULT);
	reserve_bootmem((unsigned long)_stext,
			PFN_PHYS(start_pfn) - (unsigned long)_stext,
			BOOTMEM_DEFAULT);
	/*
	 * Reserve the bootmem bitmap itself as well. We do this in two
	 * steps (first step was init_bootmem()) because this catches
	 * the (very unlikely) case of us accidentally initializing the
	 * bootmem allocator with an invalid RAM area.
	 */
	reserve_bootmem(start_pfn << PAGE_SHIFT, bootmap_size,
			BOOTMEM_DEFAULT);

#ifdef CONFIG_BLK_DEV_INITRD
	if (INITRD_START && INITRD_SIZE) {
		if (INITRD_START + INITRD_SIZE <= memory_end) {
			reserve_bootmem(INITRD_START, INITRD_SIZE,
					BOOTMEM_DEFAULT);
			initrd_start = INITRD_START;
			initrd_end = initrd_start + INITRD_SIZE;
		} else {
			/*
			 * initrd_start has not been assigned on this path,
			 * so report the end address from INITRD_START.
			 */
			pr_err("initrd extends beyond end of "
			       "memory (0x%08lx > 0x%08lx) "
			       "disabling initrd\n",
			       INITRD_START + INITRD_SIZE, memory_end);
			initrd_start = initrd_end = 0;
		}
	}
#endif
}
L
Linus Torvalds 已提交
678

679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721 722
/*
 * Setup hardware capabilities.
 *
 * Fills elf_hwcap from the facility bits returned by stfl() and __stfle()
 * and from MACHINE_HAS_HPAGE, and sets elf_platform according to the
 * machine type found in the lowcore cpu_id.
 */
static void __init setup_hwcaps(void)
{
	static const int stfl_bits[6] = { 0, 2, 7, 17, 19, 21 };
	struct cpuinfo_S390 *cpuinfo = &S390_lowcore.cpu_data;
	unsigned long long facility_list_extended;
	unsigned int facility_list;
	unsigned int i;

	facility_list = stfl();
	/*
	 * The store facility list bits numbers as found in the principles
	 * of operation are numbered with bit 1UL<<31 as number 0 to
	 * bit 1UL<<0 as number 31.
	 *   Bit 0: instructions named N3, "backported" to esa-mode
	 *   Bit 2: z/Architecture mode is active
	 *   Bit 7: the store-facility-list-extended facility is installed
	 *   Bit 17: the message-security assist is installed
	 *   Bit 19: the long-displacement facility is installed
	 *   Bit 21: the extended-immediate facility is installed
	 * These get translated to:
	 *   HWCAP_S390_ESAN3 bit 0, HWCAP_S390_ZARCH bit 1,
	 *   HWCAP_S390_STFLE bit 2, HWCAP_S390_MSA bit 3,
	 *   HWCAP_S390_LDISP bit 4, and HWCAP_S390_EIMM bit 5.
	 */
	for (i = 0; i < ARRAY_SIZE(stfl_bits); i++)
		if (facility_list & (1UL << (31 - stfl_bits[i])))
			elf_hwcap |= 1UL << i;

	/*
	 * Check for additional facilities with store-facility-list-extended.
	 * stfle stores doublewords (8 byte) with bit 1ULL<<63 as bit 0
	 * and 1ULL<<0 as bit 63. Bits 0-31 contain the same information
	 * as stored by stfl, bits 32-xxx contain additional facilities.
	 * How many facility words are stored depends on the number of
	 * doublewords passed to the instruction. The additional facilities
	 * are:
	 *   Bit 42: decimal floating point facility is installed
	 * translated to:
	 *   HWCAP_S390_DFP bit 6.
	 *
	 * The mask tested is 1ULL << 21, which is facility bit 42 in the
	 * numbering described above.
	 */
	if ((elf_hwcap & (1UL << 2)) &&
	    __stfle(&facility_list_extended, 1) > 0) {
		if (facility_list_extended & (1ULL << (63 - 42)))
			elf_hwcap |= 1UL << 6;
	}

	/* hwcap bit 7 is set when MACHINE_HAS_HPAGE is true. */
	if (MACHINE_HAS_HPAGE)
		elf_hwcap |= 1UL << 7;

	/*
	 * Map the machine type to the ELF platform string. Unknown types
	 * fall back to "g5" on 31 bit and "z900" on 64 bit kernels.
	 */
	switch (cpuinfo->cpu_id.machine) {
	case 0x9672:
#if !defined(CONFIG_64BIT)
	default:	/* Use "g5" as default for 31 bit kernels. */
#endif
		strcpy(elf_platform, "g5");
		break;
	case 0x2064:
	case 0x2066:
#if defined(CONFIG_64BIT)
	default:	/* Use "z900" as default for 64 bit kernels. */
#endif
		strcpy(elf_platform, "z900");
		break;
	case 0x2084:
	case 0x2086:
		strcpy(elf_platform, "z990");
		break;
	case 0x2094:
	case 0x2096:
		strcpy(elf_platform, "z9-109");
		break;
	case 0x2097:
	case 0x2098:
		strcpy(elf_platform, "z10");
		break;
	}
}

760 761 762 763
/*
 * Setup function called from init/main.c just after the banner
 * was printed.
 */
L
Linus Torvalds 已提交
764

765 766 767
void __init
setup_arch(char **cmdline_p)
{
768 769 770
	/* set up preferred console */
	add_preferred_console("ttyS", 0, NULL);

L
Linus Torvalds 已提交
771
        /*
772
         * print what head.S has found out about the machine
L
Linus Torvalds 已提交
773
         */
774
#ifndef CONFIG_64BIT
775 776 777 778 779 780 781 782 783 784 785
	if (MACHINE_IS_VM)
		pr_info("Linux is running as a z/VM "
			"guest operating system in 31-bit mode\n");
	else
		pr_info("Linux is running natively in 31-bit mode\n");
	if (MACHINE_HAS_IEEE)
		pr_info("The hardware system has IEEE compatible "
			"floating point units\n");
	else
		pr_info("The hardware system has no IEEE compatible "
			"floating point units\n");
786
#else /* CONFIG_64BIT */
787
	if (MACHINE_IS_VM)
788 789
		pr_info("Linux is running as a z/VM "
			"guest operating system in 64-bit mode\n");
790
	else if (MACHINE_IS_KVM) {
791
		pr_info("Linux is running under KVM in 64-bit mode\n");
792 793
		add_preferred_console("hvc", 0, NULL);
		s390_virtio_console_init();
794
	} else
795
		pr_info("Linux is running natively in 64-bit mode\n");
796
#endif /* CONFIG_64BIT */
797

798 799 800
	/* Have one command line that is parsed and saved in /proc/cmdline */
	/* boot_command_line has been already set up in early.c */
	*cmdline_p = boot_command_line;
801

802
        ROOT_DEV = Root_RAM0;
803 804 805 806 807 808

	init_mm.start_code = PAGE_OFFSET;
	init_mm.end_code = (unsigned long) &_etext;
	init_mm.end_data = (unsigned long) &_edata;
	init_mm.brk = (unsigned long) &_end;

809 810 811 812 813
	if (MACHINE_HAS_MVCOS)
		memcpy(&uaccess, &uaccess_mvcos, sizeof(uaccess));
	else
		memcpy(&uaccess, &uaccess_std, sizeof(uaccess));

814 815
	parse_early_param();

816
	setup_ipl();
H
Heiko Carstens 已提交
817
	setup_memory_end();
G
Gerald Schaefer 已提交
818
	setup_addressing_mode();
819 820 821 822
	setup_memory();
	setup_resources();
	setup_lowcore();

L
Linus Torvalds 已提交
823 824
        cpu_init();
        __cpu_logical_map[0] = S390_lowcore.cpu_data.cpu_addr;
825
	s390_init_cpu_topology();
L
Linus Torvalds 已提交
826

827 828 829 830 831
	/*
	 * Setup capabilities (ELF_HWCAP & ELF_PLATFORM).
	 */
	setup_hwcaps();

L
Linus Torvalds 已提交
832 833 834 835 836 837 838
	/*
	 * Create kernel page tables and switch to virtual addressing.
	 */
        paging_init();

        /* Setup default console */
	conmode_default();
M
Michael Holzheu 已提交
839 840 841

	/* Setup zfcpdump support */
	setup_zfcpdump(console_devno);
L
Linus Torvalds 已提交
842
}