Linux Audio

Check our new training course

Loading...
v6.2
   1// SPDX-License-Identifier: GPL-2.0
   2/*
   3 *  S390 version
   4 *    Copyright IBM Corp. 1999, 2012
   5 *    Author(s): Hartmut Penner (hp@de.ibm.com),
   6 *               Martin Schwidefsky (schwidefsky@de.ibm.com)
   7 *
   8 *  Derived from "arch/i386/kernel/setup.c"
   9 *    Copyright (C) 1995, Linus Torvalds
  10 */
  11
  12/*
  13 * This file handles the architecture-dependent parts of initialization
  14 */
  15
  16#define KMSG_COMPONENT "setup"
  17#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
  18
  19#include <linux/errno.h>
  20#include <linux/export.h>
  21#include <linux/sched.h>
  22#include <linux/sched/task.h>
  23#include <linux/cpu.h>
  24#include <linux/kernel.h>
  25#include <linux/memblock.h>
  26#include <linux/mm.h>
  27#include <linux/stddef.h>
  28#include <linux/unistd.h>
  29#include <linux/ptrace.h>
  30#include <linux/random.h>
  31#include <linux/user.h>
  32#include <linux/tty.h>
  33#include <linux/ioport.h>
  34#include <linux/delay.h>
  35#include <linux/init.h>
  36#include <linux/initrd.h>
 
  37#include <linux/root_dev.h>
  38#include <linux/console.h>
  39#include <linux/kernel_stat.h>
  40#include <linux/dma-map-ops.h>
  41#include <linux/device.h>
  42#include <linux/notifier.h>
  43#include <linux/pfn.h>
  44#include <linux/ctype.h>
  45#include <linux/reboot.h>
  46#include <linux/topology.h>
 
  47#include <linux/kexec.h>
  48#include <linux/crash_dump.h>
  49#include <linux/memory.h>
  50#include <linux/compat.h>
  51#include <linux/start_kernel.h>
  52#include <linux/hugetlb.h>
  53#include <linux/kmemleak.h>
  54
  55#include <asm/archrandom.h>
  56#include <asm/boot_data.h>
  57#include <asm/ipl.h>
  58#include <asm/facility.h>
  59#include <asm/smp.h>
  60#include <asm/mmu_context.h>
  61#include <asm/cpcmd.h>
  62#include <asm/abs_lowcore.h>
  63#include <asm/nmi.h>
  64#include <asm/irq.h>
  65#include <asm/page.h>
  66#include <asm/ptrace.h>
  67#include <asm/sections.h>
  68#include <asm/ebcdic.h>
 
  69#include <asm/diag.h>
  70#include <asm/os_info.h>
  71#include <asm/sclp.h>
  72#include <asm/stacktrace.h>
  73#include <asm/sysinfo.h>
  74#include <asm/numa.h>
  75#include <asm/alternative.h>
  76#include <asm/nospec-branch.h>
  77#include <asm/mem_detect.h>
  78#include <asm/maccess.h>
  79#include <asm/uv.h>
  80#include <asm/asm-offsets.h>
  81#include "entry.h"
  82
  83/*
  84 * Machine setup..
  85 */
  86unsigned int console_mode = 0;
  87EXPORT_SYMBOL(console_mode);
  88
  89unsigned int console_devno = -1;
  90EXPORT_SYMBOL(console_devno);
  91
  92unsigned int console_irq = -1;
  93EXPORT_SYMBOL(console_irq);
  94
  95/*
  96 * Some code and data needs to stay below 2 GB, even when the kernel would be
  97 * relocated above 2 GB, because it has to use 31 bit addresses.
  98 * Such code and data is part of the .amode31 section.
  99 */
 100unsigned long __amode31_ref __samode31 = (unsigned long)&_samode31;
 101unsigned long __amode31_ref __eamode31 = (unsigned long)&_eamode31;
 102unsigned long __amode31_ref __stext_amode31 = (unsigned long)&_stext_amode31;
 103unsigned long __amode31_ref __etext_amode31 = (unsigned long)&_etext_amode31;
 104struct exception_table_entry __amode31_ref *__start_amode31_ex_table = _start_amode31_ex_table;
 105struct exception_table_entry __amode31_ref *__stop_amode31_ex_table = _stop_amode31_ex_table;
 106
 107/*
 108 * Control registers CR2, CR5 and CR15 are initialized with addresses
 109 * of tables that must be placed below 2G which is handled by the AMODE31
 110 * sections.
 111 * Because the AMODE31 sections are relocated below 2G at startup,
 112 * the content of control registers CR2, CR5 and CR15 must be updated
 113 * with new addresses after the relocation. The initial initialization of
 114 * control registers occurs in head64.S and then gets updated again after AMODE31
 115 * relocation. We must access the relevant AMODE31 tables indirectly via
 116 * pointers placed in the .amode31.refs linker section. Those pointers get
 117 * updated automatically during AMODE31 relocation and always contain a valid
 118 * address within AMODE31 sections.
 119 */
 120
 121static __amode31_data u32 __ctl_duct_amode31[16] __aligned(64);
 122
 123static __amode31_data u64 __ctl_aste_amode31[8] __aligned(64) = {
 124	[1] = 0xffffffffffffffff
 125};
 126
 127static __amode31_data u32 __ctl_duald_amode31[32] __aligned(128) = {
 128	0x80000000, 0, 0, 0,
 129	0x80000000, 0, 0, 0,
 130	0x80000000, 0, 0, 0,
 131	0x80000000, 0, 0, 0,
 132	0x80000000, 0, 0, 0,
 133	0x80000000, 0, 0, 0,
 134	0x80000000, 0, 0, 0,
 135	0x80000000, 0, 0, 0
 136};
 137
 138static __amode31_data u32 __ctl_linkage_stack_amode31[8] __aligned(64) = {
 139	0, 0, 0x89000000, 0,
 140	0, 0, 0x8a000000, 0
 141};
 142
 143static u64 __amode31_ref *__ctl_aste = __ctl_aste_amode31;
 144static u32 __amode31_ref *__ctl_duald = __ctl_duald_amode31;
 145static u32 __amode31_ref *__ctl_linkage_stack = __ctl_linkage_stack_amode31;
 146static u32 __amode31_ref *__ctl_duct = __ctl_duct_amode31;
 147
 148int __bootdata(noexec_disabled);
 149unsigned long __bootdata(ident_map_size);
 150struct mem_detect_info __bootdata(mem_detect);
 151struct initrd_data __bootdata(initrd_data);
 152
 153unsigned long __bootdata_preserved(__kaslr_offset);
 154unsigned long __bootdata(__amode31_base);
 155unsigned int __bootdata_preserved(zlib_dfltcc_support);
 156EXPORT_SYMBOL(zlib_dfltcc_support);
 157u64 __bootdata_preserved(stfle_fac_list[16]);
 158EXPORT_SYMBOL(stfle_fac_list);
 159u64 __bootdata_preserved(alt_stfle_fac_list[16]);
 160struct oldmem_data __bootdata_preserved(oldmem_data);
 161
 162unsigned long VMALLOC_START;
 163EXPORT_SYMBOL(VMALLOC_START);
 164
 165unsigned long VMALLOC_END;
 166EXPORT_SYMBOL(VMALLOC_END);
 167
 168struct page *vmemmap;
 169EXPORT_SYMBOL(vmemmap);
 170unsigned long vmemmap_size;
 171
 
 172unsigned long MODULES_VADDR;
 173unsigned long MODULES_END;
 
 174
 175/* An array with a pointer to the lowcore of every CPU. */
 176struct lowcore *lowcore_ptr[NR_CPUS];
 177EXPORT_SYMBOL(lowcore_ptr);
 178
 179DEFINE_STATIC_KEY_FALSE(cpu_has_bear);
 180
 181/*
 182 * The Write Back bit position in the physaddr is given by the SLPC PCI.
 183 * Leaving the mask zero always uses write through which is safe
 184 */
 185unsigned long mio_wb_bit_mask __ro_after_init;
 186
 187/*
 188 * This is set up by the setup-routine at boot-time
 189 * for S390 need to find out, what we have to setup
 190 * using address 0x10400 ...
 191 */
 192
 193#include <asm/setup.h>
 194
 195/*
 196 * condev= and conmode= setup parameter.
 197 */
 198
 199static int __init condev_setup(char *str)
 200{
 201	int vdev;
 202
 203	vdev = simple_strtoul(str, &str, 0);
 204	if (vdev >= 0 && vdev < 65536) {
 205		console_devno = vdev;
 206		console_irq = -1;
 207	}
 208	return 1;
 209}
 210
 211__setup("condev=", condev_setup);
 212
 213static void __init set_preferred_console(void)
 214{
 215	if (CONSOLE_IS_3215 || CONSOLE_IS_SCLP)
 
 
 
 
 
 
 
 216		add_preferred_console("ttyS", 0, NULL);
 217	else if (CONSOLE_IS_3270)
 218		add_preferred_console("tty3270", 0, NULL);
 219	else if (CONSOLE_IS_VT220)
 220		add_preferred_console("ttysclp", 0, NULL);
 221	else if (CONSOLE_IS_HVC)
 222		add_preferred_console("hvc", 0, NULL);
 223}
 224
 225static int __init conmode_setup(char *str)
 226{
 227#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 228	if (!strcmp(str, "hwc") || !strcmp(str, "sclp"))
 229                SET_CONSOLE_SCLP;
 230#endif
 231#if defined(CONFIG_TN3215_CONSOLE)
 232	if (!strcmp(str, "3215"))
 233		SET_CONSOLE_3215;
 234#endif
 235#if defined(CONFIG_TN3270_CONSOLE)
 236	if (!strcmp(str, "3270"))
 237		SET_CONSOLE_3270;
 238#endif
 239	set_preferred_console();
 240        return 1;
 241}
 242
 243__setup("conmode=", conmode_setup);
 244
 245static void __init conmode_default(void)
 246{
 247	char query_buffer[1024];
 248	char *ptr;
 249
 250        if (MACHINE_IS_VM) {
 251		cpcmd("QUERY CONSOLE", query_buffer, 1024, NULL);
 252		console_devno = simple_strtoul(query_buffer + 5, NULL, 16);
 253		ptr = strstr(query_buffer, "SUBCHANNEL =");
 254		console_irq = simple_strtoul(ptr + 13, NULL, 16);
 255		cpcmd("QUERY TERM", query_buffer, 1024, NULL);
 256		ptr = strstr(query_buffer, "CONMODE");
 257		/*
 258		 * Set the conmode to 3215 so that the device recognition 
 259		 * will set the cu_type of the console to 3215. If the
 260		 * conmode is 3270 and we don't set it back then both
 261		 * 3215 and the 3270 driver will try to access the console
 262		 * device (3215 as console and 3270 as normal tty).
 263		 */
 264		cpcmd("TERM CONMODE 3215", NULL, 0, NULL);
 265		if (ptr == NULL) {
 266#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 267			SET_CONSOLE_SCLP;
 268#endif
 269			return;
 270		}
 271		if (str_has_prefix(ptr + 8, "3270")) {
 272#if defined(CONFIG_TN3270_CONSOLE)
 273			SET_CONSOLE_3270;
 274#elif defined(CONFIG_TN3215_CONSOLE)
 275			SET_CONSOLE_3215;
 276#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 277			SET_CONSOLE_SCLP;
 278#endif
 279		} else if (str_has_prefix(ptr + 8, "3215")) {
 280#if defined(CONFIG_TN3215_CONSOLE)
 281			SET_CONSOLE_3215;
 282#elif defined(CONFIG_TN3270_CONSOLE)
 283			SET_CONSOLE_3270;
 284#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 285			SET_CONSOLE_SCLP;
 286#endif
 287		}
 288	} else if (MACHINE_IS_KVM) {
 289		if (sclp.has_vt220 && IS_ENABLED(CONFIG_SCLP_VT220_CONSOLE))
 290			SET_CONSOLE_VT220;
 291		else if (sclp.has_linemode && IS_ENABLED(CONFIG_SCLP_CONSOLE))
 292			SET_CONSOLE_SCLP;
 293		else
 294			SET_CONSOLE_HVC;
 295	} else {
 296#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 297		SET_CONSOLE_SCLP;
 298#endif
 299	}
 300}
 301
 302#ifdef CONFIG_CRASH_DUMP
 303static void __init setup_zfcpdump(void)
 304{
 305	if (!is_ipl_type_dump())
 306		return;
 307	if (oldmem_data.start)
 308		return;
 309	strcat(boot_command_line, " cio_ignore=all,!ipldev,!condev");
 310	console_loglevel = 2;
 311}
 312#else
 313static inline void setup_zfcpdump(void) {}
 314#endif /* CONFIG_CRASH_DUMP */
 315
 316 /*
 317 * Reboot, halt and power_off stubs. They just call _machine_restart,
 318 * _machine_halt or _machine_power_off. 
 319 */
 320
 321void machine_restart(char *command)
 322{
 323	if ((!in_interrupt() && !in_atomic()) || oops_in_progress)
 324		/*
 325		 * Only unblank the console if we are called in enabled
 326		 * context or a bust_spinlocks cleared the way for us.
 327		 */
 328		console_unblank();
 329	_machine_restart(command);
 330}
 331
 332void machine_halt(void)
 333{
 334	if (!in_interrupt() || oops_in_progress)
 335		/*
 336		 * Only unblank the console if we are called in enabled
 337		 * context or a bust_spinlocks cleared the way for us.
 338		 */
 339		console_unblank();
 340	_machine_halt();
 341}
 342
 343void machine_power_off(void)
 344{
 345	if (!in_interrupt() || oops_in_progress)
 346		/*
 347		 * Only unblank the console if we are called in enabled
 348		 * context or a bust_spinlocks cleared the way for us.
 349		 */
 350		console_unblank();
 351	_machine_power_off();
 352}
 353
 354/*
 355 * Dummy power off function.
 356 */
 357void (*pm_power_off)(void) = machine_power_off;
 358EXPORT_SYMBOL_GPL(pm_power_off);
 359
 360void *restart_stack;
 361
 362unsigned long stack_alloc(void)
 363{
 364#ifdef CONFIG_VMAP_STACK
 365	void *ret;
 366
 367	ret = __vmalloc_node(THREAD_SIZE, THREAD_SIZE, THREADINFO_GFP,
 368			     NUMA_NO_NODE, __builtin_return_address(0));
 369	kmemleak_not_leak(ret);
 370	return (unsigned long)ret;
 371#else
 372	return __get_free_pages(GFP_KERNEL, THREAD_SIZE_ORDER);
 373#endif
 374}
 375
 376void stack_free(unsigned long stack)
 377{
 378#ifdef CONFIG_VMAP_STACK
 379	vfree((void *) stack);
 380#else
 381	free_pages(stack, THREAD_SIZE_ORDER);
 382#endif
 383}
 
 384
 385int __init arch_early_irq_init(void)
 386{
 387	unsigned long stack;
 388
 389	stack = __get_free_pages(GFP_KERNEL, THREAD_SIZE_ORDER);
 390	if (!stack)
 391		panic("Couldn't allocate async stack");
 392	S390_lowcore.async_stack = stack + STACK_INIT_OFFSET;
 393	return 0;
 394}
 
 395
 396void __init arch_call_rest_init(void)
 397{
 398	unsigned long stack;
 399
 400	smp_reinit_ipl_cpu();
 401	stack = stack_alloc();
 402	if (!stack)
 403		panic("Couldn't allocate kernel stack");
 404	current->stack = (void *) stack;
 405#ifdef CONFIG_VMAP_STACK
 406	current->stack_vm_area = (void *) stack;
 407#endif
 408	set_task_stack_end_magic(current);
 409	stack += STACK_INIT_OFFSET;
 410	S390_lowcore.kernel_stack = stack;
 411	call_on_stack_noreturn(rest_init, stack);
 412}
 413
 414static void __init setup_lowcore_dat_off(void)
 415{
 416	unsigned long int_psw_mask = PSW_KERNEL_BITS;
 417	struct lowcore *abs_lc, *lc;
 418	unsigned long mcck_stack;
 419	unsigned long flags;
 420
 421	if (IS_ENABLED(CONFIG_KASAN))
 422		int_psw_mask |= PSW_MASK_DAT;
 423
 424	/*
 425	 * Setup lowcore for boot cpu
 426	 */
 427	BUILD_BUG_ON(sizeof(struct lowcore) != LC_PAGES * PAGE_SIZE);
 428	lc = memblock_alloc_low(sizeof(*lc), sizeof(*lc));
 429	if (!lc)
 430		panic("%s: Failed to allocate %zu bytes align=%zx\n",
 431		      __func__, sizeof(*lc), sizeof(*lc));
 432
 433	lc->restart_psw.mask = PSW_KERNEL_BITS;
 434	lc->restart_psw.addr = (unsigned long) restart_int_handler;
 435	lc->external_new_psw.mask = int_psw_mask | PSW_MASK_MCHECK;
 436	lc->external_new_psw.addr = (unsigned long) ext_int_handler;
 437	lc->svc_new_psw.mask = int_psw_mask | PSW_MASK_MCHECK;
 438	lc->svc_new_psw.addr = (unsigned long) system_call;
 439	lc->program_new_psw.mask = int_psw_mask | PSW_MASK_MCHECK;
 440	lc->program_new_psw.addr = (unsigned long) pgm_check_handler;
 441	lc->mcck_new_psw.mask = int_psw_mask;
 442	lc->mcck_new_psw.addr = (unsigned long) mcck_int_handler;
 443	lc->io_new_psw.mask = int_psw_mask | PSW_MASK_MCHECK;
 444	lc->io_new_psw.addr = (unsigned long) io_int_handler;
 445	lc->clock_comparator = clock_comparator_max;
 446	lc->nodat_stack = ((unsigned long) &init_thread_union)
 
 
 
 
 
 
 
 
 447		+ THREAD_SIZE - STACK_FRAME_OVERHEAD - sizeof(struct pt_regs);
 448	lc->current_task = (unsigned long)&init_task;
 449	lc->lpp = LPP_MAGIC;
 
 
 
 
 
 
 450	lc->machine_flags = S390_lowcore.machine_flags;
 451	lc->preempt_count = S390_lowcore.preempt_count;
 452	nmi_alloc_mcesa_early(&lc->mcesad);
 453	lc->sys_enter_timer = S390_lowcore.sys_enter_timer;
 
 
 
 
 
 
 
 
 
 
 
 
 454	lc->exit_timer = S390_lowcore.exit_timer;
 455	lc->user_timer = S390_lowcore.user_timer;
 456	lc->system_timer = S390_lowcore.system_timer;
 457	lc->steal_timer = S390_lowcore.steal_timer;
 458	lc->last_update_timer = S390_lowcore.last_update_timer;
 459	lc->last_update_clock = S390_lowcore.last_update_clock;
 
 460
 461	/*
 462	 * Allocate the global restart stack which is the same for
 463	 * all CPUs in cast *one* of them does a PSW restart.
 464	 */
 465	restart_stack = memblock_alloc(THREAD_SIZE, THREAD_SIZE);
 466	if (!restart_stack)
 467		panic("%s: Failed to allocate %lu bytes align=0x%lx\n",
 468		      __func__, THREAD_SIZE, THREAD_SIZE);
 469	restart_stack += STACK_INIT_OFFSET;
 470
 471	/*
 472	 * Set up PSW restart to call ipl.c:do_restart(). Copy the relevant
 473	 * restart data to the absolute zero lowcore. This is necessary if
 474	 * PSW restart is done on an offline CPU that has lowcore zero.
 475	 */
 476	lc->restart_stack = (unsigned long) restart_stack;
 477	lc->restart_fn = (unsigned long) do_restart;
 478	lc->restart_data = 0;
 479	lc->restart_source = -1U;
 480
 481	abs_lc = get_abs_lowcore(&flags);
 482	abs_lc->restart_stack = lc->restart_stack;
 483	abs_lc->restart_fn = lc->restart_fn;
 484	abs_lc->restart_data = lc->restart_data;
 485	abs_lc->restart_source = lc->restart_source;
 486	abs_lc->restart_psw = lc->restart_psw;
 487	abs_lc->mcesad = lc->mcesad;
 488	put_abs_lowcore(abs_lc, flags);
 489
 490	mcck_stack = (unsigned long)memblock_alloc(THREAD_SIZE, THREAD_SIZE);
 491	if (!mcck_stack)
 492		panic("%s: Failed to allocate %lu bytes align=0x%lx\n",
 493		      __func__, THREAD_SIZE, THREAD_SIZE);
 494	lc->mcck_stack = mcck_stack + STACK_INIT_OFFSET;
 495
 496	lc->spinlock_lockval = arch_spin_lockval(0);
 497	lc->spinlock_index = 0;
 498	arch_spin_lock_setup(0);
 499	lc->return_lpswe = gen_lpswe(__LC_RETURN_PSW);
 500	lc->return_mcck_lpswe = gen_lpswe(__LC_RETURN_MCCK_PSW);
 501	lc->preempt_count = PREEMPT_DISABLED;
 502
 503	set_prefix(__pa(lc));
 504	lowcore_ptr[0] = lc;
 505}
 506
 507static void __init setup_lowcore_dat_on(void)
 508{
 509	struct lowcore *abs_lc;
 510	unsigned long flags;
 511	int i;
 512
 513	__ctl_clear_bit(0, 28);
 514	S390_lowcore.external_new_psw.mask |= PSW_MASK_DAT;
 515	S390_lowcore.svc_new_psw.mask |= PSW_MASK_DAT;
 516	S390_lowcore.program_new_psw.mask |= PSW_MASK_DAT;
 517	S390_lowcore.mcck_new_psw.mask |= PSW_MASK_DAT;
 518	S390_lowcore.io_new_psw.mask |= PSW_MASK_DAT;
 519	__ctl_set_bit(0, 28);
 520	__ctl_store(S390_lowcore.cregs_save_area, 0, 15);
 521	if (abs_lowcore_map(0, lowcore_ptr[0], true))
 522		panic("Couldn't setup absolute lowcore");
 523	abs_lowcore_mapped = true;
 524	abs_lc = get_abs_lowcore(&flags);
 525	abs_lc->restart_flags = RESTART_FLAG_CTLREGS;
 526	abs_lc->program_new_psw = S390_lowcore.program_new_psw;
 527	for (i = 0; i < 16; i++)
 528		abs_lc->cregs_save_area[i] = S390_lowcore.cregs_save_area[i];
 529	put_abs_lowcore(abs_lc, flags);
 530}
 531
 532static struct resource code_resource = {
 533	.name  = "Kernel code",
 534	.flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
 535};
 536
 537static struct resource data_resource = {
 538	.name = "Kernel data",
 539	.flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
 540};
 541
 542static struct resource bss_resource = {
 543	.name = "Kernel bss",
 544	.flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
 545};
 546
 547static struct resource __initdata *standard_resources[] = {
 548	&code_resource,
 549	&data_resource,
 550	&bss_resource,
 551};
 552
 553static void __init setup_resources(void)
 554{
 555	struct resource *res, *std_res, *sub_res;
 556	phys_addr_t start, end;
 557	int j;
 558	u64 i;
 559
 560	code_resource.start = (unsigned long) _text;
 561	code_resource.end = (unsigned long) _etext - 1;
 562	data_resource.start = (unsigned long) _etext;
 563	data_resource.end = (unsigned long) _edata - 1;
 564	bss_resource.start = (unsigned long) __bss_start;
 565	bss_resource.end = (unsigned long) __bss_stop - 1;
 566
 567	for_each_mem_range(i, &start, &end) {
 568		res = memblock_alloc(sizeof(*res), 8);
 569		if (!res)
 570			panic("%s: Failed to allocate %zu bytes align=0x%x\n",
 571			      __func__, sizeof(*res), 8);
 572		res->flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM;
 573
 574		res->name = "System RAM";
 575		res->start = start;
 576		/*
 577		 * In memblock, end points to the first byte after the
 578		 * range while in resourses, end points to the last byte in
 579		 * the range.
 580		 */
 581		res->end = end - 1;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 582		request_resource(&iomem_resource, res);
 583
 584		for (j = 0; j < ARRAY_SIZE(standard_resources); j++) {
 585			std_res = standard_resources[j];
 586			if (std_res->start < res->start ||
 587			    std_res->start > res->end)
 588				continue;
 589			if (std_res->end > res->end) {
 590				sub_res = memblock_alloc(sizeof(*sub_res), 8);
 591				if (!sub_res)
 592					panic("%s: Failed to allocate %zu bytes align=0x%x\n",
 593					      __func__, sizeof(*sub_res), 8);
 594				*sub_res = *std_res;
 595				sub_res->end = res->end;
 596				std_res->start = res->end + 1;
 597				request_resource(res, sub_res);
 598			} else {
 599				request_resource(res, std_res);
 600			}
 601		}
 602	}
 603#ifdef CONFIG_CRASH_DUMP
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 604	/*
 605	 * Re-add removed crash kernel memory as reserved memory. This makes
 606	 * sure it will be mapped with the identity mapping and struct pages
 607	 * will be created, so it can be resized later on.
 608	 * However add it later since the crash kernel resource should not be
 609	 * part of the System RAM resource.
 610	 */
 611	if (crashk_res.end) {
 612		memblock_add_node(crashk_res.start, resource_size(&crashk_res),
 613				  0, MEMBLOCK_NONE);
 614		memblock_reserve(crashk_res.start, resource_size(&crashk_res));
 615		insert_resource(&iomem_resource, &crashk_res);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 616	}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 617#endif
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 618}
 619
 620static void __init setup_memory_end(void)
 621{
 622	memblock_remove(ident_map_size, PHYS_ADDR_MAX - ident_map_size);
 623	max_pfn = max_low_pfn = PFN_DOWN(ident_map_size);
 624	pr_notice("The maximum memory size is %luMB\n", ident_map_size >> 20);
 625}
 626
 627#ifdef CONFIG_CRASH_DUMP
 628
 629/*
 630 * When kdump is enabled, we have to ensure that no memory from the area
 631 * [0 - crashkernel memory size] is set offline - it will be exchanged with
 632 * the crashkernel memory region when kdump is triggered. The crashkernel
 633 * memory region can never get offlined (pages are unmovable).
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 634 */
 635static int kdump_mem_notifier(struct notifier_block *nb,
 636			      unsigned long action, void *data)
 637{
 638	struct memory_notify *arg = data;
 639
 640	if (action != MEM_GOING_OFFLINE)
 641		return NOTIFY_OK;
 642	if (arg->start_pfn < PFN_DOWN(resource_size(&crashk_res)))
 643		return NOTIFY_BAD;
 644	return NOTIFY_OK;
 
 
 
 
 645}
 646
 647static struct notifier_block kdump_mem_nb = {
 648	.notifier_call = kdump_mem_notifier,
 649};
 650
 651#endif
 652
 653/*
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 654 * Reserve memory for kdump kernel to be loaded with kexec
 655 */
 656static void __init reserve_crashkernel(void)
 657{
 658#ifdef CONFIG_CRASH_DUMP
 659	unsigned long long crash_base, crash_size;
 660	phys_addr_t low, high;
 661	int rc;
 662
 663	rc = parse_crashkernel(boot_command_line, ident_map_size, &crash_size,
 664			       &crash_base);
 665
 666	crash_base = ALIGN(crash_base, KEXEC_CRASH_MEM_ALIGN);
 667	crash_size = ALIGN(crash_size, KEXEC_CRASH_MEM_ALIGN);
 668	if (rc || crash_size == 0)
 669		return;
 670
 671	if (memblock.memory.regions[0].size < crash_size) {
 672		pr_info("crashkernel reservation failed: %s\n",
 673			"first memory chunk must be at least crashkernel size");
 674		return;
 675	}
 676
 677	low = crash_base ?: oldmem_data.start;
 678	high = low + crash_size;
 679	if (low >= oldmem_data.start && high <= oldmem_data.start + oldmem_data.size) {
 680		/* The crashkernel fits into OLDMEM, reuse OLDMEM */
 681		crash_base = low;
 682	} else {
 683		/* Find suitable area in free memory */
 684		low = max_t(unsigned long, crash_size, sclp.hsa_size);
 685		high = crash_base ? crash_base + crash_size : ULONG_MAX;
 686
 687		if (crash_base && crash_base < low) {
 688			pr_info("crashkernel reservation failed: %s\n",
 689				"crash_base too low");
 690			return;
 691		}
 692		low = crash_base ?: low;
 693		crash_base = memblock_phys_alloc_range(crash_size,
 694						       KEXEC_CRASH_MEM_ALIGN,
 695						       low, high);
 696	}
 697
 698	if (!crash_base) {
 699		pr_info("crashkernel reservation failed: %s\n",
 700			"no suitable area found");
 701		return;
 702	}
 703
 704	if (register_memory_notifier(&kdump_mem_nb)) {
 705		memblock_phys_free(crash_base, crash_size);
 706		return;
 707	}
 708
 709	if (!oldmem_data.start && MACHINE_IS_VM)
 710		diag10_range(PFN_DOWN(crash_base), PFN_DOWN(crash_size));
 711	crashk_res.start = crash_base;
 712	crashk_res.end = crash_base + crash_size - 1;
 713	memblock_remove(crash_base, crash_size);
 
 714	pr_info("Reserving %lluMB of memory at %lluMB "
 715		"for crashkernel (System RAM: %luMB)\n",
 716		crash_size >> 20, crash_base >> 20,
 717		(unsigned long)memblock.memory.total_size >> 20);
 718	os_info_crashkernel_add(crash_base, crash_size);
 719#endif
 720}
 721
 722/*
 723 * Reserve the initrd from being used by memblock
 724 */
 725static void __init reserve_initrd(void)
 726{
 727#ifdef CONFIG_BLK_DEV_INITRD
 728	if (!initrd_data.start || !initrd_data.size)
 729		return;
 730	initrd_start = (unsigned long)__va(initrd_data.start);
 731	initrd_end = initrd_start + initrd_data.size;
 732	memblock_reserve(initrd_data.start, initrd_data.size);
 733#endif
 734}
 735
 736/*
 737 * Reserve the memory area used to pass the certificate lists
 738 */
 739static void __init reserve_certificate_list(void)
 740{
 741	if (ipl_cert_list_addr)
 742		memblock_reserve(ipl_cert_list_addr, ipl_cert_list_size);
 743}
 744
 745static void __init reserve_mem_detect_info(void)
 746{
 747	unsigned long start, size;
 
 
 748
 749	get_mem_detect_reserved(&start, &size);
 750	if (size)
 751		memblock_reserve(start, size);
 752}
 753
 754static void __init free_mem_detect_info(void)
 755{
 756	unsigned long start, size;
 757
 758	get_mem_detect_reserved(&start, &size);
 759	if (size)
 760		memblock_phys_free(start, size);
 761}
 762
 763static const char * __init get_mem_info_source(void)
 764{
 765	switch (mem_detect.info_source) {
 766	case MEM_DETECT_SCLP_STOR_INFO:
 767		return "sclp storage info";
 768	case MEM_DETECT_DIAG260:
 769		return "diag260";
 770	case MEM_DETECT_SCLP_READ_INFO:
 771		return "sclp read info";
 772	case MEM_DETECT_BIN_SEARCH:
 773		return "binary search";
 
 
 
 
 
 
 
 
 
 
 
 
 774	}
 775	return "none";
 776}
 777
 778static void __init memblock_add_mem_detect_info(void)
 779{
 780	unsigned long start, end;
 781	int i;
 782
 783	pr_debug("physmem info source: %s (%hhd)\n",
 784		 get_mem_info_source(), mem_detect.info_source);
 785	/* keep memblock lists close to the kernel */
 786	memblock_set_bottom_up(true);
 787	for_each_mem_detect_block(i, &start, &end) {
 788		memblock_add(start, end - start);
 789		memblock_physmem_add(start, end - start);
 790	}
 791	memblock_set_bottom_up(false);
 792	memblock_set_node(0, ULONG_MAX, &memblock.memory, 0);
 793}
 794
 795/*
 796 * Check for initrd being in usable memory
 797 */
 798static void __init check_initrd(void)
 799{
 800#ifdef CONFIG_BLK_DEV_INITRD
 801	if (initrd_data.start && initrd_data.size &&
 802	    !memblock_is_region_memory(initrd_data.start, initrd_data.size)) {
 803		pr_err("The initial RAM disk does not fit into the memory\n");
 804		memblock_phys_free(initrd_data.start, initrd_data.size);
 805		initrd_start = initrd_end = 0;
 
 
 
 806	}
 807#endif
 808}
 809
 810/*
 811 * Reserve memory used for lowcore/command line/kernel image.
 812 */
 813static void __init reserve_kernel(void)
 814{
 815	memblock_reserve(0, STARTUP_NORMAL_OFFSET);
 816	memblock_reserve(OLDMEM_BASE, sizeof(unsigned long));
 817	memblock_reserve(OLDMEM_SIZE, sizeof(unsigned long));
 818	memblock_reserve(__amode31_base, __eamode31 - __samode31);
 819	memblock_reserve(__pa(sclp_early_sccb), EXT_SCCB_READ_SCP);
 820	memblock_reserve(__pa(_stext), _end - _stext);
 821}
 822
 823static void __init setup_memory(void)
 824{
 825	phys_addr_t start, end;
 826	u64 i;
 827
 828	/*
 829	 * Init storage key for present memory
 830	 */
 831	for_each_mem_range(i, &start, &end)
 832		storage_key_init_range(start, end);
 833
 834	psw_set_key(PAGE_DEFAULT_KEY);
 835}
 
 
 
 
 
 
 
 836
 837static void __init relocate_amode31_section(void)
 838{
 839	unsigned long amode31_size = __eamode31 - __samode31;
 840	long amode31_offset = __amode31_base - __samode31;
 841	long *ptr;
 842
 843	pr_info("Relocating AMODE31 section of size 0x%08lx\n", amode31_size);
 844
 845	/* Move original AMODE31 section to the new one */
 846	memmove((void *)__amode31_base, (void *)__samode31, amode31_size);
 847	/* Zero out the old AMODE31 section to catch invalid accesses within it */
 848	memset((void *)__samode31, 0, amode31_size);
 849
 850	/* Update all AMODE31 region references */
 851	for (ptr = _start_amode31_refs; ptr != _end_amode31_refs; ptr++)
 852		*ptr += amode31_offset;
 853}
 854
 855/* This must be called after AMODE31 relocation */
 856static void __init setup_cr(void)
 857{
 858	union ctlreg2 cr2;
 859	union ctlreg5 cr5;
 860	union ctlreg15 cr15;
 861
 862	__ctl_duct[1] = (unsigned long)__ctl_aste;
 863	__ctl_duct[2] = (unsigned long)__ctl_aste;
 864	__ctl_duct[4] = (unsigned long)__ctl_duald;
 865
 866	/* Update control registers CR2, CR5 and CR15 */
 867	__ctl_store(cr2.val, 2, 2);
 868	__ctl_store(cr5.val, 5, 5);
 869	__ctl_store(cr15.val, 15, 15);
 870	cr2.ducto = (unsigned long)__ctl_duct >> 6;
 871	cr5.pasteo = (unsigned long)__ctl_duct >> 6;
 872	cr15.lsea = (unsigned long)__ctl_linkage_stack >> 3;
 873	__ctl_load(cr2.val, 2, 2);
 874	__ctl_load(cr5.val, 5, 5);
 875	__ctl_load(cr15.val, 15, 15);
 876}
 877
 878/*
 879 * Add system information as device randomness
 880 */
 881static void __init setup_randomness(void)
 882{
 883	struct sysinfo_3_2_2 *vmms;
 884
 885	vmms = memblock_alloc(PAGE_SIZE, PAGE_SIZE);
 886	if (!vmms)
 887		panic("Failed to allocate memory for sysinfo structure\n");
 888	if (stsi(vmms, 3, 2, 2) == 0 && vmms->count)
 889		add_device_randomness(&vmms->vm, sizeof(vmms->vm[0]) * vmms->count);
 890	memblock_free(vmms, PAGE_SIZE);
 891
 892	if (cpacf_query_func(CPACF_PRNO, CPACF_PRNO_TRNG))
 893		static_branch_enable(&s390_arch_random_available);
 894}
 895
 896/*
 897 * Find the correct size for the task_struct. This depends on
 898 * the size of the struct fpu at the end of the thread_struct
 899 * which is embedded in the task_struct.
 900 */
 901static void __init setup_task_size(void)
 902{
 903	int task_size = sizeof(struct task_struct);
 
 
 
 
 
 
 
 
 
 
 
 
 
 904
 905	if (!MACHINE_HAS_VX) {
 906		task_size -= sizeof(__vector128) * __NUM_VXRS;
 907		task_size += sizeof(freg_t) * __NUM_FPRS;
 908	}
 909	arch_task_struct_size = task_size;
 910}
 911
 912/*
 913 * Issue diagnose 318 to set the control program name and
 914 * version codes.
 915 */
 916static void __init setup_control_program_code(void)
 917{
 918	union diag318_info diag318_info = {
 919		.cpnc = CPNC_LINUX,
 920		.cpvc = 0,
 921	};
 
 
 
 
 
 922
 923	if (!sclp.has_diag318)
 924		return;
 
 
 
 925
 926	diag_stat_inc(DIAG_STAT_X318);
 927	asm volatile("diag %0,0,0x318\n" : : "d" (diag318_info.val));
 928}
 
 
 
 929
 930/*
 931 * Print the component list from the IPL report
 932 */
 933static void __init log_component_list(void)
 934{
 935	struct ipl_rb_component_entry *ptr, *end;
 936	char *str;
 937
 938	if (!early_ipl_comp_list_addr)
 939		return;
 940	if (ipl_block.hdr.flags & IPL_PL_FLAG_SIPL)
 941		pr_info("Linux is running with Secure-IPL enabled\n");
 942	else
 943		pr_info("Linux is running with Secure-IPL disabled\n");
 944	ptr = (void *) early_ipl_comp_list_addr;
 945	end = (void *) ptr + early_ipl_comp_list_size;
 946	pr_info("The IPL report contains the following components:\n");
 947	while (ptr < end) {
 948		if (ptr->flags & IPL_RB_COMPONENT_FLAG_SIGNED) {
 949			if (ptr->flags & IPL_RB_COMPONENT_FLAG_VERIFIED)
 950				str = "signed, verified";
 951			else
 952				str = "signed, verification failed";
 953		} else {
 954			str = "not signed";
 955		}
 956		pr_info("%016llx - %016llx (%s)\n",
 957			ptr->addr, ptr->addr + ptr->len, str);
 958		ptr++;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 959	}
 960}
 961
 962/*
 963 * Setup function called from init/main.c just after the banner
 964 * was printed.
 965 */
 966
 967void __init setup_arch(char **cmdline_p)
 968{
 969        /*
 970         * print what head.S has found out about the machine
 971         */
 
 
 
 
 
 
 
 
 
 
 
 
 
 972	if (MACHINE_IS_VM)
 973		pr_info("Linux is running as a z/VM "
 974			"guest operating system in 64-bit mode\n");
 975	else if (MACHINE_IS_KVM)
 976		pr_info("Linux is running under KVM in 64-bit mode\n");
 977	else if (MACHINE_IS_LPAR)
 978		pr_info("Linux is running natively in 64-bit mode\n");
 979	else
 980		pr_info("Linux is running as a guest in 64-bit mode\n");
 981
 982	log_component_list();
 983
 984	/* Have one command line that is parsed and saved in /proc/cmdline */
 985	/* boot_command_line has been already set up in early.c */
 986	*cmdline_p = boot_command_line;
 987
 988        ROOT_DEV = Root_RAM0;
 989
 990	setup_initial_init_mm(_text, _etext, _edata, _end);
 991
 992	if (IS_ENABLED(CONFIG_EXPOLINE_AUTO))
 993		nospec_auto_detect();
 994
 995	jump_label_init();
 996	parse_early_param();
 997#ifdef CONFIG_CRASH_DUMP
 998	/* Deactivate elfcorehdr= kernel parameter */
 999	elfcorehdr_addr = ELFCORE_ADDR_MAX;
1000#endif
1001
1002	os_info_init();
1003	setup_ipl();
1004	setup_task_size();
1005	setup_control_program_code();
1006
1007	/* Do some memory reservations *before* memory is added to memblock */
1008	reserve_kernel();
1009	reserve_initrd();
1010	reserve_certificate_list();
1011	reserve_mem_detect_info();
1012	memblock_set_current_limit(ident_map_size);
1013	memblock_allow_resize();
1014
1015	/* Get information about *all* installed memory */
1016	memblock_add_mem_detect_info();
1017
1018	free_mem_detect_info();
1019	setup_memory_end();
1020	memblock_dump_all();
1021	setup_memory();
1022
1023	relocate_amode31_section();
1024	setup_cr();
1025	setup_uv();
1026	dma_contiguous_reserve(ident_map_size);
1027	vmcp_cma_reserve();
1028	if (MACHINE_HAS_EDAT2)
1029		hugetlb_cma_reserve(PUD_SHIFT - PAGE_SHIFT);
1030
1031	check_initrd();
1032	reserve_crashkernel();
1033#ifdef CONFIG_CRASH_DUMP
1034	/*
1035	 * Be aware that smp_save_dump_secondary_cpus() triggers a system reset.
1036	 * Therefore CPU and device initialization should be done afterwards.
1037	 */
1038	smp_save_dump_secondary_cpus();
1039#endif
1040
1041	setup_resources();
1042	setup_lowcore_dat_off();
 
 
1043	smp_fill_possible_mask();
1044	cpu_detect_mhz_feature();
1045        cpu_init();
1046	numa_setup();
1047	smp_detect_cpus();
1048	topology_init_early();
1049
1050	if (test_facility(193))
1051		static_branch_enable(&cpu_has_bear);
 
 
1052
1053	/*
1054	 * Create kernel page tables and switch to virtual addressing.
1055	 */
1056        paging_init();
1057	memcpy_real_init();
1058	/*
1059	 * After paging_init created the kernel page table, the new PSWs
1060	 * in lowcore can now run with DAT enabled.
1061	 */
1062	setup_lowcore_dat_on();
1063#ifdef CONFIG_CRASH_DUMP
1064	smp_save_dump_ipl_cpu();
1065#endif
1066
1067        /* Setup default console */
1068	conmode_default();
1069	set_preferred_console();
1070
1071	apply_alternative_instructions();
1072	if (IS_ENABLED(CONFIG_EXPOLINE))
1073		nospec_init_branches();
1074
1075	/* Setup zfcp/nvme dump support */
1076	setup_zfcpdump();
 
1077
1078	/* Add system specific data to the random pool */
1079	setup_randomness();
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1080}
v3.15
 
   1/*
   2 *  S390 version
   3 *    Copyright IBM Corp. 1999, 2012
   4 *    Author(s): Hartmut Penner (hp@de.ibm.com),
   5 *               Martin Schwidefsky (schwidefsky@de.ibm.com)
   6 *
   7 *  Derived from "arch/i386/kernel/setup.c"
   8 *    Copyright (C) 1995, Linus Torvalds
   9 */
  10
  11/*
  12 * This file handles the architecture-dependent parts of initialization
  13 */
  14
  15#define KMSG_COMPONENT "setup"
  16#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
  17
  18#include <linux/errno.h>
  19#include <linux/export.h>
  20#include <linux/sched.h>
 
 
  21#include <linux/kernel.h>
  22#include <linux/memblock.h>
  23#include <linux/mm.h>
  24#include <linux/stddef.h>
  25#include <linux/unistd.h>
  26#include <linux/ptrace.h>
 
  27#include <linux/user.h>
  28#include <linux/tty.h>
  29#include <linux/ioport.h>
  30#include <linux/delay.h>
  31#include <linux/init.h>
  32#include <linux/initrd.h>
  33#include <linux/bootmem.h>
  34#include <linux/root_dev.h>
  35#include <linux/console.h>
  36#include <linux/kernel_stat.h>
 
  37#include <linux/device.h>
  38#include <linux/notifier.h>
  39#include <linux/pfn.h>
  40#include <linux/ctype.h>
  41#include <linux/reboot.h>
  42#include <linux/topology.h>
  43#include <linux/ftrace.h>
  44#include <linux/kexec.h>
  45#include <linux/crash_dump.h>
  46#include <linux/memory.h>
  47#include <linux/compat.h>
 
 
 
  48
 
 
  49#include <asm/ipl.h>
  50#include <asm/facility.h>
  51#include <asm/smp.h>
  52#include <asm/mmu_context.h>
  53#include <asm/cpcmd.h>
  54#include <asm/lowcore.h>
 
  55#include <asm/irq.h>
  56#include <asm/page.h>
  57#include <asm/ptrace.h>
  58#include <asm/sections.h>
  59#include <asm/ebcdic.h>
  60#include <asm/kvm_virtio.h>
  61#include <asm/diag.h>
  62#include <asm/os_info.h>
  63#include <asm/sclp.h>
 
 
 
 
 
 
 
 
 
  64#include "entry.h"
  65
  66/*
  67 * Machine setup..
  68 */
  69unsigned int console_mode = 0;
  70EXPORT_SYMBOL(console_mode);
  71
  72unsigned int console_devno = -1;
  73EXPORT_SYMBOL(console_devno);
  74
  75unsigned int console_irq = -1;
  76EXPORT_SYMBOL(console_irq);
  77
  78unsigned long elf_hwcap = 0;
  79char elf_platform[ELF_PLATFORM_SIZE];
 
 
 
 
 
 
 
 
 
  80
  81struct mem_chunk __initdata memory_chunk[MEMORY_CHUNKS];
 
 
 
 
 
 
 
 
 
 
 
 
  82
  83int __initdata memory_end_set;
  84unsigned long __initdata memory_end;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
  85
  86unsigned long VMALLOC_START;
  87EXPORT_SYMBOL(VMALLOC_START);
  88
  89unsigned long VMALLOC_END;
  90EXPORT_SYMBOL(VMALLOC_END);
  91
  92struct page *vmemmap;
  93EXPORT_SYMBOL(vmemmap);
 
  94
  95#ifdef CONFIG_64BIT
  96unsigned long MODULES_VADDR;
  97unsigned long MODULES_END;
  98#endif
  99
 100/* An array with a pointer to the lowcore of every CPU. */
 101struct _lowcore *lowcore_ptr[NR_CPUS];
 102EXPORT_SYMBOL(lowcore_ptr);
 103
 
 
 
 
 
 
 
 
 104/*
 105 * This is set up by the setup-routine at boot-time
 106 * for S390 need to find out, what we have to setup
 107 * using address 0x10400 ...
 108 */
 109
 110#include <asm/setup.h>
 111
 112/*
 113 * condev= and conmode= setup parameter.
 114 */
 115
 116static int __init condev_setup(char *str)
 117{
 118	int vdev;
 119
 120	vdev = simple_strtoul(str, &str, 0);
 121	if (vdev >= 0 && vdev < 65536) {
 122		console_devno = vdev;
 123		console_irq = -1;
 124	}
 125	return 1;
 126}
 127
 128__setup("condev=", condev_setup);
 129
 130static void __init set_preferred_console(void)
 131{
 132	if (MACHINE_IS_KVM) {
 133		if (sclp_has_vt220())
 134			add_preferred_console("ttyS", 1, NULL);
 135		else if (sclp_has_linemode())
 136			add_preferred_console("ttyS", 0, NULL);
 137		else
 138			add_preferred_console("hvc", 0, NULL);
 139	} else if (CONSOLE_IS_3215 || CONSOLE_IS_SCLP)
 140		add_preferred_console("ttyS", 0, NULL);
 141	else if (CONSOLE_IS_3270)
 142		add_preferred_console("tty3270", 0, NULL);
 
 
 
 
 143}
 144
 145static int __init conmode_setup(char *str)
 146{
 147#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 148	if (strncmp(str, "hwc", 4) == 0 || strncmp(str, "sclp", 5) == 0)
 149                SET_CONSOLE_SCLP;
 150#endif
 151#if defined(CONFIG_TN3215_CONSOLE)
 152	if (strncmp(str, "3215", 5) == 0)
 153		SET_CONSOLE_3215;
 154#endif
 155#if defined(CONFIG_TN3270_CONSOLE)
 156	if (strncmp(str, "3270", 5) == 0)
 157		SET_CONSOLE_3270;
 158#endif
 159	set_preferred_console();
 160        return 1;
 161}
 162
 163__setup("conmode=", conmode_setup);
 164
 165static void __init conmode_default(void)
 166{
 167	char query_buffer[1024];
 168	char *ptr;
 169
 170        if (MACHINE_IS_VM) {
 171		cpcmd("QUERY CONSOLE", query_buffer, 1024, NULL);
 172		console_devno = simple_strtoul(query_buffer + 5, NULL, 16);
 173		ptr = strstr(query_buffer, "SUBCHANNEL =");
 174		console_irq = simple_strtoul(ptr + 13, NULL, 16);
 175		cpcmd("QUERY TERM", query_buffer, 1024, NULL);
 176		ptr = strstr(query_buffer, "CONMODE");
 177		/*
 178		 * Set the conmode to 3215 so that the device recognition 
 179		 * will set the cu_type of the console to 3215. If the
 180		 * conmode is 3270 and we don't set it back then both
 181		 * 3215 and the 3270 driver will try to access the console
 182		 * device (3215 as console and 3270 as normal tty).
 183		 */
 184		cpcmd("TERM CONMODE 3215", NULL, 0, NULL);
 185		if (ptr == NULL) {
 186#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 187			SET_CONSOLE_SCLP;
 188#endif
 189			return;
 190		}
 191		if (strncmp(ptr + 8, "3270", 4) == 0) {
 192#if defined(CONFIG_TN3270_CONSOLE)
 193			SET_CONSOLE_3270;
 194#elif defined(CONFIG_TN3215_CONSOLE)
 195			SET_CONSOLE_3215;
 196#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 197			SET_CONSOLE_SCLP;
 198#endif
 199		} else if (strncmp(ptr + 8, "3215", 4) == 0) {
 200#if defined(CONFIG_TN3215_CONSOLE)
 201			SET_CONSOLE_3215;
 202#elif defined(CONFIG_TN3270_CONSOLE)
 203			SET_CONSOLE_3270;
 204#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 205			SET_CONSOLE_SCLP;
 206#endif
 207		}
 
 
 
 
 
 
 
 208	} else {
 209#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 210		SET_CONSOLE_SCLP;
 211#endif
 212	}
 213}
 214
 215#ifdef CONFIG_ZFCPDUMP
 216static void __init setup_zfcpdump(void)
 217{
 218	if (ipl_info.type != IPL_TYPE_FCP_DUMP)
 219		return;
 220	if (OLDMEM_BASE)
 221		return;
 222	strcat(boot_command_line, " cio_ignore=all,!ipldev,!condev");
 223	console_loglevel = 2;
 224}
 225#else
 226static inline void setup_zfcpdump(void) {}
 227#endif /* CONFIG_ZFCPDUMP */
 228
 229 /*
 230 * Reboot, halt and power_off stubs. They just call _machine_restart,
 231 * _machine_halt or _machine_power_off. 
 232 */
 233
 234void machine_restart(char *command)
 235{
 236	if ((!in_interrupt() && !in_atomic()) || oops_in_progress)
 237		/*
 238		 * Only unblank the console if we are called in enabled
 239		 * context or a bust_spinlocks cleared the way for us.
 240		 */
 241		console_unblank();
 242	_machine_restart(command);
 243}
 244
 245void machine_halt(void)
 246{
 247	if (!in_interrupt() || oops_in_progress)
 248		/*
 249		 * Only unblank the console if we are called in enabled
 250		 * context or a bust_spinlocks cleared the way for us.
 251		 */
 252		console_unblank();
 253	_machine_halt();
 254}
 255
 256void machine_power_off(void)
 257{
 258	if (!in_interrupt() || oops_in_progress)
 259		/*
 260		 * Only unblank the console if we are called in enabled
 261		 * context or a bust_spinlocks cleared the way for us.
 262		 */
 263		console_unblank();
 264	_machine_power_off();
 265}
 266
 267/*
 268 * Dummy power off function.
 269 */
 270void (*pm_power_off)(void) = machine_power_off;
 271EXPORT_SYMBOL_GPL(pm_power_off);
 272
 273static int __init early_parse_mem(char *p)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 274{
 275	memory_end = memparse(p, &p);
 276	memory_end_set = 1;
 277	return 0;
 
 
 278}
 279early_param("mem", early_parse_mem);
 280
 281static int __init parse_vmalloc(char *arg)
 282{
 283	if (!arg)
 284		return -EINVAL;
 285	VMALLOC_END = (memparse(arg, &arg) + PAGE_SIZE - 1) & PAGE_MASK;
 
 
 
 286	return 0;
 287}
 288early_param("vmalloc", parse_vmalloc);
 289
 290void *restart_stack __attribute__((__section__(".data")));
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 291
 292static void __init setup_lowcore(void)
 293{
 294	struct _lowcore *lc;
 
 
 
 
 
 
 295
 296	/*
 297	 * Setup lowcore for boot cpu
 298	 */
 299	BUILD_BUG_ON(sizeof(struct _lowcore) != LC_PAGES * 4096);
 300	lc = __alloc_bootmem_low(LC_PAGES * PAGE_SIZE, LC_PAGES * PAGE_SIZE, 0);
 
 
 
 
 301	lc->restart_psw.mask = PSW_KERNEL_BITS;
 302	lc->restart_psw.addr =
 303		PSW_ADDR_AMODE | (unsigned long) restart_int_handler;
 304	lc->external_new_psw.mask = PSW_KERNEL_BITS |
 305		PSW_MASK_DAT | PSW_MASK_MCHECK;
 306	lc->external_new_psw.addr =
 307		PSW_ADDR_AMODE | (unsigned long) ext_int_handler;
 308	lc->svc_new_psw.mask = PSW_KERNEL_BITS |
 309		PSW_MASK_DAT | PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK;
 310	lc->svc_new_psw.addr = PSW_ADDR_AMODE | (unsigned long) system_call;
 311	lc->program_new_psw.mask = PSW_KERNEL_BITS |
 312		PSW_MASK_DAT | PSW_MASK_MCHECK;
 313	lc->program_new_psw.addr =
 314		PSW_ADDR_AMODE | (unsigned long) pgm_check_handler;
 315	lc->mcck_new_psw.mask = PSW_KERNEL_BITS;
 316	lc->mcck_new_psw.addr =
 317		PSW_ADDR_AMODE | (unsigned long) mcck_int_handler;
 318	lc->io_new_psw.mask = PSW_KERNEL_BITS |
 319		PSW_MASK_DAT | PSW_MASK_MCHECK;
 320	lc->io_new_psw.addr = PSW_ADDR_AMODE | (unsigned long) io_int_handler;
 321	lc->clock_comparator = -1ULL;
 322	lc->kernel_stack = ((unsigned long) &init_thread_union)
 323		+ THREAD_SIZE - STACK_FRAME_OVERHEAD - sizeof(struct pt_regs);
 324	lc->async_stack = (unsigned long)
 325		__alloc_bootmem(ASYNC_SIZE, ASYNC_SIZE, 0)
 326		+ ASYNC_SIZE - STACK_FRAME_OVERHEAD - sizeof(struct pt_regs);
 327	lc->panic_stack = (unsigned long)
 328		__alloc_bootmem(PAGE_SIZE, PAGE_SIZE, 0)
 329		+ PAGE_SIZE - STACK_FRAME_OVERHEAD - sizeof(struct pt_regs);
 330	lc->current_task = (unsigned long) init_thread_union.thread_info.task;
 331	lc->thread_info = (unsigned long) &init_thread_union;
 332	lc->machine_flags = S390_lowcore.machine_flags;
 333	lc->stfl_fac_list = S390_lowcore.stfl_fac_list;
 334	memcpy(lc->stfle_fac_list, S390_lowcore.stfle_fac_list,
 335	       MAX_FACILITY_BIT/8);
 336#ifndef CONFIG_64BIT
 337	if (MACHINE_HAS_IEEE) {
 338		lc->extended_save_area_addr = (__u32)
 339			__alloc_bootmem_low(PAGE_SIZE, PAGE_SIZE, 0);
 340		/* enable extended save area */
 341		__ctl_set_bit(14, 29);
 342	}
 343#else
 344	lc->vdso_per_cpu_data = (unsigned long) &lc->paste[0];
 345#endif
 346	lc->sync_enter_timer = S390_lowcore.sync_enter_timer;
 347	lc->async_enter_timer = S390_lowcore.async_enter_timer;
 348	lc->exit_timer = S390_lowcore.exit_timer;
 349	lc->user_timer = S390_lowcore.user_timer;
 350	lc->system_timer = S390_lowcore.system_timer;
 351	lc->steal_timer = S390_lowcore.steal_timer;
 352	lc->last_update_timer = S390_lowcore.last_update_timer;
 353	lc->last_update_clock = S390_lowcore.last_update_clock;
 354	lc->ftrace_func = S390_lowcore.ftrace_func;
 355
 356	restart_stack = __alloc_bootmem(ASYNC_SIZE, ASYNC_SIZE, 0);
 357	restart_stack += ASYNC_SIZE;
 
 
 
 
 
 
 
 358
 359	/*
 360	 * Set up PSW restart to call ipl.c:do_restart(). Copy the relevant
 361	 * restart data to the absolute zero lowcore. This is necessary if
 362	 * PSW restart is done on an offline CPU that has lowcore zero.
 363	 */
 364	lc->restart_stack = (unsigned long) restart_stack;
 365	lc->restart_fn = (unsigned long) do_restart;
 366	lc->restart_data = 0;
 367	lc->restart_source = -1UL;
 368
 369	/* Setup absolute zero lowcore */
 370	mem_assign_absolute(S390_lowcore.restart_stack, lc->restart_stack);
 371	mem_assign_absolute(S390_lowcore.restart_fn, lc->restart_fn);
 372	mem_assign_absolute(S390_lowcore.restart_data, lc->restart_data);
 373	mem_assign_absolute(S390_lowcore.restart_source, lc->restart_source);
 374	mem_assign_absolute(S390_lowcore.restart_psw, lc->restart_psw);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 375
 376	set_prefix((u32)(unsigned long) lc);
 377	lowcore_ptr[0] = lc;
 378}
 379
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 380static struct resource code_resource = {
 381	.name  = "Kernel code",
 382	.flags = IORESOURCE_BUSY | IORESOURCE_MEM,
 383};
 384
 385static struct resource data_resource = {
 386	.name = "Kernel data",
 387	.flags = IORESOURCE_BUSY | IORESOURCE_MEM,
 388};
 389
 390static struct resource bss_resource = {
 391	.name = "Kernel bss",
 392	.flags = IORESOURCE_BUSY | IORESOURCE_MEM,
 393};
 394
 395static struct resource __initdata *standard_resources[] = {
 396	&code_resource,
 397	&data_resource,
 398	&bss_resource,
 399};
 400
 401static void __init setup_resources(void)
 402{
 403	struct resource *res, *std_res, *sub_res;
 404	int i, j;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 405
 406	code_resource.start = (unsigned long) &_text;
 407	code_resource.end = (unsigned long) &_etext - 1;
 408	data_resource.start = (unsigned long) &_etext;
 409	data_resource.end = (unsigned long) &_edata - 1;
 410	bss_resource.start = (unsigned long) &__bss_start;
 411	bss_resource.end = (unsigned long) &__bss_stop - 1;
 412
 413	for (i = 0; i < MEMORY_CHUNKS; i++) {
 414		if (!memory_chunk[i].size)
 415			continue;
 416		res = alloc_bootmem_low(sizeof(*res));
 417		res->flags = IORESOURCE_BUSY | IORESOURCE_MEM;
 418		switch (memory_chunk[i].type) {
 419		case CHUNK_READ_WRITE:
 420			res->name = "System RAM";
 421			break;
 422		case CHUNK_READ_ONLY:
 423			res->name = "System ROM";
 424			res->flags |= IORESOURCE_READONLY;
 425			break;
 426		default:
 427			res->name = "reserved";
 428		}
 429		res->start = memory_chunk[i].addr;
 430		res->end = res->start + memory_chunk[i].size - 1;
 431		request_resource(&iomem_resource, res);
 432
 433		for (j = 0; j < ARRAY_SIZE(standard_resources); j++) {
 434			std_res = standard_resources[j];
 435			if (std_res->start < res->start ||
 436			    std_res->start > res->end)
 437				continue;
 438			if (std_res->end > res->end) {
 439				sub_res = alloc_bootmem_low(sizeof(*sub_res));
 
 
 
 440				*sub_res = *std_res;
 441				sub_res->end = res->end;
 442				std_res->start = res->end + 1;
 443				request_resource(res, sub_res);
 444			} else {
 445				request_resource(res, std_res);
 446			}
 447		}
 448	}
 449}
 450
 451static void __init setup_memory_end(void)
 452{
 453	unsigned long vmax, vmalloc_size, tmp;
 454	unsigned long real_memory_size = 0;
 455	int i;
 456
 457
 458#ifdef CONFIG_ZFCPDUMP
 459	if (ipl_info.type == IPL_TYPE_FCP_DUMP &&
 460	    !OLDMEM_BASE && sclp_get_hsa_size()) {
 461		memory_end = sclp_get_hsa_size();
 462		memory_end_set = 1;
 463	}
 464#endif
 465	memory_end &= PAGE_MASK;
 466
 467	/*
 468	 * Make sure all chunks are MAX_ORDER aligned so we don't need the
 469	 * extra checks that HOLES_IN_ZONE would require.
 
 
 
 470	 */
 471	for (i = 0; i < MEMORY_CHUNKS; i++) {
 472		unsigned long start, end;
 473		struct mem_chunk *chunk;
 474		unsigned long align;
 475
 476		chunk = &memory_chunk[i];
 477		if (!chunk->size)
 478			continue;
 479		align = 1UL << (MAX_ORDER + PAGE_SHIFT - 1);
 480		start = (chunk->addr + align - 1) & ~(align - 1);
 481		end = (chunk->addr + chunk->size) & ~(align - 1);
 482		if (start >= end)
 483			memset(chunk, 0, sizeof(*chunk));
 484		else {
 485			chunk->addr = start;
 486			chunk->size = end - start;
 487		}
 488		real_memory_size = max(real_memory_size,
 489				       chunk->addr + chunk->size);
 490	}
 491
 492	/* Choose kernel address space layout: 2, 3, or 4 levels. */
 493#ifdef CONFIG_64BIT
 494	vmalloc_size = VMALLOC_END ?: (128UL << 30) - MODULES_LEN;
 495	tmp = (memory_end ?: real_memory_size) / PAGE_SIZE;
 496	tmp = tmp * (sizeof(struct page) + PAGE_SIZE) + vmalloc_size;
 497	if (tmp <= (1UL << 42))
 498		vmax = 1UL << 42;	/* 3-level kernel page table */
 499	else
 500		vmax = 1UL << 53;	/* 4-level kernel page table */
 501	/* module area is at the end of the kernel address space. */
 502	MODULES_END = vmax;
 503	MODULES_VADDR = MODULES_END - MODULES_LEN;
 504	VMALLOC_END = MODULES_VADDR;
 505#else
 506	vmalloc_size = VMALLOC_END ?: 96UL << 20;
 507	vmax = 1UL << 31;		/* 2-level kernel page table */
 508	/* vmalloc area is at the end of the kernel address space. */
 509	VMALLOC_END = vmax;
 510#endif
 511	VMALLOC_START = vmax - vmalloc_size;
 512
 513	/* Split remaining virtual space between 1:1 mapping & vmemmap array */
 514	tmp = VMALLOC_START / (PAGE_SIZE + sizeof(struct page));
 515	/* vmemmap contains a multiple of PAGES_PER_SECTION struct pages */
 516	tmp = SECTION_ALIGN_UP(tmp);
 517	tmp = VMALLOC_START - tmp * sizeof(struct page);
 518	tmp &= ~((vmax >> 11) - 1);	/* align to page table level */
 519	tmp = min(tmp, 1UL << MAX_PHYSMEM_BITS);
 520	vmemmap = (struct page *) tmp;
 521
 522	/* Take care that memory_end is set and <= vmemmap */
 523	memory_end = min(memory_end ?: real_memory_size, tmp);
 524
 525	/* Fixup memory chunk array to fit into 0..memory_end */
 526	for (i = 0; i < MEMORY_CHUNKS; i++) {
 527		struct mem_chunk *chunk = &memory_chunk[i];
 528
 529		if (!chunk->size)
 530			continue;
 531		if (chunk->addr >= memory_end) {
 532			memset(chunk, 0, sizeof(*chunk));
 533			continue;
 534		}
 535		if (chunk->addr + chunk->size > memory_end)
 536			chunk->size = memory_end - chunk->addr;
 537	}
 538}
 539
 540static void __init setup_vmcoreinfo(void)
 541{
 542	mem_assign_absolute(S390_lowcore.vmcore_info, paddr_vmcoreinfo_note());
 
 
 543}
 544
 545#ifdef CONFIG_CRASH_DUMP
 546
 547/*
 548 * Find suitable location for crashkernel memory
 549 */
 550static unsigned long __init find_crash_base(unsigned long crash_size,
 551					    char **msg)
 552{
 553	unsigned long crash_base;
 554	struct mem_chunk *chunk;
 555	int i;
 556
 557	if (memory_chunk[0].size < crash_size) {
 558		*msg = "first memory chunk must be at least crashkernel size";
 559		return 0;
 560	}
 561	if (OLDMEM_BASE && crash_size == OLDMEM_SIZE)
 562		return OLDMEM_BASE;
 563
 564	for (i = MEMORY_CHUNKS - 1; i >= 0; i--) {
 565		chunk = &memory_chunk[i];
 566		if (chunk->size == 0)
 567			continue;
 568		if (chunk->type != CHUNK_READ_WRITE)
 569			continue;
 570		if (chunk->size < crash_size)
 571			continue;
 572		crash_base = (chunk->addr + chunk->size) - crash_size;
 573		if (crash_base < crash_size)
 574			continue;
 575		if (crash_base < sclp_get_hsa_size())
 576			continue;
 577		if (crash_base < (unsigned long) INITRD_START + INITRD_SIZE)
 578			continue;
 579		return crash_base;
 580	}
 581	*msg = "no suitable area found";
 582	return 0;
 583}
 584
 585/*
 586 * Check if crash_base and crash_size is valid
 587 */
 588static int __init verify_crash_base(unsigned long crash_base,
 589				    unsigned long crash_size,
 590				    char **msg)
 591{
 592	struct mem_chunk *chunk;
 593	int i;
 594
 595	/*
 596	 * Because we do the swap to zero, we must have at least 'crash_size'
 597	 * bytes free space before crash_base
 598	 */
 599	if (crash_size > crash_base) {
 600		*msg = "crashkernel offset must be greater than size";
 601		return -EINVAL;
 602	}
 603
 604	/* First memory chunk must be at least crash_size */
 605	if (memory_chunk[0].size < crash_size) {
 606		*msg = "first memory chunk must be at least crashkernel size";
 607		return -EINVAL;
 608	}
 609	/* Check if we fit into the respective memory chunk */
 610	for (i = 0; i < MEMORY_CHUNKS; i++) {
 611		chunk = &memory_chunk[i];
 612		if (chunk->size == 0)
 613			continue;
 614		if (crash_base < chunk->addr)
 615			continue;
 616		if (crash_base >= chunk->addr + chunk->size)
 617			continue;
 618		/* we have found the memory chunk */
 619		if (crash_base + crash_size > chunk->addr + chunk->size) {
 620			*msg = "selected memory chunk is too small for "
 621				"crashkernel memory";
 622			return -EINVAL;
 623		}
 624		return 0;
 625	}
 626	*msg = "invalid memory range specified";
 627	return -EINVAL;
 628}
 629
 630/*
 631 * When kdump is enabled, we have to ensure that no memory from
 632 * the area [0 - crashkernel memory size] and
 633 * [crashk_res.start - crashk_res.end] is set offline.
 634 */
 635static int kdump_mem_notifier(struct notifier_block *nb,
 636			      unsigned long action, void *data)
 637{
 638	struct memory_notify *arg = data;
 639
 
 
 640	if (arg->start_pfn < PFN_DOWN(resource_size(&crashk_res)))
 641		return NOTIFY_BAD;
 642	if (arg->start_pfn > PFN_DOWN(crashk_res.end))
 643		return NOTIFY_OK;
 644	if (arg->start_pfn + arg->nr_pages - 1 < PFN_DOWN(crashk_res.start))
 645		return NOTIFY_OK;
 646	return NOTIFY_BAD;
 647}
 648
 649static struct notifier_block kdump_mem_nb = {
 650	.notifier_call = kdump_mem_notifier,
 651};
 652
 653#endif
 654
 655/*
 656 * Make sure that oldmem, where the dump is stored, is protected
 657 */
 658static void reserve_oldmem(void)
 659{
 660#ifdef CONFIG_CRASH_DUMP
 661	unsigned long real_size = 0;
 662	int i;
 663
 664	if (!OLDMEM_BASE)
 665		return;
 666	for (i = 0; i < MEMORY_CHUNKS; i++) {
 667		struct mem_chunk *chunk = &memory_chunk[i];
 668
 669		real_size = max(real_size, chunk->addr + chunk->size);
 670	}
 671	create_mem_hole(memory_chunk, OLDMEM_BASE, OLDMEM_SIZE);
 672	create_mem_hole(memory_chunk, OLDMEM_SIZE, real_size - OLDMEM_SIZE);
 673#endif
 674}
 675
 676/*
 677 * Reserve memory for kdump kernel to be loaded with kexec
 678 */
 679static void __init reserve_crashkernel(void)
 680{
 681#ifdef CONFIG_CRASH_DUMP
 682	unsigned long long crash_base, crash_size;
 683	char *msg = NULL;
 684	int rc;
 685
 686	rc = parse_crashkernel(boot_command_line, memory_end, &crash_size,
 687			       &crash_base);
 
 
 
 688	if (rc || crash_size == 0)
 689		return;
 690	crash_base = ALIGN(crash_base, KEXEC_CRASH_MEM_ALIGN);
 691	crash_size = ALIGN(crash_size, KEXEC_CRASH_MEM_ALIGN);
 692	if (register_memory_notifier(&kdump_mem_nb))
 
 693		return;
 694	if (!crash_base)
 695		crash_base = find_crash_base(crash_size, &msg);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 696	if (!crash_base) {
 697		pr_info("crashkernel reservation failed: %s\n", msg);
 698		unregister_memory_notifier(&kdump_mem_nb);
 699		return;
 700	}
 701	if (verify_crash_base(crash_base, crash_size, &msg)) {
 702		pr_info("crashkernel reservation failed: %s\n", msg);
 703		unregister_memory_notifier(&kdump_mem_nb);
 704		return;
 705	}
 706	if (!OLDMEM_BASE && MACHINE_IS_VM)
 
 707		diag10_range(PFN_DOWN(crash_base), PFN_DOWN(crash_size));
 708	crashk_res.start = crash_base;
 709	crashk_res.end = crash_base + crash_size - 1;
 710	insert_resource(&iomem_resource, &crashk_res);
 711	create_mem_hole(memory_chunk, crash_base, crash_size);
 712	pr_info("Reserving %lluMB of memory at %lluMB "
 713		"for crashkernel (System RAM: %luMB)\n",
 714		crash_size >> 20, crash_base >> 20, memory_end >> 20);
 
 715	os_info_crashkernel_add(crash_base, crash_size);
 716#endif
 717}
 718
 719static void __init setup_memory(void)
 
 
 
 720{
 721        unsigned long bootmap_size;
 722	unsigned long start_pfn, end_pfn;
 723	int i;
 
 
 
 
 
 724
 725	/*
 726	 * partially used pages are not usable - thus
 727	 * we are rounding upwards:
 728	 */
 729	start_pfn = PFN_UP(__pa(&_end));
 730	end_pfn = max_pfn = PFN_DOWN(memory_end);
 
 
 731
 732#ifdef CONFIG_BLK_DEV_INITRD
 733	/*
 734	 * Move the initrd in case the bitmap of the bootmem allocater
 735	 * would overwrite it.
 736	 */
 737
 738	if (INITRD_START && INITRD_SIZE) {
 739		unsigned long bmap_size;
 740		unsigned long start;
 
 741
 742		bmap_size = bootmem_bootmap_pages(end_pfn - start_pfn + 1);
 743		bmap_size = PFN_PHYS(bmap_size);
 
 744
 745		if (PFN_PHYS(start_pfn) + bmap_size > INITRD_START) {
 746			start = PFN_PHYS(start_pfn) + bmap_size + PAGE_SIZE;
 
 
 747
 748#ifdef CONFIG_CRASH_DUMP
 749			if (OLDMEM_BASE) {
 750				/* Move initrd behind kdump oldmem */
 751				if (start + INITRD_SIZE > OLDMEM_BASE &&
 752				    start < OLDMEM_BASE + OLDMEM_SIZE)
 753					start = OLDMEM_BASE + OLDMEM_SIZE;
 754			}
 755#endif
 756			if (start + INITRD_SIZE > memory_end) {
 757				pr_err("initrd extends beyond end of "
 758				       "memory (0x%08lx > 0x%08lx) "
 759				       "disabling initrd\n",
 760				       start + INITRD_SIZE, memory_end);
 761				INITRD_START = INITRD_SIZE = 0;
 762			} else {
 763				pr_info("Moving initrd (0x%08lx -> "
 764					"0x%08lx, size: %ld)\n",
 765					INITRD_START, start, INITRD_SIZE);
 766				memmove((void *) start, (void *) INITRD_START,
 767					INITRD_SIZE);
 768				INITRD_START = start;
 769			}
 770		}
 771	}
 772#endif
 
 773
 774	/*
 775	 * Initialize the boot-time allocator
 776	 */
 777	bootmap_size = init_bootmem(start_pfn, end_pfn);
 778
 779	/*
 780	 * Register RAM areas with the bootmem allocator.
 781	 */
 
 
 
 
 
 
 
 
 782
 783	for (i = 0; i < MEMORY_CHUNKS; i++) {
 784		unsigned long start_chunk, end_chunk, pfn;
 785
 786		if (!memory_chunk[i].size)
 787			continue;
 788		start_chunk = PFN_DOWN(memory_chunk[i].addr);
 789		end_chunk = start_chunk + PFN_DOWN(memory_chunk[i].size);
 790		end_chunk = min(end_chunk, end_pfn);
 791		if (start_chunk >= end_chunk)
 792			continue;
 793		memblock_add_node(PFN_PHYS(start_chunk),
 794				  PFN_PHYS(end_chunk - start_chunk), 0);
 795		pfn = max(start_chunk, start_pfn);
 796		storage_key_init_range(PFN_PHYS(pfn), PFN_PHYS(end_chunk));
 797	}
 
 
 798
 799	psw_set_key(PAGE_DEFAULT_KEY);
 
 
 
 
 
 
 
 
 
 
 
 800
 801	free_bootmem_with_active_regions(0, max_pfn);
 
 
 
 802
 803	/*
 804	 * Reserve memory used for lowcore/command line/kernel image.
 805	 */
 806	reserve_bootmem(0, (unsigned long)_ehead, BOOTMEM_DEFAULT);
 807	reserve_bootmem((unsigned long)_stext,
 808			PFN_PHYS(start_pfn) - (unsigned long)_stext,
 809			BOOTMEM_DEFAULT);
 810	/*
 811	 * Reserve the bootmem bitmap itself as well. We do this in two
 812	 * steps (first step was init_bootmem()) because this catches
 813	 * the (very unlikely) case of us accidentally initializing the
 814	 * bootmem allocator with an invalid RAM area.
 815	 */
 816	reserve_bootmem(start_pfn << PAGE_SHIFT, bootmap_size,
 817			BOOTMEM_DEFAULT);
 818
 819#ifdef CONFIG_CRASH_DUMP
 820	if (crashk_res.start)
 821		reserve_bootmem(crashk_res.start,
 822				crashk_res.end - crashk_res.start + 1,
 823				BOOTMEM_DEFAULT);
 824	if (is_kdump_kernel())
 825		reserve_bootmem(elfcorehdr_addr - OLDMEM_BASE,
 826				PAGE_ALIGN(elfcorehdr_size), BOOTMEM_DEFAULT);
 827#endif
 828#ifdef CONFIG_BLK_DEV_INITRD
 829	if (INITRD_START && INITRD_SIZE) {
 830		if (INITRD_START + INITRD_SIZE <= memory_end) {
 831			reserve_bootmem(INITRD_START, INITRD_SIZE,
 832					BOOTMEM_DEFAULT);
 833			initrd_start = INITRD_START;
 834			initrd_end = initrd_start + INITRD_SIZE;
 835		} else {
 836			pr_err("initrd extends beyond end of "
 837			       "memory (0x%08lx > 0x%08lx) "
 838			       "disabling initrd\n",
 839			       initrd_start + INITRD_SIZE, memory_end);
 840			initrd_start = initrd_end = 0;
 841		}
 842	}
 843#endif
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 844}
 845
 846/*
 847 * Setup hardware capabilities.
 848 */
 849static void __init setup_hwcaps(void)
 850{
 851	static const int stfl_bits[6] = { 0, 2, 7, 17, 19, 21 };
 852	struct cpuid cpu_id;
 853	int i;
 
 
 
 
 
 
 
 
 
 854
 855	/*
 856	 * The store facility list bits numbers as found in the principles
 857	 * of operation are numbered with bit 1UL<<31 as number 0 to
 858	 * bit 1UL<<0 as number 31.
 859	 *   Bit 0: instructions named N3, "backported" to esa-mode
 860	 *   Bit 2: z/Architecture mode is active
 861	 *   Bit 7: the store-facility-list-extended facility is installed
 862	 *   Bit 17: the message-security assist is installed
 863	 *   Bit 19: the long-displacement facility is installed
 864	 *   Bit 21: the extended-immediate facility is installed
 865	 *   Bit 22: extended-translation facility 3 is installed
 866	 *   Bit 30: extended-translation facility 3 enhancement facility
 867	 * These get translated to:
 868	 *   HWCAP_S390_ESAN3 bit 0, HWCAP_S390_ZARCH bit 1,
 869	 *   HWCAP_S390_STFLE bit 2, HWCAP_S390_MSA bit 3,
 870	 *   HWCAP_S390_LDISP bit 4, HWCAP_S390_EIMM bit 5 and
 871	 *   HWCAP_S390_ETF3EH bit 8 (22 && 30).
 872	 */
 873	for (i = 0; i < 6; i++)
 874		if (test_facility(stfl_bits[i]))
 875			elf_hwcap |= 1UL << i;
 876
 877	if (test_facility(22) && test_facility(30))
 878		elf_hwcap |= HWCAP_S390_ETF3EH;
 
 
 
 
 879
 880	/*
 881	 * Check for additional facilities with store-facility-list-extended.
 882	 * stfle stores doublewords (8 byte) with bit 1ULL<<63 as bit 0
 883	 * and 1ULL<<0 as bit 63. Bits 0-31 contain the same information
 884	 * as stored by stfl, bits 32-xxx contain additional facilities.
 885	 * How many facility words are stored depends on the number of
 886	 * doublewords passed to the instruction. The additional facilities
 887	 * are:
 888	 *   Bit 42: decimal floating point facility is installed
 889	 *   Bit 44: perform floating point operation facility is installed
 890	 * translated to:
 891	 *   HWCAP_S390_DFP bit 6 (42 && 44).
 892	 */
 893	if ((elf_hwcap & (1UL << 2)) && test_facility(42) && test_facility(44))
 894		elf_hwcap |= HWCAP_S390_DFP;
 895
 896	/*
 897	 * Huge page support HWCAP_S390_HPAGE is bit 7.
 898	 */
 899	if (MACHINE_HAS_HPAGE)
 900		elf_hwcap |= HWCAP_S390_HPAGE;
 901
 902#if defined(CONFIG_64BIT)
 903	/*
 904	 * 64-bit register support for 31-bit processes
 905	 * HWCAP_S390_HIGH_GPRS is bit 9.
 906	 */
 907	elf_hwcap |= HWCAP_S390_HIGH_GPRS;
 908
 909	/*
 910	 * Transactional execution support HWCAP_S390_TE is bit 10.
 911	 */
 912	if (test_facility(50) && test_facility(73))
 913		elf_hwcap |= HWCAP_S390_TE;
 914#endif
 
 915
 916	get_cpu_id(&cpu_id);
 917	switch (cpu_id.machine) {
 918	case 0x9672:
 919#if !defined(CONFIG_64BIT)
 920	default:	/* Use "g5" as default for 31 bit kernels. */
 921#endif
 922		strcpy(elf_platform, "g5");
 923		break;
 924	case 0x2064:
 925	case 0x2066:
 926#if defined(CONFIG_64BIT)
 927	default:	/* Use "z900" as default for 64 bit kernels. */
 928#endif
 929		strcpy(elf_platform, "z900");
 930		break;
 931	case 0x2084:
 932	case 0x2086:
 933		strcpy(elf_platform, "z990");
 934		break;
 935	case 0x2094:
 936	case 0x2096:
 937		strcpy(elf_platform, "z9-109");
 938		break;
 939	case 0x2097:
 940	case 0x2098:
 941		strcpy(elf_platform, "z10");
 942		break;
 943	case 0x2817:
 944	case 0x2818:
 945		strcpy(elf_platform, "z196");
 946		break;
 947	case 0x2827:
 948	case 0x2828:
 949		strcpy(elf_platform, "zEC12");
 950		break;
 951	}
 952}
 953
 954/*
 955 * Setup function called from init/main.c just after the banner
 956 * was printed.
 957 */
 958
 959void __init setup_arch(char **cmdline_p)
 960{
 961        /*
 962         * print what head.S has found out about the machine
 963         */
 964#ifndef CONFIG_64BIT
 965	if (MACHINE_IS_VM)
 966		pr_info("Linux is running as a z/VM "
 967			"guest operating system in 31-bit mode\n");
 968	else if (MACHINE_IS_LPAR)
 969		pr_info("Linux is running natively in 31-bit mode\n");
 970	if (MACHINE_HAS_IEEE)
 971		pr_info("The hardware system has IEEE compatible "
 972			"floating point units\n");
 973	else
 974		pr_info("The hardware system has no IEEE compatible "
 975			"floating point units\n");
 976#else /* CONFIG_64BIT */
 977	if (MACHINE_IS_VM)
 978		pr_info("Linux is running as a z/VM "
 979			"guest operating system in 64-bit mode\n");
 980	else if (MACHINE_IS_KVM)
 981		pr_info("Linux is running under KVM in 64-bit mode\n");
 982	else if (MACHINE_IS_LPAR)
 983		pr_info("Linux is running natively in 64-bit mode\n");
 984#endif /* CONFIG_64BIT */
 
 
 
 985
 986	/* Have one command line that is parsed and saved in /proc/cmdline */
 987	/* boot_command_line has been already set up in early.c */
 988	*cmdline_p = boot_command_line;
 989
 990        ROOT_DEV = Root_RAM0;
 991
 992	init_mm.start_code = PAGE_OFFSET;
 993	init_mm.end_code = (unsigned long) &_etext;
 994	init_mm.end_data = (unsigned long) &_edata;
 995	init_mm.brk = (unsigned long) &_end;
 996
 
 997	parse_early_param();
 998	detect_memory_layout(memory_chunk, memory_end);
 
 
 
 
 999	os_info_init();
1000	setup_ipl();
1001	reserve_oldmem();
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1002	setup_memory_end();
 
 
 
 
 
 
 
 
 
 
 
 
1003	reserve_crashkernel();
1004	setup_memory();
 
 
 
 
 
 
 
1005	setup_resources();
1006	setup_vmcoreinfo();
1007	setup_lowcore();
1008
1009	smp_fill_possible_mask();
 
1010        cpu_init();
1011	s390_init_cpu_topology();
 
 
1012
1013	/*
1014	 * Setup capabilities (ELF_HWCAP & ELF_PLATFORM).
1015	 */
1016	setup_hwcaps();
1017
1018	/*
1019	 * Create kernel page tables and switch to virtual addressing.
1020	 */
1021        paging_init();
 
 
 
 
 
 
 
 
 
1022
1023        /* Setup default console */
1024	conmode_default();
1025	set_preferred_console();
1026
1027	/* Setup zfcpdump support */
 
 
 
 
1028	setup_zfcpdump();
1029}
1030
1031#ifdef CONFIG_32BIT
1032static int no_removal_warning __initdata;
1033
1034static int __init parse_no_removal_warning(char *str)
1035{
1036	no_removal_warning = 1;
1037	return 0;
1038}
1039__setup("no_removal_warning", parse_no_removal_warning);
1040
1041static int __init removal_warning(void)
1042{
1043	if (no_removal_warning)
1044		return 0;
1045	printk(KERN_ALERT "\n\n");
1046	printk(KERN_CONT "Warning - you are using a 31 bit kernel!\n\n");
1047	printk(KERN_CONT "We plan to remove 31 bit kernel support from the kernel sources in March 2015.\n");
1048	printk(KERN_CONT "Currently we assume that nobody is using the 31 bit kernel on old 31 bit\n");
1049	printk(KERN_CONT "hardware anymore. If you think that the code should not be removed and also\n");
1050	printk(KERN_CONT "future versions of the Linux kernel should be able to run in 31 bit mode\n");
1051	printk(KERN_CONT "please let us know. Please write to:\n");
1052	printk(KERN_CONT "linux390@de.ibm.com (mail address) and/or\n");
1053	printk(KERN_CONT "linux-s390@vger.kernel.org (mailing list).\n\n");
1054	printk(KERN_CONT "Thank you!\n\n");
1055	printk(KERN_CONT "If this kernel runs on a 64 bit machine you may consider using a 64 bit kernel.\n");
1056	printk(KERN_CONT "This message can be disabled with the \"no_removal_warning\" kernel parameter.\n");
1057	schedule_timeout_uninterruptible(300 * HZ);
1058	return 0;
1059}
1060early_initcall(removal_warning);
1061#endif