Linux Audio

Check our new training course

Loading...
v6.13.7
   1// SPDX-License-Identifier: GPL-2.0
   2/*
   3 *  S390 version
   4 *    Copyright IBM Corp. 1999, 2012
   5 *    Author(s): Hartmut Penner (hp@de.ibm.com),
   6 *               Martin Schwidefsky (schwidefsky@de.ibm.com)
   7 *
   8 *  Derived from "arch/i386/kernel/setup.c"
   9 *    Copyright (C) 1995, Linus Torvalds
  10 */
  11
  12/*
  13 * This file handles the architecture-dependent parts of initialization
  14 */
  15
  16#define KMSG_COMPONENT "setup"
  17#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
  18
  19#include <linux/errno.h>
  20#include <linux/export.h>
  21#include <linux/sched.h>
  22#include <linux/sched/task.h>
  23#include <linux/cpu.h>
  24#include <linux/kernel.h>
  25#include <linux/memblock.h>
  26#include <linux/mm.h>
  27#include <linux/stddef.h>
  28#include <linux/unistd.h>
  29#include <linux/ptrace.h>
  30#include <linux/random.h>
  31#include <linux/user.h>
  32#include <linux/tty.h>
  33#include <linux/ioport.h>
  34#include <linux/delay.h>
  35#include <linux/init.h>
  36#include <linux/initrd.h>
  37#include <linux/root_dev.h>
  38#include <linux/console.h>
  39#include <linux/kernel_stat.h>
  40#include <linux/dma-map-ops.h>
  41#include <linux/device.h>
  42#include <linux/notifier.h>
  43#include <linux/pfn.h>
  44#include <linux/ctype.h>
  45#include <linux/reboot.h>
  46#include <linux/topology.h>
  47#include <linux/kexec.h>
  48#include <linux/crash_dump.h>
  49#include <linux/memory.h>
  50#include <linux/compat.h>
  51#include <linux/start_kernel.h>
  52#include <linux/hugetlb.h>
  53#include <linux/kmemleak.h>
  54
  55#include <asm/archrandom.h>
  56#include <asm/boot_data.h>
  57#include <asm/ipl.h>
  58#include <asm/facility.h>
  59#include <asm/smp.h>
  60#include <asm/mmu_context.h>
  61#include <asm/cpcmd.h>
  62#include <asm/abs_lowcore.h>
  63#include <asm/nmi.h>
  64#include <asm/irq.h>
  65#include <asm/page.h>
  66#include <asm/ptrace.h>
  67#include <asm/sections.h>
  68#include <asm/ebcdic.h>
  69#include <asm/diag.h>
  70#include <asm/os_info.h>
  71#include <asm/sclp.h>
  72#include <asm/stacktrace.h>
  73#include <asm/sysinfo.h>
  74#include <asm/numa.h>
  75#include <asm/alternative.h>
  76#include <asm/nospec-branch.h>
  77#include <asm/physmem_info.h>
  78#include <asm/maccess.h>
  79#include <asm/uv.h>
  80#include <asm/asm-offsets.h>
  81#include "entry.h"
  82
  83/*
  84 * Machine setup..
  85 */
/*
 * Currently selected console mode, 0 by default.
 * NOTE(review): presumably written by the SET_CONSOLE_* macros and tested
 * by the CONSOLE_IS_* macros - confirm against <asm/setup.h>.
 */
unsigned int console_mode = 0;
EXPORT_SYMBOL(console_mode);

/*
 * Console device number. Starts out as -1 (all bits set) and is replaced
 * by the "condev=" parameter or by the z/VM console query.
 */
unsigned int console_devno = -1;
EXPORT_SYMBOL(console_devno);

/*
 * Console subchannel. Starts out as -1 (all bits set); filled in from the
 * z/VM console query and reset to -1 when "condev=" is given.
 */
unsigned int console_irq = -1;
EXPORT_SYMBOL(console_irq);
  94
  95/*
  96 * Some code and data needs to stay below 2 GB, even when the kernel would be
  97 * relocated above 2 GB, because it has to use 31 bit addresses.
  98 * Such code and data is part of the .amode31 section.
  99 */
 100char __amode31_ref *__samode31 = _samode31;
 101char __amode31_ref *__eamode31 = _eamode31;
 102char __amode31_ref *__stext_amode31 = _stext_amode31;
 103char __amode31_ref *__etext_amode31 = _etext_amode31;
 104struct exception_table_entry __amode31_ref *__start_amode31_ex_table = _start_amode31_ex_table;
 105struct exception_table_entry __amode31_ref *__stop_amode31_ex_table = _stop_amode31_ex_table;
 106
 107/*
 108 * Control registers CR2, CR5 and CR15 are initialized with addresses
 109 * of tables that must be placed below 2G which is handled by the AMODE31
 110 * sections.
 111 * Because the AMODE31 sections are relocated below 2G at startup,
 112 * the content of control registers CR2, CR5 and CR15 must be updated
 113 * with new addresses after the relocation. The initial initialization of
 114 * control registers occurs in head64.S and then gets updated again after AMODE31
 115 * relocation. We must access the relevant AMODE31 tables indirectly via
 116 * pointers placed in the .amode31.refs linker section. Those pointers get
 117 * updated automatically during AMODE31 relocation and always contain a valid
 118 * address within AMODE31 sections.
 119 */
 120
 121static __amode31_data u32 __ctl_duct_amode31[16] __aligned(64);
 122
 123static __amode31_data u64 __ctl_aste_amode31[8] __aligned(64) = {
 124	[1] = 0xffffffffffffffff
 125};
 126
 127static __amode31_data u32 __ctl_duald_amode31[32] __aligned(128) = {
 128	0x80000000, 0, 0, 0,
 129	0x80000000, 0, 0, 0,
 130	0x80000000, 0, 0, 0,
 131	0x80000000, 0, 0, 0,
 132	0x80000000, 0, 0, 0,
 133	0x80000000, 0, 0, 0,
 134	0x80000000, 0, 0, 0,
 135	0x80000000, 0, 0, 0
 136};
 137
 138static __amode31_data u32 __ctl_linkage_stack_amode31[8] __aligned(64) = {
 139	0, 0, 0x89000000, 0,
 140	0, 0, 0x8a000000, 0
 141};
 142
 143static u64 __amode31_ref *__ctl_aste = __ctl_aste_amode31;
 144static u32 __amode31_ref *__ctl_duald = __ctl_duald_amode31;
 145static u32 __amode31_ref *__ctl_linkage_stack = __ctl_linkage_stack_amode31;
 146static u32 __amode31_ref *__ctl_duct = __ctl_duct_amode31;
 147
 148unsigned long __bootdata_preserved(max_mappable);
 149struct physmem_info __bootdata(physmem_info);
 150
 151struct vm_layout __bootdata_preserved(vm_layout);
 152EXPORT_SYMBOL(vm_layout);
 153int __bootdata_preserved(__kaslr_enabled);
 154unsigned int __bootdata_preserved(zlib_dfltcc_support);
 155EXPORT_SYMBOL(zlib_dfltcc_support);
 156u64 __bootdata_preserved(stfle_fac_list[16]);
 157EXPORT_SYMBOL(stfle_fac_list);
 158struct oldmem_data __bootdata_preserved(oldmem_data);
 159
 160unsigned long VMALLOC_START;
 161EXPORT_SYMBOL(VMALLOC_START);
 162
 163unsigned long VMALLOC_END;
 164EXPORT_SYMBOL(VMALLOC_END);
 165
 166struct page *vmemmap;
 167EXPORT_SYMBOL(vmemmap);
 168unsigned long vmemmap_size;
 169
 170unsigned long MODULES_VADDR;
 171unsigned long MODULES_END;
 172
 173/* An array with a pointer to the lowcore of every CPU. */
 174struct lowcore *lowcore_ptr[NR_CPUS];
 175EXPORT_SYMBOL(lowcore_ptr);
 176
 177DEFINE_STATIC_KEY_FALSE(cpu_has_bear);
 178
 179/*
 180 * The Write Back bit position in the physaddr is given by the SLPC PCI.
 181 * Leaving the mask zero always uses write through which is safe
 182 */
 183unsigned long mio_wb_bit_mask __ro_after_init;
 184
/*
 * This is set up by the setup routine at boot time.
 * On S390 we need to find out what we have to set up,
 * using address 0x10400 ...
 */
 190
 191#include <asm/setup.h>
 192
 193/*
 194 * condev= and conmode= setup parameter.
 195 */
 196
 197static int __init condev_setup(char *str)
 198{
 199	int vdev;
 200
 201	vdev = simple_strtoul(str, &str, 0);
 202	if (vdev >= 0 && vdev < 65536) {
 203		console_devno = vdev;
 204		console_irq = -1;
 205	}
 206	return 1;
 207}
 208
 209__setup("condev=", condev_setup);
 210
 211static void __init set_preferred_console(void)
 212{
 213	if (CONSOLE_IS_3215 || CONSOLE_IS_SCLP)
 214		add_preferred_console("ttyS", 0, NULL);
 215	else if (CONSOLE_IS_3270)
 216		add_preferred_console("tty3270", 0, NULL);
 217	else if (CONSOLE_IS_VT220)
 218		add_preferred_console("ttysclp", 0, NULL);
 219	else if (CONSOLE_IS_HVC)
 220		add_preferred_console("hvc", 0, NULL);
 221}
 222
 223static int __init conmode_setup(char *str)
 224{
 225#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 226	if (!strcmp(str, "hwc") || !strcmp(str, "sclp"))
 227                SET_CONSOLE_SCLP;
 228#endif
 229#if defined(CONFIG_TN3215_CONSOLE)
 230	if (!strcmp(str, "3215"))
 231		SET_CONSOLE_3215;
 232#endif
 233#if defined(CONFIG_TN3270_CONSOLE)
 234	if (!strcmp(str, "3270"))
 235		SET_CONSOLE_3270;
 236#endif
 237	set_preferred_console();
 238        return 1;
 239}
 240
 241__setup("conmode=", conmode_setup);
 242
 243static void __init conmode_default(void)
 244{
 245	char query_buffer[1024];
 246	char *ptr;
 247
 248        if (MACHINE_IS_VM) {
 249		cpcmd("QUERY CONSOLE", query_buffer, 1024, NULL);
 250		console_devno = simple_strtoul(query_buffer + 5, NULL, 16);
 251		ptr = strstr(query_buffer, "SUBCHANNEL =");
 252		console_irq = simple_strtoul(ptr + 13, NULL, 16);
 253		cpcmd("QUERY TERM", query_buffer, 1024, NULL);
 254		ptr = strstr(query_buffer, "CONMODE");
 255		/*
 256		 * Set the conmode to 3215 so that the device recognition 
 257		 * will set the cu_type of the console to 3215. If the
 258		 * conmode is 3270 and we don't set it back then both
 259		 * 3215 and the 3270 driver will try to access the console
 260		 * device (3215 as console and 3270 as normal tty).
 261		 */
 262		cpcmd("TERM CONMODE 3215", NULL, 0, NULL);
 263		if (ptr == NULL) {
 264#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 265			SET_CONSOLE_SCLP;
 266#endif
 267			return;
 268		}
 269		if (str_has_prefix(ptr + 8, "3270")) {
 270#if defined(CONFIG_TN3270_CONSOLE)
 271			SET_CONSOLE_3270;
 272#elif defined(CONFIG_TN3215_CONSOLE)
 273			SET_CONSOLE_3215;
 274#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 275			SET_CONSOLE_SCLP;
 276#endif
 277		} else if (str_has_prefix(ptr + 8, "3215")) {
 278#if defined(CONFIG_TN3215_CONSOLE)
 279			SET_CONSOLE_3215;
 280#elif defined(CONFIG_TN3270_CONSOLE)
 281			SET_CONSOLE_3270;
 282#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 283			SET_CONSOLE_SCLP;
 284#endif
 285		}
 286	} else if (MACHINE_IS_KVM) {
 287		if (sclp.has_vt220 && IS_ENABLED(CONFIG_SCLP_VT220_CONSOLE))
 288			SET_CONSOLE_VT220;
 289		else if (sclp.has_linemode && IS_ENABLED(CONFIG_SCLP_CONSOLE))
 290			SET_CONSOLE_SCLP;
 291		else
 292			SET_CONSOLE_HVC;
 293	} else {
 294#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 295		SET_CONSOLE_SCLP;
 296#endif
 297	}
 
 
 298}
 299
 300#ifdef CONFIG_CRASH_DUMP
 301static void __init setup_zfcpdump(void)
 302{
 303	if (!is_ipl_type_dump())
 304		return;
 305	if (oldmem_data.start)
 306		return;
 307	strlcat(boot_command_line, " cio_ignore=all,!ipldev,!condev", COMMAND_LINE_SIZE);
 308	console_loglevel = 2;
 309}
 310#else
 311static inline void setup_zfcpdump(void) {}
 312#endif /* CONFIG_CRASH_DUMP */
 313
 314 /*
 315 * Reboot, halt and power_off stubs. They just call _machine_restart,
 316 * _machine_halt or _machine_power_off. 
 317 */
 318
 319void machine_restart(char *command)
 320{
 321	if ((!in_interrupt() && !in_atomic()) || oops_in_progress)
 322		/*
 323		 * Only unblank the console if we are called in enabled
 324		 * context or a bust_spinlocks cleared the way for us.
 325		 */
 326		console_unblank();
 327	_machine_restart(command);
 328}
 329
 330void machine_halt(void)
 331{
 332	if (!in_interrupt() || oops_in_progress)
 333		/*
 334		 * Only unblank the console if we are called in enabled
 335		 * context or a bust_spinlocks cleared the way for us.
 336		 */
 337		console_unblank();
 338	_machine_halt();
 339}
 340
 341void machine_power_off(void)
 342{
 343	if (!in_interrupt() || oops_in_progress)
 344		/*
 345		 * Only unblank the console if we are called in enabled
 346		 * context or a bust_spinlocks cleared the way for us.
 347		 */
 348		console_unblank();
 349	_machine_power_off();
 350}
 351
/*
 * Power-off hook. It is a function pointer that defaults to
 * machine_power_off() and is exported to GPL modules.
 */
void (*pm_power_off)(void) = machine_power_off;
EXPORT_SYMBOL_GPL(pm_power_off);

/*
 * Initial stack pointer of the global restart stack; assigned once in
 * setup_lowcore().
 */
void *restart_stack;
 359
 360unsigned long stack_alloc(void)
 361{
 362#ifdef CONFIG_VMAP_STACK
 363	void *ret;
 364
 365	ret = __vmalloc_node(THREAD_SIZE, THREAD_SIZE, THREADINFO_GFP,
 366			     NUMA_NO_NODE, __builtin_return_address(0));
 367	kmemleak_not_leak(ret);
 368	return (unsigned long)ret;
 369#else
 370	return __get_free_pages(GFP_KERNEL, THREAD_SIZE_ORDER);
 371#endif
 372}
 373
 374void stack_free(unsigned long stack)
 375{
 376#ifdef CONFIG_VMAP_STACK
 377	vfree((void *) stack);
 378#else
 379	free_pages(stack, THREAD_SIZE_ORDER);
 380#endif
 381}
 382
 383static unsigned long __init stack_alloc_early(void)
 384{
 385	unsigned long stack;
 386
 387	stack = (unsigned long)memblock_alloc(THREAD_SIZE, THREAD_SIZE);
 388	if (!stack) {
 389		panic("%s: Failed to allocate %lu bytes align=0x%lx\n",
 390		      __func__, THREAD_SIZE, THREAD_SIZE);
 391	}
 392	return stack;
 393}
 394
 395static void __init setup_lowcore(void)
 396{
 397	struct lowcore *lc, *abs_lc;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 398
 399	/*
 400	 * Setup lowcore for boot cpu
 401	 */
 402	BUILD_BUG_ON(sizeof(struct lowcore) != LC_PAGES * PAGE_SIZE);
 403	lc = memblock_alloc_low(sizeof(*lc), sizeof(*lc));
 404	if (!lc)
 405		panic("%s: Failed to allocate %zu bytes align=%zx\n",
 406		      __func__, sizeof(*lc), sizeof(*lc));
 407
 408	lc->pcpu = (unsigned long)per_cpu_ptr(&pcpu_devices, 0);
 409	lc->restart_psw.mask = PSW_KERNEL_BITS & ~PSW_MASK_DAT;
 410	lc->restart_psw.addr = __pa(restart_int_handler);
 411	lc->external_new_psw.mask = PSW_KERNEL_BITS;
 412	lc->external_new_psw.addr = (unsigned long) ext_int_handler;
 413	lc->svc_new_psw.mask = PSW_KERNEL_BITS;
 
 414	lc->svc_new_psw.addr = (unsigned long) system_call;
 415	lc->program_new_psw.mask = PSW_KERNEL_BITS;
 416	lc->program_new_psw.addr = (unsigned long) pgm_check_handler;
 417	lc->mcck_new_psw.mask = PSW_KERNEL_BITS;
 418	lc->mcck_new_psw.addr = (unsigned long) mcck_int_handler;
 419	lc->io_new_psw.mask = PSW_KERNEL_BITS;
 420	lc->io_new_psw.addr = (unsigned long) io_int_handler;
 421	lc->clock_comparator = clock_comparator_max;
 
 
 422	lc->current_task = (unsigned long)&init_task;
 423	lc->lpp = LPP_MAGIC;
 424	lc->machine_flags = get_lowcore()->machine_flags;
 425	lc->preempt_count = get_lowcore()->preempt_count;
 426	nmi_alloc_mcesa_early(&lc->mcesad);
 427	lc->sys_enter_timer = get_lowcore()->sys_enter_timer;
 428	lc->exit_timer = get_lowcore()->exit_timer;
 429	lc->user_timer = get_lowcore()->user_timer;
 430	lc->system_timer = get_lowcore()->system_timer;
 431	lc->steal_timer = get_lowcore()->steal_timer;
 432	lc->last_update_timer = get_lowcore()->last_update_timer;
 433	lc->last_update_clock = get_lowcore()->last_update_clock;
 
 
 
 
 
 
 
 
 434	/*
 435	 * Allocate the global restart stack which is the same for
 436	 * all CPUs in case *one* of them does a PSW restart.
 437	 */
 438	restart_stack = (void *)(stack_alloc_early() + STACK_INIT_OFFSET);
 439	lc->mcck_stack = stack_alloc_early() + STACK_INIT_OFFSET;
 440	lc->async_stack = stack_alloc_early() + STACK_INIT_OFFSET;
 441	lc->nodat_stack = stack_alloc_early() + STACK_INIT_OFFSET;
 442	lc->kernel_stack = get_lowcore()->kernel_stack;
 
 443	/*
 444	 * Set up PSW restart to call ipl.c:do_restart(). Copy the relevant
 445	 * restart data to the absolute zero lowcore. This is necessary if
 446	 * PSW restart is done on an offline CPU that has lowcore zero.
 447	 */
 448	lc->restart_stack = (unsigned long) restart_stack;
 449	lc->restart_fn = (unsigned long) do_restart;
 450	lc->restart_data = 0;
 451	lc->restart_source = -1U;
 
 
 
 
 
 
 
 
 452	lc->spinlock_lockval = arch_spin_lockval(0);
 453	lc->spinlock_index = 0;
 454	arch_spin_lock_setup(0);
 455	lc->return_lpswe = gen_lpswe(__LC_RETURN_PSW);
 456	lc->return_mcck_lpswe = gen_lpswe(__LC_RETURN_MCCK_PSW);
 457	lc->preempt_count = PREEMPT_DISABLED;
 458	lc->kernel_asce = get_lowcore()->kernel_asce;
 459	lc->user_asce = get_lowcore()->user_asce;
 460
 461	system_ctlreg_init_save_area(lc);
 462	abs_lc = get_abs_lowcore();
 463	abs_lc->restart_stack = lc->restart_stack;
 464	abs_lc->restart_fn = lc->restart_fn;
 465	abs_lc->restart_data = lc->restart_data;
 466	abs_lc->restart_source = lc->restart_source;
 467	abs_lc->restart_psw = lc->restart_psw;
 468	abs_lc->restart_flags = RESTART_FLAG_CTLREGS;
 469	abs_lc->program_new_psw = lc->program_new_psw;
 470	abs_lc->mcesad = lc->mcesad;
 471	put_abs_lowcore(abs_lc);
 472
 473	set_prefix(__pa(lc));
 474	lowcore_ptr[0] = lc;
 475	if (abs_lowcore_map(0, lowcore_ptr[0], false))
 476		panic("Couldn't setup absolute lowcore");
 
 
 
 
 
 
 
 
 477}
 478
/*
 * Resources describing the kernel image. Their start/end addresses are
 * filled in by setup_resources().
 */
static struct resource code_resource = {
	.name  = "Kernel code",
	.flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
};

static struct resource data_resource = {
	.name = "Kernel data",
	.flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
};

static struct resource bss_resource = {
	.name = "Kernel bss",
	.flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
};

/* Kernel image resources that setup_resources() nests below "System RAM" */
static struct resource __initdata *standard_resources[] = {
	&code_resource,
	&data_resource,
	&bss_resource,
};
 499
 500static void __init setup_resources(void)
 501{
 502	struct resource *res, *std_res, *sub_res;
 503	phys_addr_t start, end;
 504	int j;
 505	u64 i;
 506
 507	code_resource.start = __pa_symbol(_text);
 508	code_resource.end = __pa_symbol(_etext) - 1;
 509	data_resource.start = __pa_symbol(_etext);
 510	data_resource.end = __pa_symbol(_edata) - 1;
 511	bss_resource.start = __pa_symbol(__bss_start);
 512	bss_resource.end = __pa_symbol(__bss_stop) - 1;
 513
 514	for_each_mem_range(i, &start, &end) {
 515		res = memblock_alloc(sizeof(*res), 8);
 516		if (!res)
 517			panic("%s: Failed to allocate %zu bytes align=0x%x\n",
 518			      __func__, sizeof(*res), 8);
 519		res->flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM;
 520
 521		res->name = "System RAM";
 522		res->start = start;
 523		/*
 524		 * In memblock, end points to the first byte after the
 525		 * range while in resources, end points to the last byte in
 526		 * the range.
 527		 */
 528		res->end = end - 1;
 529		request_resource(&iomem_resource, res);
 530
 531		for (j = 0; j < ARRAY_SIZE(standard_resources); j++) {
 532			std_res = standard_resources[j];
 533			if (std_res->start < res->start ||
 534			    std_res->start > res->end)
 535				continue;
 536			if (std_res->end > res->end) {
 537				sub_res = memblock_alloc(sizeof(*sub_res), 8);
 538				if (!sub_res)
 539					panic("%s: Failed to allocate %zu bytes align=0x%x\n",
 540					      __func__, sizeof(*sub_res), 8);
 541				*sub_res = *std_res;
 542				sub_res->end = res->end;
 543				std_res->start = res->end + 1;
 544				request_resource(res, sub_res);
 545			} else {
 546				request_resource(res, std_res);
 547			}
 548		}
 549	}
 550#ifdef CONFIG_CRASH_DUMP
 551	/*
 552	 * Re-add removed crash kernel memory as reserved memory. This makes
 553	 * sure it will be mapped with the identity mapping and struct pages
 554	 * will be created, so it can be resized later on.
 555	 * However add it later since the crash kernel resource should not be
 556	 * part of the System RAM resource.
 557	 */
 558	if (crashk_res.end) {
 559		memblock_add_node(crashk_res.start, resource_size(&crashk_res),
 560				  0, MEMBLOCK_NONE);
 561		memblock_reserve(crashk_res.start, resource_size(&crashk_res));
 562		insert_resource(&iomem_resource, &crashk_res);
 563	}
 564#endif
 565}
 566
 567static void __init setup_memory_end(void)
 568{
 569	max_pfn = max_low_pfn = PFN_DOWN(ident_map_size);
 570	pr_notice("The maximum memory size is %luMB\n", ident_map_size >> 20);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 571}
 572
 573#ifdef CONFIG_CRASH_DUMP
 574
 575/*
 576 * When kdump is enabled, we have to ensure that no memory from the area
 577 * [0 - crashkernel memory size] is set offline - it will be exchanged with
 578 * the crashkernel memory region when kdump is triggered. The crashkernel
 579 * memory region can never get offlined (pages are unmovable).
 580 */
 581static int kdump_mem_notifier(struct notifier_block *nb,
 582			      unsigned long action, void *data)
 583{
 584	struct memory_notify *arg = data;
 585
 586	if (action != MEM_GOING_OFFLINE)
 587		return NOTIFY_OK;
 588	if (arg->start_pfn < PFN_DOWN(resource_size(&crashk_res)))
 589		return NOTIFY_BAD;
 590	return NOTIFY_OK;
 
 
 
 
 591}
 592
/* Memory notifier block; registered by reserve_crashkernel() */
static struct notifier_block kdump_mem_nb = {
	.notifier_call = kdump_mem_notifier,
};
 596
 597#endif
 598
 599/*
 600 * Reserve page tables created by decompressor
 601 */
 602static void __init reserve_pgtables(void)
 603{
 604	unsigned long start, end;
 605	struct reserved_range *range;
 
 
 
 
 
 
 
 
 
 
 
 
 
 606
 607	for_each_physmem_reserved_type_range(RR_VMEM, range, &start, &end)
 608		memblock_reserve(start, end - start);
 
 
 
 
 
 
 
 
 609}
 610
 611/*
 612 * Reserve memory for kdump kernel to be loaded with kexec
 613 */
 614static void __init reserve_crashkernel(void)
 615{
 616#ifdef CONFIG_CRASH_DUMP
 617	unsigned long long crash_base, crash_size;
 618	phys_addr_t low, high;
 619	int rc;
 620
 621	rc = parse_crashkernel(boot_command_line, ident_map_size,
 622			       &crash_size, &crash_base, NULL, NULL);
 623
 624	crash_base = ALIGN(crash_base, KEXEC_CRASH_MEM_ALIGN);
 625	crash_size = ALIGN(crash_size, KEXEC_CRASH_MEM_ALIGN);
 626	if (rc || crash_size == 0)
 627		return;
 628
 629	if (memblock.memory.regions[0].size < crash_size) {
 630		pr_info("crashkernel reservation failed: %s\n",
 631			"first memory chunk must be at least crashkernel size");
 632		return;
 633	}
 634
 635	low = crash_base ?: oldmem_data.start;
 636	high = low + crash_size;
 637	if (low >= oldmem_data.start && high <= oldmem_data.start + oldmem_data.size) {
 638		/* The crashkernel fits into OLDMEM, reuse OLDMEM */
 639		crash_base = low;
 640	} else {
 641		/* Find suitable area in free memory */
 642		low = max_t(unsigned long, crash_size, sclp.hsa_size);
 643		high = crash_base ? crash_base + crash_size : ULONG_MAX;
 644
 645		if (crash_base && crash_base < low) {
 646			pr_info("crashkernel reservation failed: %s\n",
 647				"crash_base too low");
 648			return;
 649		}
 650		low = crash_base ?: low;
 651		crash_base = memblock_phys_alloc_range(crash_size,
 652						       KEXEC_CRASH_MEM_ALIGN,
 653						       low, high);
 654	}
 655
 656	if (!crash_base) {
 657		pr_info("crashkernel reservation failed: %s\n",
 658			"no suitable area found");
 659		return;
 660	}
 661
 662	if (register_memory_notifier(&kdump_mem_nb)) {
 663		memblock_phys_free(crash_base, crash_size);
 664		return;
 665	}
 666
 667	if (!oldmem_data.start && MACHINE_IS_VM)
 668		diag10_range(PFN_DOWN(crash_base), PFN_DOWN(crash_size));
 669	crashk_res.start = crash_base;
 670	crashk_res.end = crash_base + crash_size - 1;
 671	memblock_remove(crash_base, crash_size);
 672	pr_info("Reserving %lluMB of memory at %lluMB "
 673		"for crashkernel (System RAM: %luMB)\n",
 674		crash_size >> 20, crash_base >> 20,
 675		(unsigned long)memblock.memory.total_size >> 20);
 676	os_info_crashkernel_add(crash_base, crash_size);
 677#endif
 678}
 679
 680/*
 681 * Reserve the initrd from being used by memblock
 682 */
 683static void __init reserve_initrd(void)
 684{
 685	unsigned long addr, size;
 686
 687	if (!IS_ENABLED(CONFIG_BLK_DEV_INITRD) || !get_physmem_reserved(RR_INITRD, &addr, &size))
 688		return;
 689	initrd_start = (unsigned long)__va(addr);
 690	initrd_end = initrd_start + size;
 691	memblock_reserve(addr, size);
 
 692}
 693
 694/*
 695 * Reserve the memory area used to pass the certificate lists
 696 */
 697static void __init reserve_certificate_list(void)
 698{
 699	if (ipl_cert_list_addr)
 700		memblock_reserve(ipl_cert_list_addr, ipl_cert_list_size);
 701}
 702
 703static void __init reserve_physmem_info(void)
 704{
 705	unsigned long addr, size;
 706
 707	if (get_physmem_reserved(RR_MEM_DETECT_EXTENDED, &addr, &size))
 708		memblock_reserve(addr, size);
 
 709}
 710
 711static void __init free_physmem_info(void)
 712{
 713	unsigned long addr, size;
 714
 715	if (get_physmem_reserved(RR_MEM_DETECT_EXTENDED, &addr, &size))
 716		memblock_phys_free(addr, size);
 
 717}
 718
 719static void __init memblock_add_physmem_info(void)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 720{
 721	unsigned long start, end;
 722	int i;
 723
 724	pr_debug("physmem info source: %s (%hhd)\n",
 725		 get_physmem_info_source(), physmem_info.info_source);
 726	/* keep memblock lists close to the kernel */
 727	memblock_set_bottom_up(true);
 728	for_each_physmem_usable_range(i, &start, &end)
 729		memblock_add(start, end - start);
 730	for_each_physmem_online_range(i, &start, &end)
 731		memblock_physmem_add(start, end - start);
 732	memblock_set_bottom_up(false);
 733	memblock_set_node(0, ULONG_MAX, &memblock.memory, 0);
 734}
 735
 736/*
 737 * Reserve memory used for lowcore.
 738 */
 739static void __init reserve_lowcore(void)
 740{
 741	void *lowcore_start = get_lowcore();
 742	void *lowcore_end = lowcore_start + sizeof(struct lowcore);
 743	void *start, *end;
 744
 745	if ((void *)__identity_base < lowcore_end) {
 746		start = max(lowcore_start, (void *)__identity_base);
 747		end = min(lowcore_end, (void *)(__identity_base + ident_map_size));
 748		memblock_reserve(__pa(start), __pa(end));
 749	}
 
 750}
 751
 752/*
 753 * Reserve memory used for absolute lowcore/command line/kernel image.
 754 */
 755static void __init reserve_kernel(void)
 756{
 757	memblock_reserve(0, STARTUP_NORMAL_OFFSET);
 758	memblock_reserve(OLDMEM_BASE, sizeof(unsigned long));
 759	memblock_reserve(OLDMEM_SIZE, sizeof(unsigned long));
 760	memblock_reserve(physmem_info.reserved[RR_AMODE31].start, __eamode31 - __samode31);
 761	memblock_reserve(__pa(sclp_early_sccb), EXT_SCCB_READ_SCP);
 762	memblock_reserve(__pa(_stext), _end - _stext);
 763}
 764
 765static void __init setup_memory(void)
 766{
 767	phys_addr_t start, end;
 768	u64 i;
 769
 770	/*
 771	 * Init storage key for present memory
 772	 */
 773	for_each_mem_range(i, &start, &end)
 774		storage_key_init_range(start, end);
 775
 776	psw_set_key(PAGE_DEFAULT_KEY);
 
 
 
 777}
 778
 779static void __init relocate_amode31_section(void)
 
 
 
 780{
 781	unsigned long amode31_size = __eamode31 - __samode31;
 782	long amode31_offset, *ptr;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 783
 784	amode31_offset = AMODE31_START - (unsigned long)__samode31;
 785	pr_info("Relocating AMODE31 section of size 0x%08lx\n", amode31_size);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 786
 787	/* Move original AMODE31 section to the new one */
 788	memmove((void *)physmem_info.reserved[RR_AMODE31].start, __samode31, amode31_size);
 789	/* Zero out the old AMODE31 section to catch invalid accesses within it */
 790	memset(__samode31, 0, amode31_size);
 791
 792	/* Update all AMODE31 region references */
 793	for (ptr = _start_amode31_refs; ptr != _end_amode31_refs; ptr++)
 794		*ptr += amode31_offset;
 795}
 796
 797/* This must be called after AMODE31 relocation */
 798static void __init setup_cr(void)
 799{
 800	union ctlreg2 cr2;
 801	union ctlreg5 cr5;
 802	union ctlreg15 cr15;
 803
 804	__ctl_duct[1] = (unsigned long)__ctl_aste;
 805	__ctl_duct[2] = (unsigned long)__ctl_aste;
 806	__ctl_duct[4] = (unsigned long)__ctl_duald;
 807
 808	/* Update control registers CR2, CR5 and CR15 */
 809	local_ctl_store(2, &cr2.reg);
 810	local_ctl_store(5, &cr5.reg);
 811	local_ctl_store(15, &cr15.reg);
 812	cr2.ducto = (unsigned long)__ctl_duct >> 6;
 813	cr5.pasteo = (unsigned long)__ctl_duct >> 6;
 814	cr15.lsea = (unsigned long)__ctl_linkage_stack >> 3;
 815	system_ctl_load(2, &cr2.reg);
 816	system_ctl_load(5, &cr5.reg);
 817	system_ctl_load(15, &cr15.reg);
 818}
 
 819
 820/*
 821 * Add system information as device randomness
 822 */
 823static void __init setup_randomness(void)
 824{
 825	struct sysinfo_3_2_2 *vmms;
 826
 827	vmms = memblock_alloc(PAGE_SIZE, PAGE_SIZE);
 
 828	if (!vmms)
 829		panic("Failed to allocate memory for sysinfo structure\n");
 
 830	if (stsi(vmms, 3, 2, 2) == 0 && vmms->count)
 831		add_device_randomness(&vmms->vm, sizeof(vmms->vm[0]) * vmms->count);
 832	memblock_free(vmms, PAGE_SIZE);
 
 
 
 
 
 
 
 
 
 
 833
 834	if (cpacf_query_func(CPACF_PRNO, CPACF_PRNO_TRNG))
 835		static_branch_enable(&s390_arch_random_available);
 
 
 
 836}
 837
 838/*
 839 * Issue diagnose 318 to set the control program name and
 840 * version codes.
 841 */
 842static void __init setup_control_program_code(void)
 843{
 844	union diag318_info diag318_info = {
 845		.cpnc = CPNC_LINUX,
 846		.cpvc = 0,
 
 847	};
 848
 849	if (!sclp.has_diag318)
 850		return;
 851
 852	diag_stat_inc(DIAG_STAT_X318);
 853	asm volatile("diag %0,0,0x318\n" : : "d" (diag318_info.val));
 854}
 855
 856/*
 857 * Print the component list from the IPL report
 858 */
 859static void __init log_component_list(void)
 860{
 861	struct ipl_rb_component_entry *ptr, *end;
 862	char *str;
 863
 864	if (!early_ipl_comp_list_addr)
 865		return;
 866	if (ipl_block.hdr.flags & IPL_PL_FLAG_SIPL)
 867		pr_info("Linux is running with Secure-IPL enabled\n");
 868	else
 869		pr_info("Linux is running with Secure-IPL disabled\n");
 870	ptr = __va(early_ipl_comp_list_addr);
 871	end = (void *) ptr + early_ipl_comp_list_size;
 872	pr_info("The IPL report contains the following components:\n");
 873	while (ptr < end) {
 874		if (ptr->flags & IPL_RB_COMPONENT_FLAG_SIGNED) {
 875			if (ptr->flags & IPL_RB_COMPONENT_FLAG_VERIFIED)
 876				str = "signed, verified";
 877			else
 878				str = "signed, verification failed";
 879		} else {
 880			str = "not signed";
 881		}
 882		pr_info("%016llx - %016llx (%s)\n",
 883			ptr->addr, ptr->addr + ptr->len, str);
 884		ptr++;
 885	}
 886}
 887
 888/*
 889 * Setup function called from init/main.c just after the banner
 890 * was printed.
 891 */
 892
 893void __init setup_arch(char **cmdline_p)
 894{
 895        /*
 896         * print what head.S has found out about the machine
 897         */
 898	if (MACHINE_IS_VM)
 899		pr_info("Linux is running as a z/VM "
 900			"guest operating system in 64-bit mode\n");
 901	else if (MACHINE_IS_KVM)
 902		pr_info("Linux is running under KVM in 64-bit mode\n");
 903	else if (MACHINE_IS_LPAR)
 904		pr_info("Linux is running natively in 64-bit mode\n");
 905	else
 906		pr_info("Linux is running as a guest in 64-bit mode\n");
 907
 908	if (have_relocated_lowcore())
 909		pr_info("Lowcore relocated to 0x%px\n", get_lowcore());
 910
 911	log_component_list();
 912
 913	/* Have one command line that is parsed and saved in /proc/cmdline */
 914	/* boot_command_line has been already set up in early.c */
 915	*cmdline_p = boot_command_line;
 916
 917        ROOT_DEV = Root_RAM0;
 918
 919	setup_initial_init_mm(_text, _etext, _edata, _end);
 
 
 
 920
 921	if (IS_ENABLED(CONFIG_EXPOLINE_AUTO))
 922		nospec_auto_detect();
 923
 924	jump_label_init();
 925	parse_early_param();
 926#ifdef CONFIG_CRASH_DUMP
 927	/* Deactivate elfcorehdr= kernel parameter */
 928	elfcorehdr_addr = ELFCORE_ADDR_MAX;
 929#endif
 930
 931	os_info_init();
 932	setup_ipl();
 
 933	setup_control_program_code();
 934
 935	/* Do some memory reservations *before* memory is added to memblock */
 936	reserve_pgtables();
 937	reserve_lowcore();
 938	reserve_kernel();
 939	reserve_initrd();
 940	reserve_certificate_list();
 941	reserve_physmem_info();
 942	memblock_set_current_limit(ident_map_size);
 943	memblock_allow_resize();
 944
 945	/* Get information about *all* installed memory */
 946	memblock_add_physmem_info();
 
 
 
 
 
 
 
 
 
 
 
 947
 948	free_physmem_info();
 949	setup_memory_end();
 950	memblock_dump_all();
 951	setup_memory();
 952
 953	relocate_amode31_section();
 954	setup_cr();
 955	setup_uv();
 956	dma_contiguous_reserve(ident_map_size);
 957	vmcp_cma_reserve();
 958	if (MACHINE_HAS_EDAT2)
 959		hugetlb_cma_reserve(PUD_SHIFT - PAGE_SHIFT);
 960
 
 961	reserve_crashkernel();
 962#ifdef CONFIG_CRASH_DUMP
 963	/*
 964	 * Be aware that smp_save_dump_secondary_cpus() triggers a system reset.
 965	 * Therefore CPU and device initialization should be done afterwards.
 966	 */
 967	smp_save_dump_secondary_cpus();
 968#endif
 969
 970	setup_resources();
 971	setup_lowcore();
 972	smp_fill_possible_mask();
 973	cpu_detect_mhz_feature();
 974        cpu_init();
 975	numa_setup();
 976	smp_detect_cpus();
 977	topology_init_early();
 978
 979	if (test_facility(193))
 980		static_branch_enable(&cpu_has_bear);
 981
 982	/*
 983	 * Create kernel page tables.
 984	 */
 985        paging_init();
 986
 987	/*
 988	 * After paging_init created the kernel page table, the new PSWs
 989	 * in lowcore can now run with DAT enabled.
 990	 */
 991#ifdef CONFIG_CRASH_DUMP
 992	smp_save_dump_ipl_cpu();
 993#endif
 994
 995        /* Setup default console */
 996	conmode_default();
 997	set_preferred_console();
 998
 999	apply_alternative_instructions();
1000	if (IS_ENABLED(CONFIG_EXPOLINE))
1001		nospec_init_branches();
1002
1003	/* Setup zfcp/nvme dump support */
1004	setup_zfcpdump();
1005
1006	/* Add system specific data to the random pool */
1007	setup_randomness();
1008}
1009
 /*
  * Architecture hook for the final stage of CPU initialization; the only
  * work done here is the call to sclp_init().
  */
 1010void __init arch_cpu_finalize_init(void)
 1011{
 1012	sclp_init();
 1013}
v5.4
   1// SPDX-License-Identifier: GPL-2.0
   2/*
   3 *  S390 version
   4 *    Copyright IBM Corp. 1999, 2012
   5 *    Author(s): Hartmut Penner (hp@de.ibm.com),
   6 *               Martin Schwidefsky (schwidefsky@de.ibm.com)
   7 *
   8 *  Derived from "arch/i386/kernel/setup.c"
   9 *    Copyright (C) 1995, Linus Torvalds
  10 */
  11
  12/*
  13 * This file handles the architecture-dependent parts of initialization
  14 */
  15
  16#define KMSG_COMPONENT "setup"
  17#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
  18
  19#include <linux/errno.h>
  20#include <linux/export.h>
  21#include <linux/sched.h>
  22#include <linux/sched/task.h>
  23#include <linux/cpu.h>
  24#include <linux/kernel.h>
  25#include <linux/memblock.h>
  26#include <linux/mm.h>
  27#include <linux/stddef.h>
  28#include <linux/unistd.h>
  29#include <linux/ptrace.h>
  30#include <linux/random.h>
  31#include <linux/user.h>
  32#include <linux/tty.h>
  33#include <linux/ioport.h>
  34#include <linux/delay.h>
  35#include <linux/init.h>
  36#include <linux/initrd.h>
  37#include <linux/root_dev.h>
  38#include <linux/console.h>
  39#include <linux/kernel_stat.h>
  40#include <linux/dma-contiguous.h>
  41#include <linux/device.h>
  42#include <linux/notifier.h>
  43#include <linux/pfn.h>
  44#include <linux/ctype.h>
  45#include <linux/reboot.h>
  46#include <linux/topology.h>
  47#include <linux/kexec.h>
  48#include <linux/crash_dump.h>
  49#include <linux/memory.h>
  50#include <linux/compat.h>
  51#include <linux/start_kernel.h>
 
 
  52
 
  53#include <asm/boot_data.h>
  54#include <asm/ipl.h>
  55#include <asm/facility.h>
  56#include <asm/smp.h>
  57#include <asm/mmu_context.h>
  58#include <asm/cpcmd.h>
  59#include <asm/lowcore.h>
  60#include <asm/nmi.h>
  61#include <asm/irq.h>
  62#include <asm/page.h>
  63#include <asm/ptrace.h>
  64#include <asm/sections.h>
  65#include <asm/ebcdic.h>
  66#include <asm/diag.h>
  67#include <asm/os_info.h>
  68#include <asm/sclp.h>
  69#include <asm/stacktrace.h>
  70#include <asm/sysinfo.h>
  71#include <asm/numa.h>
  72#include <asm/alternative.h>
  73#include <asm/nospec-branch.h>
  74#include <asm/mem_detect.h>
 
  75#include <asm/uv.h>
 
  76#include "entry.h"
  77
  78/*
  79 * Machine setup..
  80 */
   /*
    * Selected console type. NOTE(review): presumably written by the
    * SET_CONSOLE_* macros and read by the CONSOLE_IS_* macros - confirm in
    * <asm/setup.h>.
    */
   81unsigned int console_mode = 0;
   82EXPORT_SYMBOL(console_mode);
   83
   /*
    * Console device number; starts out as -1 and is overwritten by the
    * "condev=" parameter handler or by conmode_default().
    */
   84unsigned int console_devno = -1;
   85EXPORT_SYMBOL(console_devno);
   86
   /*
    * Console subchannel number; starts out as -1, is reset to -1 by the
    * "condev=" handler and is filled in by conmode_default().
    */
   87unsigned int console_irq = -1;
   88EXPORT_SYMBOL(console_irq);
   89
   /* ELF hardware capability bits and platform name, filled in by setup_hwcaps(). */
   90unsigned long elf_hwcap __read_mostly = 0;
   91char elf_platform[ELF_PLATFORM_SIZE];
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
  92
   /* Internal capability bits; setup_hwcaps() sets HWCAP_INT_SIE here. */
   93unsigned long int_hwcap = 0;
   94
   95#ifdef CONFIG_PROTECTED_VIRTUALIZATION_GUEST
   /* NOTE(review): presumably set by the boot stage when running as a protected guest - confirm. */
   96int __bootdata_preserved(prot_virt_guest);
   97#endif
 
  98
   /*
    * Variables declared through the __bootdata()/__bootdata_preserved()
    * macros. NOTE(review): presumably these are handed over from the early
    * boot stage - confirm against <asm/boot_data.h>.
    */
   99int __bootdata(noexec_disabled);
  /* Read by reserve_memory_end() to decide whether to reserve above memory_end. */
  100int __bootdata(memory_end_set);
  /* Memory limit; finalized in setup_memory_end(). */
  101unsigned long __bootdata(memory_end);
  /* Size of the vmalloc area; used by setup_memory_end() to place VMALLOC_START. */
  102unsigned long __bootdata(vmalloc_size);
  /* Fallback for memory_end in setup_memory_end() when memory_end is zero. */
  103unsigned long __bootdata(max_physmem_end);
  /* Detected memory blocks; consumed by memblock_add_mem_detect_info(). */
  104struct mem_detect_info __bootdata(mem_detect);
  105
  106struct exception_table_entry *__bootdata_preserved(__start_dma_ex_table);
  107struct exception_table_entry *__bootdata_preserved(__stop_dma_ex_table);
  108unsigned long __bootdata_preserved(__swsusp_reset_dma);
  109unsigned long __bootdata_preserved(__stext_dma);
  110unsigned long __bootdata_preserved(__etext_dma);
  /* [__sdma, __edma) is reserved in memblock by reserve_kernel(). */
  111unsigned long __bootdata_preserved(__sdma);
  112unsigned long __bootdata_preserved(__edma);
  113unsigned long __bootdata_preserved(__kaslr_offset);
 
 114
  /* Start of the vmalloc area; computed in setup_memory_end(). */
  115unsigned long VMALLOC_START;
  116EXPORT_SYMBOL(VMALLOC_START);
  117
  /* End of the vmalloc area (equal to MODULES_VADDR); computed in setup_memory_end(). */
  118unsigned long VMALLOC_END;
  119EXPORT_SYMBOL(VMALLOC_END);
  120
  /* Base of the struct page array; computed in setup_memory_end(). */
  121struct page *vmemmap;
  122EXPORT_SYMBOL(vmemmap);
  123
  /* Module area boundaries at the top of the kernel address space; computed in setup_memory_end(). */
  124unsigned long MODULES_VADDR;
  125unsigned long MODULES_END;
  126
  127/* An array with a pointer to the lowcore of every CPU. */
  128struct lowcore *lowcore_ptr[NR_CPUS];
  129EXPORT_SYMBOL(lowcore_ptr);
 130
 
 
 
 
 
 
 
 
 131/*
 132 * This is set up by the setup-routine at boot-time
 133 * for S390 need to find out, what we have to setup
 134 * using address 0x10400 ...
 135 */
 136
 137#include <asm/setup.h>
 138
 139/*
 140 * condev= and conmode= setup parameter.
 141 */
 142
 143static int __init condev_setup(char *str)
 144{
 145	int vdev;
 146
 147	vdev = simple_strtoul(str, &str, 0);
 148	if (vdev >= 0 && vdev < 65536) {
 149		console_devno = vdev;
 150		console_irq = -1;
 151	}
 152	return 1;
 153}
 154
 155__setup("condev=", condev_setup);
 156
 157static void __init set_preferred_console(void)
 158{
 159	if (CONSOLE_IS_3215 || CONSOLE_IS_SCLP)
 160		add_preferred_console("ttyS", 0, NULL);
 161	else if (CONSOLE_IS_3270)
 162		add_preferred_console("tty3270", 0, NULL);
 163	else if (CONSOLE_IS_VT220)
 164		add_preferred_console("ttyS", 1, NULL);
 165	else if (CONSOLE_IS_HVC)
 166		add_preferred_console("hvc", 0, NULL);
 167}
 168
 169static int __init conmode_setup(char *str)
 170{
 171#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 172	if (!strcmp(str, "hwc") || !strcmp(str, "sclp"))
 173                SET_CONSOLE_SCLP;
 174#endif
 175#if defined(CONFIG_TN3215_CONSOLE)
 176	if (!strcmp(str, "3215"))
 177		SET_CONSOLE_3215;
 178#endif
 179#if defined(CONFIG_TN3270_CONSOLE)
 180	if (!strcmp(str, "3270"))
 181		SET_CONSOLE_3270;
 182#endif
 183	set_preferred_console();
 184        return 1;
 185}
 186
 187__setup("conmode=", conmode_setup);
 188
 189static void __init conmode_default(void)
 190{
 191	char query_buffer[1024];
 192	char *ptr;
 193
 194        if (MACHINE_IS_VM) {
 195		cpcmd("QUERY CONSOLE", query_buffer, 1024, NULL);
 196		console_devno = simple_strtoul(query_buffer + 5, NULL, 16);
 197		ptr = strstr(query_buffer, "SUBCHANNEL =");
 198		console_irq = simple_strtoul(ptr + 13, NULL, 16);
 199		cpcmd("QUERY TERM", query_buffer, 1024, NULL);
 200		ptr = strstr(query_buffer, "CONMODE");
 201		/*
 202		 * Set the conmode to 3215 so that the device recognition 
 203		 * will set the cu_type of the console to 3215. If the
 204		 * conmode is 3270 and we don't set it back then both
 205		 * 3215 and the 3270 driver will try to access the console
 206		 * device (3215 as console and 3270 as normal tty).
 207		 */
 208		cpcmd("TERM CONMODE 3215", NULL, 0, NULL);
 209		if (ptr == NULL) {
 210#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 211			SET_CONSOLE_SCLP;
 212#endif
 213			return;
 214		}
 215		if (str_has_prefix(ptr + 8, "3270")) {
 216#if defined(CONFIG_TN3270_CONSOLE)
 217			SET_CONSOLE_3270;
 218#elif defined(CONFIG_TN3215_CONSOLE)
 219			SET_CONSOLE_3215;
 220#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 221			SET_CONSOLE_SCLP;
 222#endif
 223		} else if (str_has_prefix(ptr + 8, "3215")) {
 224#if defined(CONFIG_TN3215_CONSOLE)
 225			SET_CONSOLE_3215;
 226#elif defined(CONFIG_TN3270_CONSOLE)
 227			SET_CONSOLE_3270;
 228#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 229			SET_CONSOLE_SCLP;
 230#endif
 231		}
 232	} else if (MACHINE_IS_KVM) {
 233		if (sclp.has_vt220 && IS_ENABLED(CONFIG_SCLP_VT220_CONSOLE))
 234			SET_CONSOLE_VT220;
 235		else if (sclp.has_linemode && IS_ENABLED(CONFIG_SCLP_CONSOLE))
 236			SET_CONSOLE_SCLP;
 237		else
 238			SET_CONSOLE_HVC;
 239	} else {
 240#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
 241		SET_CONSOLE_SCLP;
 242#endif
 243	}
 244	if (IS_ENABLED(CONFIG_VT) && IS_ENABLED(CONFIG_DUMMY_CONSOLE))
 245		conswitchp = &dummy_con;
 246}
 247
 248#ifdef CONFIG_CRASH_DUMP
 249static void __init setup_zfcpdump(void)
 250{
 251	if (ipl_info.type != IPL_TYPE_FCP_DUMP)
 252		return;
 253	if (OLDMEM_BASE)
 254		return;
 255	strcat(boot_command_line, " cio_ignore=all,!ipldev,!condev");
 256	console_loglevel = 2;
 257}
 258#else
 259static inline void setup_zfcpdump(void) {}
 260#endif /* CONFIG_CRASH_DUMP */
 261
 262 /*
 263 * Reboot, halt and power_off stubs. They just call _machine_restart,
 264 * _machine_halt or _machine_power_off. 
 265 */
 266
 267void machine_restart(char *command)
 268{
 269	if ((!in_interrupt() && !in_atomic()) || oops_in_progress)
 270		/*
 271		 * Only unblank the console if we are called in enabled
 272		 * context or a bust_spinlocks cleared the way for us.
 273		 */
 274		console_unblank();
 275	_machine_restart(command);
 276}
 277
 278void machine_halt(void)
 279{
 280	if (!in_interrupt() || oops_in_progress)
 281		/*
 282		 * Only unblank the console if we are called in enabled
 283		 * context or a bust_spinlocks cleared the way for us.
 284		 */
 285		console_unblank();
 286	_machine_halt();
 287}
 288
 289void machine_power_off(void)
 290{
 291	if (!in_interrupt() || oops_in_progress)
 292		/*
 293		 * Only unblank the console if we are called in enabled
 294		 * context or a bust_spinlocks cleared the way for us.
 295		 */
 296		console_unblank();
 297	_machine_power_off();
 298}
 299
 300/*
 301 * Dummy power off function.
 302 */
  303void (*pm_power_off)(void) = machine_power_off;
  304EXPORT_SYMBOL_GPL(pm_power_off);
  305
  /*
   * Stack used for PSW restart; allocated in setup_lowcore_dat_off() and
   * stored already advanced by STACK_INIT_OFFSET.
   */
  306void *restart_stack __section(.data);
 307
 308unsigned long stack_alloc(void)
 309{
 310#ifdef CONFIG_VMAP_STACK
 311	return (unsigned long)
 312		__vmalloc_node_range(THREAD_SIZE, THREAD_SIZE,
 313				     VMALLOC_START, VMALLOC_END,
 314				     THREADINFO_GFP,
 315				     PAGE_KERNEL, 0, NUMA_NO_NODE,
 316				     __builtin_return_address(0));
 317#else
 318	return __get_free_pages(GFP_KERNEL, THREAD_SIZE_ORDER);
 319#endif
 320}
 321
  /*
   * Release a stack at address @stack: vfree() with CONFIG_VMAP_STACK,
   * free_pages() of order THREAD_SIZE_ORDER otherwise. This mirrors the two
   * allocation paths of stack_alloc().
   */
  322void stack_free(unsigned long stack)
  323{
  324#ifdef CONFIG_VMAP_STACK
  325	vfree((void *) stack);
  326#else
  327	free_pages(stack, THREAD_SIZE_ORDER);
  328#endif
  329}
 330
 331int __init arch_early_irq_init(void)
 332{
 333	unsigned long stack;
 334
 335	stack = __get_free_pages(GFP_KERNEL, THREAD_SIZE_ORDER);
 336	if (!stack)
 337		panic("Couldn't allocate async stack");
 338	S390_lowcore.async_stack = stack + STACK_INIT_OFFSET;
 339	return 0;
 
 340}
 341
 342static int __init async_stack_realloc(void)
 343{
 344	unsigned long old, new;
 345
 346	old = S390_lowcore.async_stack - STACK_INIT_OFFSET;
 347	new = stack_alloc();
 348	if (!new)
 349		panic("Couldn't allocate async stack");
 350	S390_lowcore.async_stack = new + STACK_INIT_OFFSET;
 351	free_pages(old, THREAD_SIZE_ORDER);
 352	return 0;
 353}
 354early_initcall(async_stack_realloc);
 355
  /*
   * Switch the current task to a stack obtained from stack_alloc() and
   * continue in rest_init() on that stack. Panics if no stack can be
   * allocated. Does not return.
   */
  356void __init arch_call_rest_init(void)
  357{
  358	struct stack_frame *frame;
  359	unsigned long stack;
  360
  361	stack = stack_alloc();
  362	if (!stack)
  363		panic("Couldn't allocate kernel stack");
  	/* Make the new stack the task's stack before it is used. */
  364	current->stack = (void *) stack;
  365#ifdef CONFIG_VMAP_STACK
  366	current->stack_vm_area = (void *) stack;
  367#endif
  368	set_task_stack_end_magic(current);
  	/* From here on "stack" is the initial stack pointer, not the base. */
  369	stack += STACK_INIT_OFFSET;
  370	S390_lowcore.kernel_stack = stack;
  	/* Start with a zeroed stack frame at the initial stack pointer. */
  371	frame = (struct stack_frame *) stack;
  372	memset(frame, 0, sizeof(*frame));
  373	/* Branch to rest_init on the new stack, never returns */
  	/* NOTE(review): register 15 is presumably the stack pointer - confirm against the s390 ABI. */
  374	asm volatile(
  375		"	la	15,0(%[_frame])\n"
  376		"	jg	rest_init\n"
  377		: : [_frame] "a" (frame));
  378}
 379
  /*
   * Build the lowcore for the boot CPU and switch to it.
   *
   * A new lowcore is allocated with memblock_alloc_low(), its new PSWs are
   * pointed at the interrupt handlers, and state already collected in the
   * current lowcore (machine flags, facility lists, timers, ...) is copied
   * over. The global restart stack is allocated and the restart fields are
   * mirrored into the absolute zero lowcore. Finally the prefix is set to the
   * new lowcore and it is recorded in lowcore_ptr[0].
   *
   * setup_lowcore_dat_on() later adds PSW_MASK_DAT to several of the new PSW
   * masks set up here.
   */
  380static void __init setup_lowcore_dat_off(void)
  381{
  382	struct lowcore *lc;
  383
  384	/*
  385	 * Setup lowcore for boot cpu
  386	 */
  387	BUILD_BUG_ON(sizeof(struct lowcore) != LC_PAGES * PAGE_SIZE);
  	/* The lowcore is aligned to its own size. */
  388	lc = memblock_alloc_low(sizeof(*lc), sizeof(*lc));
  389	if (!lc)
  390		panic("%s: Failed to allocate %zu bytes align=%zx\n",
  391		      __func__, sizeof(*lc), sizeof(*lc));
  392
  	/* New PSWs: one mask/handler address pair per interruption class. */
  393	lc->restart_psw.mask = PSW_KERNEL_BITS;
  394	lc->restart_psw.addr = (unsigned long) restart_int_handler;
  395	lc->external_new_psw.mask = PSW_KERNEL_BITS | PSW_MASK_MCHECK;
  396	lc->external_new_psw.addr = (unsigned long) ext_int_handler;
  397	lc->svc_new_psw.mask = PSW_KERNEL_BITS |
  398		PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK;
  399	lc->svc_new_psw.addr = (unsigned long) system_call;
  400	lc->program_new_psw.mask = PSW_KERNEL_BITS | PSW_MASK_MCHECK;
  401	lc->program_new_psw.addr = (unsigned long) pgm_check_handler;
  402	lc->mcck_new_psw.mask = PSW_KERNEL_BITS;
  403	lc->mcck_new_psw.addr = (unsigned long) mcck_int_handler;
  404	lc->io_new_psw.mask = PSW_KERNEL_BITS | PSW_MASK_MCHECK;
  405	lc->io_new_psw.addr = (unsigned long) io_int_handler;
  406	lc->clock_comparator = clock_comparator_max;
  	/* The nodat stack lives at the top of init_thread_union, below a pt_regs area. */
  407	lc->nodat_stack = ((unsigned long) &init_thread_union)
  408		+ THREAD_SIZE - STACK_FRAME_OVERHEAD - sizeof(struct pt_regs);
  409	lc->current_task = (unsigned long)&init_task;
  410	lc->lpp = LPP_MAGIC;
  	/* Carry over state that was already collected in the current lowcore. */
  411	lc->machine_flags = S390_lowcore.machine_flags;
  412	lc->preempt_count = S390_lowcore.preempt_count;
  413	lc->stfl_fac_list = S390_lowcore.stfl_fac_list;
  414	memcpy(lc->stfle_fac_list, S390_lowcore.stfle_fac_list,
  415	       sizeof(lc->stfle_fac_list));
  416	memcpy(lc->alt_stfle_fac_list, S390_lowcore.alt_stfle_fac_list,
  417	       sizeof(lc->alt_stfle_fac_list));
  418	nmi_alloc_boot_cpu(lc);
  419	vdso_alloc_boot_cpu(lc);
  420	lc->sync_enter_timer = S390_lowcore.sync_enter_timer;
  421	lc->async_enter_timer = S390_lowcore.async_enter_timer;
  422	lc->exit_timer = S390_lowcore.exit_timer;
  423	lc->user_timer = S390_lowcore.user_timer;
  424	lc->system_timer = S390_lowcore.system_timer;
  425	lc->steal_timer = S390_lowcore.steal_timer;
  426	lc->last_update_timer = S390_lowcore.last_update_timer;
  427	lc->last_update_clock = S390_lowcore.last_update_clock;
  428
  429	/*
  430	 * Allocate the global restart stack which is the same for
  431	 * all CPUs in case *one* of them does a PSW restart.
  432	 */
  433	restart_stack = memblock_alloc(THREAD_SIZE, THREAD_SIZE);
  434	if (!restart_stack)
  435		panic("%s: Failed to allocate %lu bytes align=0x%lx\n",
  436		      __func__, THREAD_SIZE, THREAD_SIZE);
  	/* Keep the initial stack pointer, not the base address. */
  437	restart_stack += STACK_INIT_OFFSET;
  438
  439	/*
  440	 * Set up PSW restart to call ipl.c:do_restart(). Copy the relevant
  441	 * restart data to the absolute zero lowcore. This is necessary if
  442	 * PSW restart is done on an offline CPU that has lowcore zero.
  443	 */
  444	lc->restart_stack = (unsigned long) restart_stack;
  445	lc->restart_fn = (unsigned long) do_restart;
  446	lc->restart_data = 0;
  447	lc->restart_source = -1UL;
  448
  449	/* Setup absolute zero lowcore */
  450	mem_assign_absolute(S390_lowcore.restart_stack, lc->restart_stack);
  451	mem_assign_absolute(S390_lowcore.restart_fn, lc->restart_fn);
  452	mem_assign_absolute(S390_lowcore.restart_data, lc->restart_data);
  453	mem_assign_absolute(S390_lowcore.restart_source, lc->restart_source);
  454	mem_assign_absolute(S390_lowcore.restart_psw, lc->restart_psw);
  455
  	/* Spinlock setup for CPU 0. */
  456	lc->spinlock_lockval = arch_spin_lockval(0);
  457	lc->spinlock_index = 0;
  458	arch_spin_lock_setup(0);
  459	lc->br_r1_trampoline = 0x07f1;	/* br %r1 */
  460
  	/* Activate the new lowcore and remember it as the lowcore of CPU 0. */
  461	set_prefix((u32)(unsigned long) lc);
  462	lowcore_ptr[0] = lc;
  463}
 464
  /*
   * Add PSW_MASK_DAT to the external, SVC, program and I/O new PSW masks of
   * the current lowcore.
   *
   * The updates are bracketed by __ctl_clear_bit(0, 28)/__ctl_set_bit(0, 28).
   * NOTE(review): presumably this temporarily lifts a protection on lowcore
   * writes - confirm what bit 28 of control register 0 stands for.
   */
  465static void __init setup_lowcore_dat_on(void)
  466{
  467	__ctl_clear_bit(0, 28);
  468	S390_lowcore.external_new_psw.mask |= PSW_MASK_DAT;
  469	S390_lowcore.svc_new_psw.mask |= PSW_MASK_DAT;
  470	S390_lowcore.program_new_psw.mask |= PSW_MASK_DAT;
  471	S390_lowcore.io_new_psw.mask |= PSW_MASK_DAT;
  472	__ctl_set_bit(0, 28);
  473}
 474
  /*
   * Resource descriptors for the kernel image sections. Their start/end
   * addresses are filled in by setup_resources(), which also inserts them
   * below the "System RAM" resource that contains them.
   */
  475static struct resource code_resource = {
  476	.name  = "Kernel code",
  477	.flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
  478};
  479
  480static struct resource data_resource = {
  481	.name = "Kernel data",
  482	.flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
  483};
  484
  485static struct resource bss_resource = {
  486	.name = "Kernel bss",
  487	.flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
  488};
  489
  /* The resources above, in the order setup_resources() walks them. */
  490static struct resource __initdata *standard_resources[] = {
  491	&code_resource,
  492	&data_resource,
  493	&bss_resource,
  494};
 495
 496static void __init setup_resources(void)
 497{
 498	struct resource *res, *std_res, *sub_res;
 499	struct memblock_region *reg;
 500	int j;
 
 501
 502	code_resource.start = (unsigned long) _text;
 503	code_resource.end = (unsigned long) _etext - 1;
 504	data_resource.start = (unsigned long) _etext;
 505	data_resource.end = (unsigned long) _edata - 1;
 506	bss_resource.start = (unsigned long) __bss_start;
 507	bss_resource.end = (unsigned long) __bss_stop - 1;
 508
 509	for_each_memblock(memory, reg) {
 510		res = memblock_alloc(sizeof(*res), 8);
 511		if (!res)
 512			panic("%s: Failed to allocate %zu bytes align=0x%x\n",
 513			      __func__, sizeof(*res), 8);
 514		res->flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM;
 515
 516		res->name = "System RAM";
 517		res->start = reg->base;
 518		res->end = reg->base + reg->size - 1;
 
 
 
 
 
 519		request_resource(&iomem_resource, res);
 520
 521		for (j = 0; j < ARRAY_SIZE(standard_resources); j++) {
 522			std_res = standard_resources[j];
 523			if (std_res->start < res->start ||
 524			    std_res->start > res->end)
 525				continue;
 526			if (std_res->end > res->end) {
 527				sub_res = memblock_alloc(sizeof(*sub_res), 8);
 528				if (!sub_res)
 529					panic("%s: Failed to allocate %zu bytes align=0x%x\n",
 530					      __func__, sizeof(*sub_res), 8);
 531				*sub_res = *std_res;
 532				sub_res->end = res->end;
 533				std_res->start = res->end + 1;
 534				request_resource(res, sub_res);
 535			} else {
 536				request_resource(res, std_res);
 537			}
 538		}
 539	}
 540#ifdef CONFIG_CRASH_DUMP
 541	/*
 542	 * Re-add removed crash kernel memory as reserved memory. This makes
 543	 * sure it will be mapped with the identity mapping and struct pages
 544	 * will be created, so it can be resized later on.
 545	 * However add it later since the crash kernel resource should not be
 546	 * part of the System RAM resource.
 547	 */
 548	if (crashk_res.end) {
 549		memblock_add_node(crashk_res.start, resource_size(&crashk_res), 0);
 
 550		memblock_reserve(crashk_res.start, resource_size(&crashk_res));
 551		insert_resource(&iomem_resource, &crashk_res);
 552	}
 553#endif
 554}
 555
  /*
   * Lay out the kernel virtual address space and finalize memory_end.
   *
   * Picks the size of the kernel address space (vmax), places the module and
   * vmalloc areas at its top, derives the vmemmap base from the remaining
   * space, clamps memory_end accordingly, sets max_pfn/max_low_pfn and
   * removes all memblock memory at or above memory_end.
   */
  556static void __init setup_memory_end(void)
  557{
  558	unsigned long vmax, tmp;
  559
  560	/* Choose kernel address space layout: 3 or 4 levels. */
  561	if (IS_ENABLED(CONFIG_KASAN)) {
  562		vmax = IS_ENABLED(CONFIG_KASAN_S390_4_LEVEL_PAGING)
  563			   ? _REGION1_SIZE
  564			   : _REGION2_SIZE;
  565	} else {
  		/* Space needed for the 1:1 mapping plus one struct page per page. */
  566		tmp = (memory_end ?: max_physmem_end) / PAGE_SIZE;
  567		tmp = tmp * (sizeof(struct page) + PAGE_SIZE);
  568		if (tmp + vmalloc_size + MODULES_LEN <= _REGION2_SIZE)
  569			vmax = _REGION2_SIZE; /* 3-level kernel page table */
  570		else
  571			vmax = _REGION1_SIZE; /* 4-level kernel page table */
  572	}
  573
  574	/* module area is at the end of the kernel address space. */
  575	MODULES_END = vmax;
  576	MODULES_VADDR = MODULES_END - MODULES_LEN;
  	/* The vmalloc area sits directly below the module area. */
  577	VMALLOC_END = MODULES_VADDR;
  578	VMALLOC_START = VMALLOC_END - vmalloc_size;
  579
  580	/* Split remaining virtual space between 1:1 mapping & vmemmap array */
  581	tmp = VMALLOC_START / (PAGE_SIZE + sizeof(struct page));
  582	/* vmemmap contains a multiple of PAGES_PER_SECTION struct pages */
  583	tmp = SECTION_ALIGN_UP(tmp);
  	/* Convert the page count into the start address of the struct page array. */
  584	tmp = VMALLOC_START - tmp * sizeof(struct page);
  585	tmp &= ~((vmax >> 11) - 1);	/* align to page table level */
  586	tmp = min(tmp, 1UL << MAX_PHYSMEM_BITS);
  587	vmemmap = (struct page *) tmp;
  588
  589	/* Take care that memory_end is set and <= vmemmap */
  590	memory_end = min(memory_end ?: max_physmem_end, (unsigned long)vmemmap);
  591#ifdef CONFIG_KASAN
  592	/* fit in kasan shadow memory region between 1:1 and vmemmap */
  593	memory_end = min(memory_end, KASAN_SHADOW_START);
  594	vmemmap = max(vmemmap, (struct page *)KASAN_SHADOW_END);
  595#endif
  596	max_pfn = max_low_pfn = PFN_DOWN(memory_end);
  	/* Drop everything at or above memory_end from memblock. */
  597	memblock_remove(memory_end, ULONG_MAX);
  598
  599	pr_notice("The maximum memory size is %luMB\n", memory_end >> 20);
  600}
 601
 602#ifdef CONFIG_CRASH_DUMP
 603
 604/*
 605 * When kdump is enabled, we have to ensure that no memory from
 606 * the area [0 - crashkernel memory size] and
 607 * [crashk_res.start - crashk_res.end] is set offline.
 
 608 */
 609static int kdump_mem_notifier(struct notifier_block *nb,
 610			      unsigned long action, void *data)
 611{
 612	struct memory_notify *arg = data;
 613
 614	if (action != MEM_GOING_OFFLINE)
 615		return NOTIFY_OK;
 616	if (arg->start_pfn < PFN_DOWN(resource_size(&crashk_res)))
 617		return NOTIFY_BAD;
 618	if (arg->start_pfn > PFN_DOWN(crashk_res.end))
 619		return NOTIFY_OK;
 620	if (arg->start_pfn + arg->nr_pages - 1 < PFN_DOWN(crashk_res.start))
 621		return NOTIFY_OK;
 622	return NOTIFY_BAD;
 623}
 624
 625static struct notifier_block kdump_mem_nb = {
 626	.notifier_call = kdump_mem_notifier,
 627};
 628
 629#endif
 630
 631/*
 632 * Make sure that the area behind memory_end is protected
 633 */
 634static void reserve_memory_end(void)
 635{
 636	if (memory_end_set)
 637		memblock_reserve(memory_end, ULONG_MAX);
 638}
 639
 640/*
 641 * Make sure that oldmem, where the dump is stored, is protected
 642 */
 643static void reserve_oldmem(void)
 644{
 645#ifdef CONFIG_CRASH_DUMP
 646	if (OLDMEM_BASE)
 647		/* Forget all memory above the running kdump system */
 648		memblock_reserve(OLDMEM_SIZE, (phys_addr_t)ULONG_MAX);
 649#endif
 650}
 651
 652/*
 653 * Make sure that oldmem, where the dump is stored, is protected
 654 */
 655static void remove_oldmem(void)
 656{
 657#ifdef CONFIG_CRASH_DUMP
 658	if (OLDMEM_BASE)
 659		/* Forget all memory above the running kdump system */
 660		memblock_remove(OLDMEM_SIZE, (phys_addr_t)ULONG_MAX);
 661#endif
 662}
 663
 664/*
 665 * Reserve memory for kdump kernel to be loaded with kexec
 666 */
  /*
   * Parses the crashkernel setting from the boot command line, picks a
   * suitable base address (reusing OLDMEM when the request fits into it,
   * otherwise searching free memblock memory), registers the kdump memory
   * notifier, removes the area from memblock and records it in crashk_res
   * and os_info. Every failure path just logs (or silently returns) and
   * leaves crashk_res untouched. No-op without CONFIG_CRASH_DUMP.
   */
  667static void __init reserve_crashkernel(void)
  668{
  669#ifdef CONFIG_CRASH_DUMP
  670	unsigned long long crash_base, crash_size;
  671	phys_addr_t low, high;
  672	int rc;
  673
  674	rc = parse_crashkernel(boot_command_line, memory_end, &crash_size,
  675			       &crash_base);
  676
  	/* Round both values up to the kexec crash memory alignment. */
  677	crash_base = ALIGN(crash_base, KEXEC_CRASH_MEM_ALIGN);
  678	crash_size = ALIGN(crash_size, KEXEC_CRASH_MEM_ALIGN);
  	/* Nothing requested, or the request could not be parsed. */
  679	if (rc || crash_size == 0)
  680		return;
  681
  682	if (memblock.memory.regions[0].size < crash_size) {
  683		pr_info("crashkernel reservation failed: %s\n",
  684			"first memory chunk must be at least crashkernel size");
  685		return;
  686	}
  687
  	/* Without an explicit base, try OLDMEM_BASE first. */
  688	low = crash_base ?: OLDMEM_BASE;
  689	high = low + crash_size;
  690	if (low >= OLDMEM_BASE && high <= OLDMEM_BASE + OLDMEM_SIZE) {
  691		/* The crashkernel fits into OLDMEM, reuse OLDMEM */
  692		crash_base = low;
  693	} else {
  694		/* Find suitable area in free memory */
  		/* Lowest acceptable base: the larger of crash_size and the HSA size. */
  695		low = max_t(unsigned long, crash_size, sclp.hsa_size);
  696		high = crash_base ? crash_base + crash_size : ULONG_MAX;
  697
  698		if (crash_base && crash_base < low) {
  699			pr_info("crashkernel reservation failed: %s\n",
  700				"crash_base too low");
  701			return;
  702		}
  		/* An explicit base pins the search window to exactly that range. */
  703		low = crash_base ?: low;
  704		crash_base = memblock_find_in_range(low, high, crash_size,
  705						    KEXEC_CRASH_MEM_ALIGN);
  706	}
  707
  708	if (!crash_base) {
  709		pr_info("crashkernel reservation failed: %s\n",
  710			"no suitable area found");
  711		return;
  712	}
  713
  714	if (register_memory_notifier(&kdump_mem_nb))
  715		return;
  716
  717	if (!OLDMEM_BASE && MACHINE_IS_VM)
  718		diag10_range(PFN_DOWN(crash_base), PFN_DOWN(crash_size));
  719	crashk_res.start = crash_base;
  720	crashk_res.end = crash_base + crash_size - 1;
  	/* setup_resources() re-adds this range later as reserved memory. */
  721	memblock_remove(crash_base, crash_size);
  722	pr_info("Reserving %lluMB of memory at %lluMB "
  723		"for crashkernel (System RAM: %luMB)\n",
  724		crash_size >> 20, crash_base >> 20,
  725		(unsigned long)memblock.memory.total_size >> 20);
  726	os_info_crashkernel_add(crash_base, crash_size);
  727#endif
  728}
 729
 730/*
 731 * Reserve the initrd from being used by memblock
 732 */
 733static void __init reserve_initrd(void)
 734{
 735#ifdef CONFIG_BLK_DEV_INITRD
 736	if (!INITRD_START || !INITRD_SIZE)
 
 737		return;
 738	initrd_start = INITRD_START;
 739	initrd_end = initrd_start + INITRD_SIZE;
 740	memblock_reserve(INITRD_START, INITRD_SIZE);
 741#endif
 742}
 743
 744/*
 745 * Reserve the memory area used to pass the certificate lists
 746 */
 747static void __init reserve_certificate_list(void)
 748{
 749	if (ipl_cert_list_addr)
 750		memblock_reserve(ipl_cert_list_addr, ipl_cert_list_size);
 751}
 752
 753static void __init reserve_mem_detect_info(void)
 754{
 755	unsigned long start, size;
 756
 757	get_mem_detect_reserved(&start, &size);
 758	if (size)
 759		memblock_reserve(start, size);
 760}
 761
 762static void __init free_mem_detect_info(void)
 763{
 764	unsigned long start, size;
 765
 766	get_mem_detect_reserved(&start, &size);
 767	if (size)
 768		memblock_free(start, size);
 769}
 770
 771static void __init memblock_physmem_add(phys_addr_t start, phys_addr_t size)
 772{
 773	memblock_dbg("memblock_physmem_add: [%#016llx-%#016llx]\n",
 774		     start, start + size - 1);
 775	memblock_add_range(&memblock.memory, start, size, 0, 0);
 776	memblock_add_range(&memblock.physmem, start, size, 0, 0);
 777}
 778
 779static const char * __init get_mem_info_source(void)
 780{
 781	switch (mem_detect.info_source) {
 782	case MEM_DETECT_SCLP_STOR_INFO:
 783		return "sclp storage info";
 784	case MEM_DETECT_DIAG260:
 785		return "diag260";
 786	case MEM_DETECT_SCLP_READ_INFO:
 787		return "sclp read info";
 788	case MEM_DETECT_BIN_SEARCH:
 789		return "binary search";
 790	}
 791	return "none";
 792}
 793
 794static void __init memblock_add_mem_detect_info(void)
 795{
 796	unsigned long start, end;
 797	int i;
 798
 799	memblock_dbg("physmem info source: %s (%hhd)\n",
 800		     get_mem_info_source(), mem_detect.info_source);
 801	/* keep memblock lists close to the kernel */
 802	memblock_set_bottom_up(true);
 803	for_each_mem_detect_block(i, &start, &end)
 
 
 804		memblock_physmem_add(start, end - start);
 805	memblock_set_bottom_up(false);
 806	memblock_dump_all();
 807}
 808
 809/*
 810 * Check for initrd being in usable memory
 811 */
 812static void __init check_initrd(void)
 813{
 814#ifdef CONFIG_BLK_DEV_INITRD
 815	if (INITRD_START && INITRD_SIZE &&
 816	    !memblock_is_region_memory(INITRD_START, INITRD_SIZE)) {
 817		pr_err("The initial RAM disk does not fit into the memory\n");
 818		memblock_free(INITRD_START, INITRD_SIZE);
 819		initrd_start = initrd_end = 0;
 
 
 820	}
 821#endif
 822}
 823
 824/*
 825 * Reserve memory used for lowcore/command line/kernel image.
 826 */
 827static void __init reserve_kernel(void)
 828{
 829	unsigned long start_pfn = PFN_UP(__pa(_end));
 830
 831	memblock_reserve(0, HEAD_END);
 832	memblock_reserve((unsigned long)_stext, PFN_PHYS(start_pfn)
 833			 - (unsigned long)_stext);
 834	memblock_reserve(__sdma, __edma - __sdma);
 835}
 836
 837static void __init setup_memory(void)
 838{
 839	struct memblock_region *reg;
 
 840
 841	/*
 842	 * Init storage key for present memory
 843	 */
 844	for_each_memblock(memory, reg) {
 845		storage_key_init_range(reg->base, reg->base + reg->size);
 846	}
 847	psw_set_key(PAGE_DEFAULT_KEY);
 848
 849	/* Only cosmetics */
 850	memblock_enforce_memory_limit(memblock_end_of_DRAM());
 851}
 852
 853/*
 854 * Setup hardware capabilities.
 855 */
 856static int __init setup_hwcaps(void)
 857{
 858	static const int stfl_bits[6] = { 0, 2, 7, 17, 19, 21 };
 859	struct cpuid cpu_id;
 860	int i;
 861
 862	/*
 863	 * The store facility list bits numbers as found in the principles
 864	 * of operation are numbered with bit 1UL<<31 as number 0 to
 865	 * bit 1UL<<0 as number 31.
 866	 *   Bit 0: instructions named N3, "backported" to esa-mode
 867	 *   Bit 2: z/Architecture mode is active
 868	 *   Bit 7: the store-facility-list-extended facility is installed
 869	 *   Bit 17: the message-security assist is installed
 870	 *   Bit 19: the long-displacement facility is installed
 871	 *   Bit 21: the extended-immediate facility is installed
 872	 *   Bit 22: extended-translation facility 3 is installed
 873	 *   Bit 30: extended-translation facility 3 enhancement facility
 874	 * These get translated to:
 875	 *   HWCAP_S390_ESAN3 bit 0, HWCAP_S390_ZARCH bit 1,
 876	 *   HWCAP_S390_STFLE bit 2, HWCAP_S390_MSA bit 3,
 877	 *   HWCAP_S390_LDISP bit 4, HWCAP_S390_EIMM bit 5 and
 878	 *   HWCAP_S390_ETF3EH bit 8 (22 && 30).
 879	 */
 880	for (i = 0; i < 6; i++)
 881		if (test_facility(stfl_bits[i]))
 882			elf_hwcap |= 1UL << i;
 883
 884	if (test_facility(22) && test_facility(30))
 885		elf_hwcap |= HWCAP_S390_ETF3EH;
 886
 887	/*
 888	 * Check for additional facilities with store-facility-list-extended.
 889	 * stfle stores doublewords (8 byte) with bit 1ULL<<63 as bit 0
 890	 * and 1ULL<<0 as bit 63. Bits 0-31 contain the same information
 891	 * as stored by stfl, bits 32-xxx contain additional facilities.
 892	 * How many facility words are stored depends on the number of
 893	 * doublewords passed to the instruction. The additional facilities
 894	 * are:
 895	 *   Bit 42: decimal floating point facility is installed
 896	 *   Bit 44: perform floating point operation facility is installed
 897	 * translated to:
 898	 *   HWCAP_S390_DFP bit 6 (42 && 44).
 899	 */
 900	if ((elf_hwcap & (1UL << 2)) && test_facility(42) && test_facility(44))
 901		elf_hwcap |= HWCAP_S390_DFP;
 902
 903	/*
 904	 * Huge page support HWCAP_S390_HPAGE is bit 7.
 905	 */
 906	if (MACHINE_HAS_EDAT1)
 907		elf_hwcap |= HWCAP_S390_HPAGE;
 908
 909	/*
 910	 * 64-bit register support for 31-bit processes
 911	 * HWCAP_S390_HIGH_GPRS is bit 9.
 912	 */
 913	elf_hwcap |= HWCAP_S390_HIGH_GPRS;
 914
 915	/*
 916	 * Transactional execution support HWCAP_S390_TE is bit 10.
 917	 */
 918	if (MACHINE_HAS_TE)
 919		elf_hwcap |= HWCAP_S390_TE;
 920
 921	/*
 922	 * Vector extension HWCAP_S390_VXRS is bit 11. The Vector extension
 923	 * can be disabled with the "novx" parameter. Use MACHINE_HAS_VX
 924	 * instead of facility bit 129.
 925	 */
 926	if (MACHINE_HAS_VX) {
 927		elf_hwcap |= HWCAP_S390_VXRS;
 928		if (test_facility(134))
 929			elf_hwcap |= HWCAP_S390_VXRS_EXT;
 930		if (test_facility(135))
 931			elf_hwcap |= HWCAP_S390_VXRS_BCD;
 932		if (test_facility(148))
 933			elf_hwcap |= HWCAP_S390_VXRS_EXT2;
 934		if (test_facility(152))
 935			elf_hwcap |= HWCAP_S390_VXRS_PDE;
 936	}
 937	if (test_facility(150))
 938		elf_hwcap |= HWCAP_S390_SORT;
 939	if (test_facility(151))
 940		elf_hwcap |= HWCAP_S390_DFLT;
 941
 942	/*
 943	 * Guarded storage support HWCAP_S390_GS is bit 12.
 944	 */
 945	if (MACHINE_HAS_GS)
 946		elf_hwcap |= HWCAP_S390_GS;
 947
 948	get_cpu_id(&cpu_id);
 949	add_device_randomness(&cpu_id, sizeof(cpu_id));
 950	switch (cpu_id.machine) {
 951	case 0x2064:
 952	case 0x2066:
 953	default:	/* Use "z900" as default for 64 bit kernels. */
 954		strcpy(elf_platform, "z900");
 955		break;
 956	case 0x2084:
 957	case 0x2086:
 958		strcpy(elf_platform, "z990");
 959		break;
 960	case 0x2094:
 961	case 0x2096:
 962		strcpy(elf_platform, "z9-109");
 963		break;
 964	case 0x2097:
 965	case 0x2098:
 966		strcpy(elf_platform, "z10");
 967		break;
 968	case 0x2817:
 969	case 0x2818:
 970		strcpy(elf_platform, "z196");
 971		break;
 972	case 0x2827:
 973	case 0x2828:
 974		strcpy(elf_platform, "zEC12");
 975		break;
 976	case 0x2964:
 977	case 0x2965:
 978		strcpy(elf_platform, "z13");
 979		break;
 980	case 0x3906:
 981	case 0x3907:
 982		strcpy(elf_platform, "z14");
 983		break;
 984	case 0x8561:
 985	case 0x8562:
 986		strcpy(elf_platform, "z15");
 987		break;
 988	}
 989
 990	/*
 991	 * Virtualization support HWCAP_INT_SIE is bit 0.
 992	 */
 993	if (sclp.has_sief2)
 994		int_hwcap |= HWCAP_INT_SIE;
 995
 996	return 0;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 997}
/* Register setup_hwcaps() to be run as an arch-level initcall. */
arch_initcall(setup_hwcaps);
 999
1000/*
1001 * Add system information as device randomness
1002 */
1003static void __init setup_randomness(void)
1004{
1005	struct sysinfo_3_2_2 *vmms;
1006
1007	vmms = (struct sysinfo_3_2_2 *) memblock_phys_alloc(PAGE_SIZE,
1008							    PAGE_SIZE);
1009	if (!vmms)
1010		panic("Failed to allocate memory for sysinfo structure\n");
1011
1012	if (stsi(vmms, 3, 2, 2) == 0 && vmms->count)
1013		add_device_randomness(&vmms->vm, sizeof(vmms->vm[0]) * vmms->count);
1014	memblock_free((unsigned long) vmms, PAGE_SIZE);
1015}
1016
1017/*
1018 * Find the correct size for the task_struct. This depends on
1019 * the size of the struct fpu at the end of the thread_struct
1020 * which is embedded in the task_struct.
1021 */
1022static void __init setup_task_size(void)
1023{
1024	int task_size = sizeof(struct task_struct);
1025
1026	if (!MACHINE_HAS_VX) {
1027		task_size -= sizeof(__vector128) * __NUM_VXRS;
1028		task_size += sizeof(freg_t) * __NUM_FPRS;
1029	}
1030	arch_task_struct_size = task_size;
1031}
1032
1033/*
1034 * Issue diagnose 318 to set the control program name and
1035 * version codes.
1036 */
1037static void __init setup_control_program_code(void)
1038{
1039	union diag318_info diag318_info = {
1040		.cpnc = CPNC_LINUX,
1041		.cpvc_linux = 0,
1042		.cpvc_distro = {0},
1043	};
1044
1045	if (!sclp.has_diag318)
1046		return;
1047
1048	diag_stat_inc(DIAG_STAT_X318);
1049	asm volatile("diag %0,0,0x318\n" : : "d" (diag318_info.val));
1050}
1051
1052/*
1053 * Print the component list from the IPL report
1054 */
1055static void __init log_component_list(void)
1056{
1057	struct ipl_rb_component_entry *ptr, *end;
1058	char *str;
1059
1060	if (!early_ipl_comp_list_addr)
1061		return;
1062	if (ipl_block.hdr.flags & IPL_PL_FLAG_IPLSR)
1063		pr_info("Linux is running with Secure-IPL enabled\n");
1064	else
1065		pr_info("Linux is running with Secure-IPL disabled\n");
1066	ptr = (void *) early_ipl_comp_list_addr;
1067	end = (void *) ptr + early_ipl_comp_list_size;
1068	pr_info("The IPL report contains the following components:\n");
1069	while (ptr < end) {
1070		if (ptr->flags & IPL_RB_COMPONENT_FLAG_SIGNED) {
1071			if (ptr->flags & IPL_RB_COMPONENT_FLAG_VERIFIED)
1072				str = "signed, verified";
1073			else
1074				str = "signed, verification failed";
1075		} else {
1076			str = "not signed";
1077		}
1078		pr_info("%016llx - %016llx (%s)\n",
1079			ptr->addr, ptr->addr + ptr->len, str);
1080		ptr++;
1081	}
1082}
1083
/*
 * Architecture-specific setup, called from init/main.c just after the
 * banner was printed.
 *
 * @cmdline_p: set to point to boot_command_line.
 *
 * The function is a fixed sequence of initialization steps; several of
 * them depend on the steps before them (see the comments below), so the
 * order of the calls must be preserved.
 */
void __init setup_arch(char **cmdline_p)
{
	/*
	 * Print what head.S has found out about the machine: z/VM guest,
	 * KVM guest, LPAR ("natively"), or some other kind of guest.
	 */
	if (MACHINE_IS_VM)
		pr_info("Linux is running as a z/VM "
			"guest operating system in 64-bit mode\n");
	else if (MACHINE_IS_KVM)
		pr_info("Linux is running under KVM in 64-bit mode\n");
	else if (MACHINE_IS_LPAR)
		pr_info("Linux is running natively in 64-bit mode\n");
	else
		pr_info("Linux is running as a guest in 64-bit mode\n");

	/* Log the Secure-IPL state and the components of the IPL report */
	log_component_list();

	/* Have one command line that is parsed and saved in /proc/cmdline */
	/* boot_command_line has been already set up in early.c */
	*cmdline_p = boot_command_line;

	/* Start out with Root_RAM0 as the root device */
        ROOT_DEV = Root_RAM0;

	/* Describe the kernel image boundaries to init_mm */
	init_mm.start_code = (unsigned long) _text;
	init_mm.end_code = (unsigned long) _etext;
	init_mm.end_data = (unsigned long) _edata;
	init_mm.brk = (unsigned long) _end;

	/* Only done if the kernel was built with CONFIG_EXPOLINE_AUTO */
	if (IS_ENABLED(CONFIG_EXPOLINE_AUTO))
		nospec_auto_detect();

	parse_early_param();
#ifdef CONFIG_CRASH_DUMP
	/*
	 * Deactivate elfcorehdr= kernel parameter. This is placed after
	 * parse_early_param() so that it overrides a value taken from the
	 * command line.
	 */
	elfcorehdr_addr = ELFCORE_ADDR_MAX;
#endif

	os_info_init();
	setup_ipl();
	setup_task_size();
	setup_control_program_code();

	/* Do some memory reservations *before* memory is added to memblock */
	reserve_memory_end();
	reserve_oldmem();
	reserve_kernel();
	reserve_initrd();
	reserve_certificate_list();
	reserve_mem_detect_info();
	memblock_allow_resize();

	/* Get information about *all* installed memory */
	memblock_add_mem_detect_info();

	free_mem_detect_info();
	remove_oldmem();

	/*
	 * Make sure all chunks are MAX_ORDER aligned so we don't need the
	 * extra checks that HOLES_IN_ZONE would require.
	 *
	 * Is this still required?
	 */
	memblock_trim_memory(1UL << (MAX_ORDER - 1 + PAGE_SHIFT));

	setup_memory_end();
	setup_memory();
	/* memory_end is passed as the limit for the contiguous DMA area */
	dma_contiguous_reserve(memory_end);
	vmcp_cma_reserve();

	check_initrd();
	reserve_crashkernel();
#ifdef CONFIG_CRASH_DUMP
	/*
	 * Be aware that smp_save_dump_cpus() triggers a system reset.
	 * Therefore CPU and device initialization should be done afterwards.
	 */
	smp_save_dump_cpus();
#endif

	setup_resources();
	setup_lowcore_dat_off();
	smp_fill_possible_mask();
	cpu_detect_mhz_feature();
        cpu_init();
	numa_setup();
	smp_detect_cpus();
	topology_init_early();

	/*
	 * Create kernel page tables and switch to virtual addressing.
	 */
        paging_init();

	/*
	 * After paging_init created the kernel page table, the new PSWs
	 * in lowcore can now run with DAT enabled.
	 */
	setup_lowcore_dat_on();

	/* Setup default console */
	conmode_default();
	set_preferred_console();

	apply_alternative_instructions();
	/* Only done if the kernel was built with CONFIG_EXPOLINE */
	if (IS_ENABLED(CONFIG_EXPOLINE))
		nospec_init_branches();

	/* Setup zfcpdump support */
	setup_zfcpdump();

	/* Add system specific data to the random pool */
	setup_randomness();
}