memblock: rename memblock_alloc{_nid,_try_nid} to memblock_phys_alloc*
[linux-2.6-block.git] / arch / s390 / kernel / setup.c
CommitLineData
a17ae4c3 1// SPDX-License-Identifier: GPL-2.0
1da177e4 2/*
1da177e4 3 * S390 version
a53c8fab 4 * Copyright IBM Corp. 1999, 2012
1da177e4
LT
5 * Author(s): Hartmut Penner (hp@de.ibm.com),
6 * Martin Schwidefsky (schwidefsky@de.ibm.com)
7 *
8 * Derived from "arch/i386/kernel/setup.c"
9 * Copyright (C) 1995, Linus Torvalds
10 */
11
12/*
13 * This file handles the architecture-dependent parts of initialization
14 */
15
3b6ed4ab
MS
16#define KMSG_COMPONENT "setup"
17#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
18
1da177e4 19#include <linux/errno.h>
0872922f 20#include <linux/export.h>
1da177e4 21#include <linux/sched.h>
29930025 22#include <linux/sched/task.h>
1777e463 23#include <linux/cpu.h>
1da177e4 24#include <linux/kernel.h>
ff38df37 25#include <linux/memblock.h>
1da177e4
LT
26#include <linux/mm.h>
27#include <linux/stddef.h>
28#include <linux/unistd.h>
29#include <linux/ptrace.h>
bcfcbb6b 30#include <linux/random.h>
1da177e4 31#include <linux/user.h>
1da177e4
LT
32#include <linux/tty.h>
33#include <linux/ioport.h>
34#include <linux/delay.h>
1da177e4
LT
35#include <linux/init.h>
36#include <linux/initrd.h>
37#include <linux/bootmem.h>
38#include <linux/root_dev.h>
39#include <linux/console.h>
1da177e4 40#include <linux/kernel_stat.h>
e1231b0e 41#include <linux/dma-contiguous.h>
1e8e3383 42#include <linux/device.h>
585c3047 43#include <linux/notifier.h>
65912a84 44#include <linux/pfn.h>
fe355b7f 45#include <linux/ctype.h>
2b67fc46 46#include <linux/reboot.h>
dbd70fb4 47#include <linux/topology.h>
60a0c68d
MH
48#include <linux/kexec.h>
49#include <linux/crash_dump.h>
50#include <linux/memory.h>
048cd4e5 51#include <linux/compat.h>
ce3dc447 52#include <linux/start_kernel.h>
1da177e4 53
46b05d26 54#include <asm/ipl.h>
1e3cab2f 55#include <asm/facility.h>
1da177e4
LT
56#include <asm/smp.h>
57#include <asm/mmu_context.h>
58#include <asm/cpcmd.h>
59#include <asm/lowcore.h>
6c81511c 60#include <asm/nmi.h>
1da177e4 61#include <asm/irq.h>
0b642ede
PO
62#include <asm/page.h>
63#include <asm/ptrace.h>
cc13ad62 64#include <asm/sections.h>
fe355b7f 65#include <asm/ebcdic.h>
60a0c68d 66#include <asm/diag.h>
4857d4bb 67#include <asm/os_info.h>
cd183459 68#include <asm/sclp.h>
bcfcbb6b 69#include <asm/sysinfo.h>
3a368f74 70#include <asm/numa.h>
686140a1 71#include <asm/alternative.h>
f19fbd5e 72#include <asm/nospec-branch.h>
6966d604 73#include <asm/mem_detect.h>
8b646bd7 74#include "entry.h"
c1821c2e 75
1da177e4
LT
76/*
77 * Machine setup..
78 */
79unsigned int console_mode = 0;
1485c5c8
HC
80EXPORT_SYMBOL(console_mode);
81
1da177e4 82unsigned int console_devno = -1;
1485c5c8
HC
83EXPORT_SYMBOL(console_devno);
84
1da177e4 85unsigned int console_irq = -1;
1485c5c8
HC
86EXPORT_SYMBOL(console_irq);
87
8f00b3e2 88unsigned long elf_hwcap __read_mostly = 0;
cf8ba7a9 89char elf_platform[ELF_PLATFORM_SIZE];
36a2bd42 90
7f16d7e7
DH
91unsigned long int_hwcap = 0;
92
d58106c3 93int __bootdata(noexec_disabled);
49698745
VG
94int __bootdata(memory_end_set);
95unsigned long __bootdata(memory_end);
6966d604
VG
96unsigned long __bootdata(max_physmem_end);
97struct mem_detect_info __bootdata(mem_detect);
1da177e4 98
14045ebf
MS
99unsigned long VMALLOC_START;
100EXPORT_SYMBOL(VMALLOC_START);
101
102unsigned long VMALLOC_END;
103EXPORT_SYMBOL(VMALLOC_END);
104
105struct page *vmemmap;
106EXPORT_SYMBOL(vmemmap);
107
c972cc60
HC
108unsigned long MODULES_VADDR;
109unsigned long MODULES_END;
c972cc60 110
099b7651 111/* An array with a pointer to the lowcore of every CPU. */
c667aeac 112struct lowcore *lowcore_ptr[NR_CPUS];
099b7651
FM
113EXPORT_SYMBOL(lowcore_ptr);
114
1da177e4
LT
115/*
116 * This is set up by the setup-routine at boot-time
117 * for S390 need to find out, what we have to setup
118 * using address 0x10400 ...
119 */
120
121#include <asm/setup.h>
122
1da177e4
LT
123/*
124 * condev= and conmode= setup parameter.
125 */
126
127static int __init condev_setup(char *str)
128{
129 int vdev;
130
131 vdev = simple_strtoul(str, &str, 0);
132 if (vdev >= 0 && vdev < 65536) {
133 console_devno = vdev;
134 console_irq = -1;
135 }
136 return 1;
137}
138
139__setup("condev=", condev_setup);
140
637952ca
HB
141static void __init set_preferred_console(void)
142{
8f50af49 143 if (CONSOLE_IS_3215 || CONSOLE_IS_SCLP)
637952ca 144 add_preferred_console("ttyS", 0, NULL);
c4de0c1a 145 else if (CONSOLE_IS_3270)
637952ca 146 add_preferred_console("tty3270", 0, NULL);
8f50af49
PO
147 else if (CONSOLE_IS_VT220)
148 add_preferred_console("ttyS", 1, NULL);
149 else if (CONSOLE_IS_HVC)
150 add_preferred_console("hvc", 0, NULL);
637952ca
HB
151}
152
1da177e4
LT
153static int __init conmode_setup(char *str)
154{
8c0933ee 155#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
1da177e4
LT
156 if (strncmp(str, "hwc", 4) == 0 || strncmp(str, "sclp", 5) == 0)
157 SET_CONSOLE_SCLP;
158#endif
159#if defined(CONFIG_TN3215_CONSOLE)
160 if (strncmp(str, "3215", 5) == 0)
161 SET_CONSOLE_3215;
162#endif
163#if defined(CONFIG_TN3270_CONSOLE)
164 if (strncmp(str, "3270", 5) == 0)
165 SET_CONSOLE_3270;
166#endif
637952ca 167 set_preferred_console();
1da177e4
LT
168 return 1;
169}
170
171__setup("conmode=", conmode_setup);
172
173static void __init conmode_default(void)
174{
175 char query_buffer[1024];
176 char *ptr;
177
178 if (MACHINE_IS_VM) {
740b5706 179 cpcmd("QUERY CONSOLE", query_buffer, 1024, NULL);
1da177e4
LT
180 console_devno = simple_strtoul(query_buffer + 5, NULL, 16);
181 ptr = strstr(query_buffer, "SUBCHANNEL =");
182 console_irq = simple_strtoul(ptr + 13, NULL, 16);
740b5706 183 cpcmd("QUERY TERM", query_buffer, 1024, NULL);
1da177e4
LT
184 ptr = strstr(query_buffer, "CONMODE");
185 /*
186 * Set the conmode to 3215 so that the device recognition
187 * will set the cu_type of the console to 3215. If the
188 * conmode is 3270 and we don't set it back then both
189 * 3215 and the 3270 driver will try to access the console
190 * device (3215 as console and 3270 as normal tty).
191 */
740b5706 192 cpcmd("TERM CONMODE 3215", NULL, 0, NULL);
1da177e4 193 if (ptr == NULL) {
8c0933ee 194#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
1da177e4
LT
195 SET_CONSOLE_SCLP;
196#endif
197 return;
198 }
199 if (strncmp(ptr + 8, "3270", 4) == 0) {
200#if defined(CONFIG_TN3270_CONSOLE)
201 SET_CONSOLE_3270;
202#elif defined(CONFIG_TN3215_CONSOLE)
203 SET_CONSOLE_3215;
8c0933ee 204#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
1da177e4
LT
205 SET_CONSOLE_SCLP;
206#endif
207 } else if (strncmp(ptr + 8, "3215", 4) == 0) {
208#if defined(CONFIG_TN3215_CONSOLE)
209 SET_CONSOLE_3215;
210#elif defined(CONFIG_TN3270_CONSOLE)
211 SET_CONSOLE_3270;
8c0933ee 212#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
1da177e4
LT
213 SET_CONSOLE_SCLP;
214#endif
215 }
8f50af49 216 } else if (MACHINE_IS_KVM) {
a5ff1b34 217 if (sclp.has_vt220 && IS_ENABLED(CONFIG_SCLP_VT220_CONSOLE))
8f50af49 218 SET_CONSOLE_VT220;
a5ff1b34 219 else if (sclp.has_linemode && IS_ENABLED(CONFIG_SCLP_CONSOLE))
8f50af49
PO
220 SET_CONSOLE_SCLP;
221 else
222 SET_CONSOLE_HVC;
1da177e4 223 } else {
8c0933ee 224#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
1da177e4
LT
225 SET_CONSOLE_SCLP;
226#endif
227 }
579f1a28
FA
228 if (IS_ENABLED(CONFIG_VT) && IS_ENABLED(CONFIG_DUMMY_CONSOLE))
229 conswitchp = &dummy_con;
1da177e4
LT
230}
231
bf28a597 232#ifdef CONFIG_CRASH_DUMP
fe72ffba 233static void __init setup_zfcpdump(void)
411ed322 234{
411ed322
MH
235 if (ipl_info.type != IPL_TYPE_FCP_DUMP)
236 return;
3f25dc4f
MH
237 if (OLDMEM_BASE)
238 return;
fe72ffba 239 strcat(boot_command_line, " cio_ignore=all,!ipldev,!condev");
411ed322
MH
240 console_loglevel = 2;
241}
242#else
fe72ffba 243static inline void setup_zfcpdump(void) {}
bf28a597 244#endif /* CONFIG_CRASH_DUMP */
411ed322 245
1da177e4
LT
246 /*
247 * Reboot, halt and power_off stubs. They just call _machine_restart,
248 * _machine_halt or _machine_power_off.
249 */
250
251void machine_restart(char *command)
252{
7aa8dac7 253 if ((!in_interrupt() && !in_atomic()) || oops_in_progress)
06fa46a2
MS
254 /*
255 * Only unblank the console if we are called in enabled
256 * context or a bust_spinlocks cleared the way for us.
257 */
258 console_unblank();
1da177e4
LT
259 _machine_restart(command);
260}
261
1da177e4
LT
262void machine_halt(void)
263{
06fa46a2
MS
264 if (!in_interrupt() || oops_in_progress)
265 /*
266 * Only unblank the console if we are called in enabled
267 * context or a bust_spinlocks cleared the way for us.
268 */
269 console_unblank();
1da177e4
LT
270 _machine_halt();
271}
272
1da177e4
LT
273void machine_power_off(void)
274{
06fa46a2
MS
275 if (!in_interrupt() || oops_in_progress)
276 /*
277 * Only unblank the console if we are called in enabled
278 * context or a bust_spinlocks cleared the way for us.
279 */
280 console_unblank();
1da177e4
LT
281 _machine_power_off();
282}
283
53df751c
MS
284/*
285 * Dummy power off function.
286 */
287void (*pm_power_off)(void) = machine_power_off;
0872922f 288EXPORT_SYMBOL_GPL(pm_power_off);
53df751c 289
14045ebf
MS
290static int __init parse_vmalloc(char *arg)
291{
292 if (!arg)
293 return -EINVAL;
294 VMALLOC_END = (memparse(arg, &arg) + PAGE_SIZE - 1) & PAGE_MASK;
295 return 0;
296}
297early_param("vmalloc", parse_vmalloc);
298
72a9b02d 299void *restart_stack __section(.data);
8b646bd7 300
ce3dc447
MS
301unsigned long stack_alloc(void)
302{
303#ifdef CONFIG_VMAP_STACK
304 return (unsigned long)
32ce55a6 305 __vmalloc_node_range(THREAD_SIZE, THREAD_SIZE,
ce3dc447
MS
306 VMALLOC_START, VMALLOC_END,
307 THREADINFO_GFP,
308 PAGE_KERNEL, 0, NUMA_NO_NODE,
309 __builtin_return_address(0));
310#else
32ce55a6 311 return __get_free_pages(GFP_KERNEL, THREAD_SIZE_ORDER);
ce3dc447
MS
312#endif
313}
314
315void stack_free(unsigned long stack)
316{
317#ifdef CONFIG_VMAP_STACK
318 vfree((void *) stack);
319#else
32ce55a6 320 free_pages(stack, THREAD_SIZE_ORDER);
ce3dc447
MS
321#endif
322}
323
324int __init arch_early_irq_init(void)
325{
326 unsigned long stack;
327
32ce55a6 328 stack = __get_free_pages(GFP_KERNEL, THREAD_SIZE_ORDER);
ce3dc447
MS
329 if (!stack)
330 panic("Couldn't allocate async stack");
331 S390_lowcore.async_stack = stack + STACK_INIT_OFFSET;
332 return 0;
333}
334
335static int __init async_stack_realloc(void)
336{
337 unsigned long old, new;
338
339 old = S390_lowcore.async_stack - STACK_INIT_OFFSET;
340 new = stack_alloc();
341 if (!new)
342 panic("Couldn't allocate async stack");
343 S390_lowcore.async_stack = new + STACK_INIT_OFFSET;
32ce55a6 344 free_pages(old, THREAD_SIZE_ORDER);
ce3dc447
MS
345 return 0;
346}
347early_initcall(async_stack_realloc);
348
349void __init arch_call_rest_init(void)
350{
351 struct stack_frame *frame;
352 unsigned long stack;
353
354 stack = stack_alloc();
355 if (!stack)
356 panic("Couldn't allocate kernel stack");
357 current->stack = (void *) stack;
358#ifdef CONFIG_VMAP_STACK
359 current->stack_vm_area = (void *) stack;
360#endif
361 set_task_stack_end_magic(current);
362 stack += STACK_INIT_OFFSET;
363 S390_lowcore.kernel_stack = stack;
364 frame = (struct stack_frame *) stack;
365 memset(frame, 0, sizeof(*frame));
366 /* Branch to rest_init on the new stack, never returns */
367 asm volatile(
368 " la 15,0(%[_frame])\n"
369 " jg rest_init\n"
370 : : [_frame] "a" (frame));
371}
372
8b646bd7 373static void __init setup_lowcore(void)
c9e37353 374{
c667aeac 375 struct lowcore *lc;
c9e37353
HC
376
377 /*
378 * Setup lowcore for boot cpu
379 */
f1c1174f 380 BUILD_BUG_ON(sizeof(struct lowcore) != LC_PAGES * PAGE_SIZE);
db7ad636 381 lc = memblock_virt_alloc_low(sizeof(*lc), sizeof(*lc));
e258d719 382 lc->restart_psw.mask = PSW_KERNEL_BITS;
fecc868a 383 lc->restart_psw.addr = (unsigned long) restart_int_handler;
e258d719 384 lc->external_new_psw.mask = PSW_KERNEL_BITS |
b50511e4 385 PSW_MASK_DAT | PSW_MASK_MCHECK;
fecc868a 386 lc->external_new_psw.addr = (unsigned long) ext_int_handler;
e258d719 387 lc->svc_new_psw.mask = PSW_KERNEL_BITS |
b50511e4 388 PSW_MASK_DAT | PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK;
fecc868a 389 lc->svc_new_psw.addr = (unsigned long) system_call;
e258d719 390 lc->program_new_psw.mask = PSW_KERNEL_BITS |
b50511e4 391 PSW_MASK_DAT | PSW_MASK_MCHECK;
fecc868a 392 lc->program_new_psw.addr = (unsigned long) pgm_check_handler;
e258d719 393 lc->mcck_new_psw.mask = PSW_KERNEL_BITS;
fecc868a 394 lc->mcck_new_psw.addr = (unsigned long) mcck_int_handler;
e258d719 395 lc->io_new_psw.mask = PSW_KERNEL_BITS |
b50511e4 396 PSW_MASK_DAT | PSW_MASK_MCHECK;
fecc868a 397 lc->io_new_psw.addr = (unsigned long) io_int_handler;
6e2ef5e4 398 lc->clock_comparator = clock_comparator_max;
ce3dc447 399 lc->nodat_stack = ((unsigned long) &init_thread_union)
dc7ee00d 400 + THREAD_SIZE - STACK_FRAME_OVERHEAD - sizeof(struct pt_regs);
d5c352cd 401 lc->current_task = (unsigned long)&init_task;
8f100bb1 402 lc->lpp = LPP_MAGIC;
25097bf1 403 lc->machine_flags = S390_lowcore.machine_flags;
c360192b 404 lc->preempt_count = S390_lowcore.preempt_count;
14375bc4
MS
405 lc->stfl_fac_list = S390_lowcore.stfl_fac_list;
406 memcpy(lc->stfle_fac_list, S390_lowcore.stfle_fac_list,
cf148998
MS
407 sizeof(lc->stfle_fac_list));
408 memcpy(lc->alt_stfle_fac_list, S390_lowcore.alt_stfle_fac_list,
409 sizeof(lc->alt_stfle_fac_list));
6c81511c 410 nmi_alloc_boot_cpu(lc);
608796ff 411 vdso_alloc_boot_cpu(lc);
ab96e798
MS
412 lc->sync_enter_timer = S390_lowcore.sync_enter_timer;
413 lc->async_enter_timer = S390_lowcore.async_enter_timer;
414 lc->exit_timer = S390_lowcore.exit_timer;
415 lc->user_timer = S390_lowcore.user_timer;
416 lc->system_timer = S390_lowcore.system_timer;
417 lc->steal_timer = S390_lowcore.steal_timer;
418 lc->last_update_timer = S390_lowcore.last_update_timer;
419 lc->last_update_clock = S390_lowcore.last_update_clock;
8b646bd7 420
ce3dc447
MS
421 /*
422 * Allocate the global restart stack which is the same for
423 * all CPUs in cast *one* of them does a PSW restart.
424 */
32ce55a6 425 restart_stack = memblock_virt_alloc(THREAD_SIZE, THREAD_SIZE);
ce3dc447 426 restart_stack += STACK_INIT_OFFSET;
8b646bd7
MS
427
428 /*
429 * Set up PSW restart to call ipl.c:do_restart(). Copy the relevant
b4a96015 430 * restart data to the absolute zero lowcore. This is necessary if
8b646bd7
MS
431 * PSW restart is done on an offline CPU that has lowcore zero.
432 */
433 lc->restart_stack = (unsigned long) restart_stack;
434 lc->restart_fn = (unsigned long) do_restart;
435 lc->restart_data = 0;
436 lc->restart_source = -1UL;
73bf463e
MH
437
438 /* Setup absolute zero lowcore */
fbe76568
HC
439 mem_assign_absolute(S390_lowcore.restart_stack, lc->restart_stack);
440 mem_assign_absolute(S390_lowcore.restart_fn, lc->restart_fn);
441 mem_assign_absolute(S390_lowcore.restart_data, lc->restart_data);
442 mem_assign_absolute(S390_lowcore.restart_source, lc->restart_source);
443 mem_assign_absolute(S390_lowcore.restart_psw, lc->restart_psw);
8b646bd7 444
6c8cd5bb
PH
445#ifdef CONFIG_SMP
446 lc->spinlock_lockval = arch_spin_lockval(0);
b96f7d88
MS
447 lc->spinlock_index = 0;
448 arch_spin_lock_setup(0);
6c8cd5bb 449#endif
f19fbd5e 450 lc->br_r1_trampoline = 0x07f1; /* br %r1 */
6c8cd5bb 451
c9e37353 452 set_prefix((u32)(unsigned long) lc);
099b7651 453 lowcore_ptr[0] = lc;
c9e37353
HC
454}
455
71189284
HC
456static struct resource code_resource = {
457 .name = "Kernel code",
35d98e93 458 .flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
71189284
HC
459};
460
461static struct resource data_resource = {
462 .name = "Kernel data",
35d98e93 463 .flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
71189284
HC
464};
465
4cc69531
HC
466static struct resource bss_resource = {
467 .name = "Kernel bss",
35d98e93 468 .flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM,
4cc69531
HC
469};
470
71189284
HC
471static struct resource __initdata *standard_resources[] = {
472 &code_resource,
473 &data_resource,
4cc69531 474 &bss_resource,
71189284
HC
475};
476
477static void __init setup_resources(void)
c9e37353 478{
71189284 479 struct resource *res, *std_res, *sub_res;
50be6345
PH
480 struct memblock_region *reg;
481 int j;
c9e37353 482
320d9555
VG
483 code_resource.start = (unsigned long) _text;
484 code_resource.end = (unsigned long) _etext - 1;
485 data_resource.start = (unsigned long) _etext;
486 data_resource.end = (unsigned long) _edata - 1;
487 bss_resource.start = (unsigned long) __bss_start;
488 bss_resource.end = (unsigned long) __bss_stop - 1;
cc13ad62 489
50be6345 490 for_each_memblock(memory, reg) {
db7ad636 491 res = memblock_virt_alloc(sizeof(*res), 8);
35d98e93 492 res->flags = IORESOURCE_BUSY | IORESOURCE_SYSTEM_RAM;
50be6345
PH
493
494 res->name = "System RAM";
495 res->start = reg->base;
496 res->end = reg->base + reg->size - 1;
c9e37353 497 request_resource(&iomem_resource, res);
fe355b7f 498
71189284
HC
499 for (j = 0; j < ARRAY_SIZE(standard_resources); j++) {
500 std_res = standard_resources[j];
501 if (std_res->start < res->start ||
502 std_res->start > res->end)
503 continue;
504 if (std_res->end > res->end) {
db7ad636 505 sub_res = memblock_virt_alloc(sizeof(*sub_res), 8);
71189284
HC
506 *sub_res = *std_res;
507 sub_res->end = res->end;
508 std_res->start = res->end + 1;
509 request_resource(res, sub_res);
510 } else {
511 request_resource(res, std_res);
512 }
fe355b7f 513 }
c9e37353 514 }
4e042af4
HC
515#ifdef CONFIG_CRASH_DUMP
516 /*
517 * Re-add removed crash kernel memory as reserved memory. This makes
518 * sure it will be mapped with the identity mapping and struct pages
519 * will be created, so it can be resized later on.
520 * However add it later since the crash kernel resource should not be
521 * part of the System RAM resource.
522 */
523 if (crashk_res.end) {
9f88eb4d 524 memblock_add_node(crashk_res.start, resource_size(&crashk_res), 0);
4e042af4
HC
525 memblock_reserve(crashk_res.start, resource_size(&crashk_res));
526 insert_resource(&iomem_resource, &crashk_res);
527 }
528#endif
c9e37353
HC
529}
530
8b62bc96
HC
531static void __init setup_memory_end(void)
532{
14045ebf 533 unsigned long vmax, vmalloc_size, tmp;
9f4b0ba8 534
42db5ed8 535 /* Choose kernel address space layout: 3 or 4 levels. */
c972cc60 536 vmalloc_size = VMALLOC_END ?: (128UL << 30) - MODULES_LEN;
42db5ed8 537 if (IS_ENABLED(CONFIG_KASAN)) {
5dff0381
VG
538 vmax = IS_ENABLED(CONFIG_KASAN_S390_4_LEVEL_PAGING)
539 ? _REGION1_SIZE
540 : _REGION2_SIZE;
42db5ed8
VG
541 } else {
542 tmp = (memory_end ?: max_physmem_end) / PAGE_SIZE;
543 tmp = tmp * (sizeof(struct page) + PAGE_SIZE);
544 if (tmp + vmalloc_size + MODULES_LEN <= _REGION2_SIZE)
545 vmax = _REGION2_SIZE; /* 3-level kernel page table */
546 else
547 vmax = _REGION1_SIZE; /* 4-level kernel page table */
548 }
549
c972cc60
HC
550 /* module area is at the end of the kernel address space. */
551 MODULES_END = vmax;
552 MODULES_VADDR = MODULES_END - MODULES_LEN;
553 VMALLOC_END = MODULES_VADDR;
5eaf436e 554 VMALLOC_START = VMALLOC_END - vmalloc_size;
14045ebf
MS
555
556 /* Split remaining virtual space between 1:1 mapping & vmemmap array */
557 tmp = VMALLOC_START / (PAGE_SIZE + sizeof(struct page));
a7bb1ae7
HC
558 /* vmemmap contains a multiple of PAGES_PER_SECTION struct pages */
559 tmp = SECTION_ALIGN_UP(tmp);
14045ebf
MS
560 tmp = VMALLOC_START - tmp * sizeof(struct page);
561 tmp &= ~((vmax >> 11) - 1); /* align to page table level */
562 tmp = min(tmp, 1UL << MAX_PHYSMEM_BITS);
563 vmemmap = (struct page *) tmp;
564
565 /* Take care that memory_end is set and <= vmemmap */
5eaf436e 566 memory_end = min(memory_end ?: max_physmem_end, (unsigned long)vmemmap);
42db5ed8
VG
567#ifdef CONFIG_KASAN
568 /* fit in kasan shadow memory region between 1:1 and vmemmap */
569 memory_end = min(memory_end, KASAN_SHADOW_START);
570 vmemmap = max(vmemmap, (struct page *)KASAN_SHADOW_END);
571#endif
50be6345
PH
572 max_pfn = max_low_pfn = PFN_DOWN(memory_end);
573 memblock_remove(memory_end, ULONG_MAX);
8b62bc96 574
6d7b2ee9 575 pr_notice("The maximum memory size is %luMB\n", memory_end >> 20);
8b62bc96
HC
576}
577
60a0c68d
MH
578#ifdef CONFIG_CRASH_DUMP
579
60a0c68d
MH
580/*
581 * When kdump is enabled, we have to ensure that no memory from
582 * the area [0 - crashkernel memory size] and
583 * [crashk_res.start - crashk_res.end] is set offline.
584 */
585static int kdump_mem_notifier(struct notifier_block *nb,
586 unsigned long action, void *data)
587{
588 struct memory_notify *arg = data;
589
bd858e84
MH
590 if (action != MEM_GOING_OFFLINE)
591 return NOTIFY_OK;
60a0c68d
MH
592 if (arg->start_pfn < PFN_DOWN(resource_size(&crashk_res)))
593 return NOTIFY_BAD;
594 if (arg->start_pfn > PFN_DOWN(crashk_res.end))
595 return NOTIFY_OK;
596 if (arg->start_pfn + arg->nr_pages - 1 < PFN_DOWN(crashk_res.start))
597 return NOTIFY_OK;
598 return NOTIFY_BAD;
599}
600
601static struct notifier_block kdump_mem_nb = {
602 .notifier_call = kdump_mem_notifier,
603};
604
605#endif
606
50be6345
PH
607/*
608 * Make sure that the area behind memory_end is protected
609 */
610static void reserve_memory_end(void)
611{
49698745
VG
612 if (memory_end_set)
613 memblock_reserve(memory_end, ULONG_MAX);
50be6345
PH
614}
615
60a0c68d
MH
616/*
617 * Make sure that oldmem, where the dump is stored, is protected
618 */
619static void reserve_oldmem(void)
620{
621#ifdef CONFIG_CRASH_DUMP
50be6345
PH
622 if (OLDMEM_BASE)
623 /* Forget all memory above the running kdump system */
624 memblock_reserve(OLDMEM_SIZE, (phys_addr_t)ULONG_MAX);
625#endif
626}
60a0c68d 627
50be6345
PH
628/*
629 * Make sure that oldmem, where the dump is stored, is protected
630 */
631static void remove_oldmem(void)
632{
633#ifdef CONFIG_CRASH_DUMP
634 if (OLDMEM_BASE)
635 /* Forget all memory above the running kdump system */
636 memblock_remove(OLDMEM_SIZE, (phys_addr_t)ULONG_MAX);
60a0c68d
MH
637#endif
638}
639
640/*
641 * Reserve memory for kdump kernel to be loaded with kexec
642 */
643static void __init reserve_crashkernel(void)
644{
645#ifdef CONFIG_CRASH_DUMP
646 unsigned long long crash_base, crash_size;
50be6345 647 phys_addr_t low, high;
60a0c68d
MH
648 int rc;
649
650 rc = parse_crashkernel(boot_command_line, memory_end, &crash_size,
651 &crash_base);
50be6345 652
dab7a7b1
MH
653 crash_base = ALIGN(crash_base, KEXEC_CRASH_MEM_ALIGN);
654 crash_size = ALIGN(crash_size, KEXEC_CRASH_MEM_ALIGN);
50be6345 655 if (rc || crash_size == 0)
60a0c68d 656 return;
50be6345
PH
657
658 if (memblock.memory.regions[0].size < crash_size) {
659 pr_info("crashkernel reservation failed: %s\n",
660 "first memory chunk must be at least crashkernel size");
60a0c68d
MH
661 return;
662 }
50be6345
PH
663
664 low = crash_base ?: OLDMEM_BASE;
665 high = low + crash_size;
666 if (low >= OLDMEM_BASE && high <= OLDMEM_BASE + OLDMEM_SIZE) {
667 /* The crashkernel fits into OLDMEM, reuse OLDMEM */
668 crash_base = low;
669 } else {
670 /* Find suitable area in free memory */
37c5f6c8 671 low = max_t(unsigned long, crash_size, sclp.hsa_size);
50be6345
PH
672 high = crash_base ? crash_base + crash_size : ULONG_MAX;
673
674 if (crash_base && crash_base < low) {
675 pr_info("crashkernel reservation failed: %s\n",
676 "crash_base too low");
677 return;
678 }
679 low = crash_base ?: low;
680 crash_base = memblock_find_in_range(low, high, crash_size,
681 KEXEC_CRASH_MEM_ALIGN);
682 }
683
684 if (!crash_base) {
685 pr_info("crashkernel reservation failed: %s\n",
686 "no suitable area found");
60a0c68d
MH
687 return;
688 }
50be6345
PH
689
690 if (register_memory_notifier(&kdump_mem_nb))
691 return;
692
60a0c68d
MH
693 if (!OLDMEM_BASE && MACHINE_IS_VM)
694 diag10_range(PFN_DOWN(crash_base), PFN_DOWN(crash_size));
695 crashk_res.start = crash_base;
696 crashk_res.end = crash_base + crash_size - 1;
50be6345 697 memblock_remove(crash_base, crash_size);
60a0c68d
MH
698 pr_info("Reserving %lluMB of memory at %lluMB "
699 "for crashkernel (System RAM: %luMB)\n",
50be6345
PH
700 crash_size >> 20, crash_base >> 20,
701 (unsigned long)memblock.memory.total_size >> 20);
4857d4bb 702 os_info_crashkernel_add(crash_base, crash_size);
60a0c68d
MH
703#endif
704}
705
50be6345
PH
706/*
707 * Reserve the initrd from being used by memblock
708 */
709static void __init reserve_initrd(void)
c9e37353 710{
50be6345 711#ifdef CONFIG_BLK_DEV_INITRD
7be5e359
HC
712 if (!INITRD_START || !INITRD_SIZE)
713 return;
50be6345
PH
714 initrd_start = INITRD_START;
715 initrd_end = initrd_start + INITRD_SIZE;
716 memblock_reserve(INITRD_START, INITRD_SIZE);
717#endif
718}
1da177e4 719
6966d604
VG
720static void __init reserve_mem_detect_info(void)
721{
722 unsigned long start, size;
723
724 get_mem_detect_reserved(&start, &size);
725 if (size)
726 memblock_reserve(start, size);
727}
728
729static void __init free_mem_detect_info(void)
730{
731 unsigned long start, size;
732
733 get_mem_detect_reserved(&start, &size);
734 if (size)
735 memblock_free(start, size);
736}
737
738static void __init memblock_physmem_add(phys_addr_t start, phys_addr_t size)
739{
740 memblock_dbg("memblock_physmem_add: [%#016llx-%#016llx]\n",
741 start, start + size - 1);
742 memblock_add_range(&memblock.memory, start, size, 0, 0);
743 memblock_add_range(&memblock.physmem, start, size, 0, 0);
744}
745
f01b8bca
VG
746static const char * __init get_mem_info_source(void)
747{
748 switch (mem_detect.info_source) {
749 case MEM_DETECT_SCLP_STOR_INFO:
750 return "sclp storage info";
751 case MEM_DETECT_DIAG260:
752 return "diag260";
753 case MEM_DETECT_SCLP_READ_INFO:
754 return "sclp read info";
755 case MEM_DETECT_BIN_SEARCH:
756 return "binary search";
757 }
758 return "none";
759}
760
6966d604
VG
761static void __init memblock_add_mem_detect_info(void)
762{
763 unsigned long start, end;
764 int i;
765
f01b8bca
VG
766 memblock_dbg("physmem info source: %s (%hhd)\n",
767 get_mem_info_source(), mem_detect.info_source);
6966d604
VG
768 /* keep memblock lists close to the kernel */
769 memblock_set_bottom_up(true);
770 for_each_mem_detect_block(i, &start, &end)
771 memblock_physmem_add(start, end - start);
772 memblock_set_bottom_up(false);
773 memblock_dump_all();
774}
775
50be6345
PH
776/*
777 * Check for initrd being in usable memory
778 */
779static void __init check_initrd(void)
780{
781#ifdef CONFIG_BLK_DEV_INITRD
782 if (INITRD_START && INITRD_SIZE &&
783 !memblock_is_region_memory(INITRD_START, INITRD_SIZE)) {
6d7b2ee9 784 pr_err("The initial RAM disk does not fit into the memory\n");
50be6345
PH
785 memblock_free(INITRD_START, INITRD_SIZE);
786 initrd_start = initrd_end = 0;
787 }
788#endif
789}
790
791/*
0c36b8ac 792 * Reserve memory used for lowcore/command line/kernel image.
50be6345
PH
793 */
794static void __init reserve_kernel(void)
795{
320d9555 796 unsigned long start_pfn = PFN_UP(__pa(_end));
1da177e4 797
0c36b8ac 798#ifdef CONFIG_DMA_API_DEBUG
65912a84 799 /*
0c36b8ac 800 * DMA_API_DEBUG code stumbles over addresses from the
514211f5 801 * range [PARMAREA_END, _stext]. Mark the memory as reserved
0c36b8ac 802 * so it is not used for CONFIG_DMA_API_DEBUG=y.
65912a84 803 */
0c36b8ac
SO
804 memblock_reserve(0, PFN_PHYS(start_pfn));
805#else
514211f5 806 memblock_reserve(0, PARMAREA_END);
50be6345
PH
807 memblock_reserve((unsigned long)_stext, PFN_PHYS(start_pfn)
808 - (unsigned long)_stext);
0c36b8ac 809#endif
50be6345 810}
65912a84 811
50be6345
PH
812static void __init setup_memory(void)
813{
814 struct memblock_region *reg;
1da177e4
LT
815
816 /*
50be6345 817 * Init storage key for present memory
1da177e4 818 */
50be6345
PH
819 for_each_memblock(memory, reg) {
820 storage_key_init_range(reg->base, reg->base + reg->size);
1da177e4 821 }
0b642ede
PO
822 psw_set_key(PAGE_DEFAULT_KEY);
823
50be6345
PH
824 /* Only cosmetics */
825 memblock_enforce_memory_limit(memblock_end_of_DRAM());
c9e37353 826}
1da177e4 827
cf8ba7a9
MS
828/*
829 * Setup hardware capabilities.
830 */
89b1145e 831static int __init setup_hwcaps(void)
cf8ba7a9
MS
832{
833 static const int stfl_bits[6] = { 0, 2, 7, 17, 19, 21 };
94038a99 834 struct cpuid cpu_id;
cf8ba7a9
MS
835 int i;
836
cf8ba7a9
MS
837 /*
838 * The store facility list bits numbers as found in the principles
839 * of operation are numbered with bit 1UL<<31 as number 0 to
840 * bit 1UL<<0 as number 31.
841 * Bit 0: instructions named N3, "backported" to esa-mode
842 * Bit 2: z/Architecture mode is active
843 * Bit 7: the store-facility-list-extended facility is installed
844 * Bit 17: the message-security assist is installed
845 * Bit 19: the long-displacement facility is installed
846 * Bit 21: the extended-immediate facility is installed
488253ce
AK
847 * Bit 22: extended-translation facility 3 is installed
848 * Bit 30: extended-translation facility 3 enhancement facility
cf8ba7a9
MS
849 * These get translated to:
850 * HWCAP_S390_ESAN3 bit 0, HWCAP_S390_ZARCH bit 1,
851 * HWCAP_S390_STFLE bit 2, HWCAP_S390_MSA bit 3,
488253ce
AK
852 * HWCAP_S390_LDISP bit 4, HWCAP_S390_EIMM bit 5 and
853 * HWCAP_S390_ETF3EH bit 8 (22 && 30).
cf8ba7a9
MS
854 */
855 for (i = 0; i < 6; i++)
14375bc4 856 if (test_facility(stfl_bits[i]))
cf8ba7a9
MS
857 elf_hwcap |= 1UL << i;
858
14375bc4 859 if (test_facility(22) && test_facility(30))
ea2a4d3a 860 elf_hwcap |= HWCAP_S390_ETF3EH;
488253ce 861
cf8ba7a9
MS
862 /*
863 * Check for additional facilities with store-facility-list-extended.
864 * stfle stores doublewords (8 byte) with bit 1ULL<<63 as bit 0
865 * and 1ULL<<0 as bit 63. Bits 0-31 contain the same information
866 * as stored by stfl, bits 32-xxx contain additional facilities.
867 * How many facility words are stored depends on the number of
25985edc 868 * doublewords passed to the instruction. The additional facilities
cf8ba7a9 869 * are:
2ac3307f
CE
870 * Bit 42: decimal floating point facility is installed
871 * Bit 44: perform floating point operation facility is installed
cf8ba7a9 872 * translated to:
488253ce 873 * HWCAP_S390_DFP bit 6 (42 && 44).
cf8ba7a9 874 */
14375bc4
MS
875 if ((elf_hwcap & (1UL << 2)) && test_facility(42) && test_facility(44))
876 elf_hwcap |= HWCAP_S390_DFP;
cf8ba7a9 877
ea2a4d3a
HC
878 /*
879 * Huge page support HWCAP_S390_HPAGE is bit 7.
880 */
466178fc 881 if (MACHINE_HAS_EDAT1)
ea2a4d3a
HC
882 elf_hwcap |= HWCAP_S390_HPAGE;
883
884 /*
885 * 64-bit register support for 31-bit processes
886 * HWCAP_S390_HIGH_GPRS is bit 9.
887 */
888 elf_hwcap |= HWCAP_S390_HIGH_GPRS;
d35339a4
MS
889
890 /*
891 * Transactional execution support HWCAP_S390_TE is bit 10.
892 */
baaf9be8 893 if (MACHINE_HAS_TE)
d35339a4 894 elf_hwcap |= HWCAP_S390_TE;
80703617
MS
895
896 /*
89b1145e
MS
897 * Vector extension HWCAP_S390_VXRS is bit 11. The Vector extension
898 * can be disabled with the "novx" parameter. Use MACHINE_HAS_VX
899 * instead of facility bit 129.
80703617 900 */
2583b848 901 if (MACHINE_HAS_VX) {
80703617 902 elf_hwcap |= HWCAP_S390_VXRS;
2583b848
MS
903 if (test_facility(134))
904 elf_hwcap |= HWCAP_S390_VXRS_EXT;
905 if (test_facility(135))
906 elf_hwcap |= HWCAP_S390_VXRS_BCD;
907 }
908
916cda1a
MS
909 /*
910 * Guarded storage support HWCAP_S390_GS is bit 12.
911 */
912 if (MACHINE_HAS_GS)
913 elf_hwcap |= HWCAP_S390_GS;
914
94038a99 915 get_cpu_id(&cpu_id);
bcfcbb6b 916 add_device_randomness(&cpu_id, sizeof(cpu_id));
94038a99 917 switch (cpu_id.machine) {
cf8ba7a9
MS
918 case 0x2064:
919 case 0x2066:
cf8ba7a9 920 default: /* Use "z900" as default for 64 bit kernels. */
cf8ba7a9
MS
921 strcpy(elf_platform, "z900");
922 break;
923 case 0x2084:
924 case 0x2086:
925 strcpy(elf_platform, "z990");
926 break;
927 case 0x2094:
9fee8db2 928 case 0x2096:
cf8ba7a9
MS
929 strcpy(elf_platform, "z9-109");
930 break;
9fee8db2
MS
931 case 0x2097:
932 case 0x2098:
933 strcpy(elf_platform, "z10");
934 break;
c84b9051 935 case 0x2817:
3a81b171 936 case 0x2818:
c84b9051
HC
937 strcpy(elf_platform, "z196");
938 break;
991c1505 939 case 0x2827:
59471227 940 case 0x2828:
991c1505
HC
941 strcpy(elf_platform, "zEC12");
942 break;
f8b2dcbd 943 case 0x2964:
bb3aa614 944 case 0x2965:
f8b2dcbd
MS
945 strcpy(elf_platform, "z13");
946 break;
6997c323 947 case 0x3906:
451239eb 948 case 0x3907:
6997c323
MS
949 strcpy(elf_platform, "z14");
950 break;
cf8ba7a9 951 }
7f16d7e7
DH
952
953 /*
954 * Virtualization support HWCAP_INT_SIE is bit 0.
955 */
956 if (sclp.has_sief2)
957 int_hwcap |= HWCAP_INT_SIE;
958
89b1145e 959 return 0;
cf8ba7a9 960}
89b1145e 961arch_initcall(setup_hwcaps);
cf8ba7a9 962
bcfcbb6b
MS
963/*
964 * Add system information as device randomness
965 */
966static void __init setup_randomness(void)
967{
968 struct sysinfo_3_2_2 *vmms;
969
9a8dd708
MR
970 vmms = (struct sysinfo_3_2_2 *) memblock_phys_alloc(PAGE_SIZE,
971 PAGE_SIZE);
da8fd820 972 if (stsi(vmms, 3, 2, 2) == 0 && vmms->count)
4920e3cf 973 add_device_randomness(&vmms->vm, sizeof(vmms->vm[0]) * vmms->count);
da8fd820 974 memblock_free((unsigned long) vmms, PAGE_SIZE);
bcfcbb6b
MS
975}
976
3f6813b9
MS
977/*
978 * Find the correct size for the task_struct. This depends on
979 * the size of the struct fpu at the end of the thread_struct
980 * which is embedded in the task_struct.
981 */
982static void __init setup_task_size(void)
983{
984 int task_size = sizeof(struct task_struct);
985
986 if (!MACHINE_HAS_VX) {
987 task_size -= sizeof(__vector128) * __NUM_VXRS;
988 task_size += sizeof(freg_t) * __NUM_FPRS;
989 }
990 arch_task_struct_size = task_size;
991}
992
c9e37353
HC
993/*
994 * Setup function called from init/main.c just after the banner
995 * was printed.
996 */
1da177e4 997
8b646bd7 998void __init setup_arch(char **cmdline_p)
c9e37353 999{
1da177e4 1000 /*
c9e37353 1001 * print what head.S has found out about the machine
1da177e4 1002 */
fa587743 1003 if (MACHINE_IS_VM)
3b6ed4ab
MS
1004 pr_info("Linux is running as a z/VM "
1005 "guest operating system in 64-bit mode\n");
637952ca 1006 else if (MACHINE_IS_KVM)
3b6ed4ab 1007 pr_info("Linux is running under KVM in 64-bit mode\n");
27d71602 1008 else if (MACHINE_IS_LPAR)
3b6ed4ab 1009 pr_info("Linux is running natively in 64-bit mode\n");
c9e37353 1010
a0443fbb
HB
1011 /* Have one command line that is parsed and saved in /proc/cmdline */
1012 /* boot_command_line has been already set up in early.c */
1013 *cmdline_p = boot_command_line;
59685296 1014
c9e37353 1015 ROOT_DEV = Root_RAM0;
59685296 1016
50be6345 1017 /* Is init_mm really needed? */
59685296 1018 init_mm.start_code = PAGE_OFFSET;
320d9555
VG
1019 init_mm.end_code = (unsigned long) _etext;
1020 init_mm.end_data = (unsigned long) _edata;
1021 init_mm.brk = (unsigned long) _end;
59685296 1022
6a3d1e81
MS
1023 if (IS_ENABLED(CONFIG_EXPOLINE_AUTO))
1024 nospec_auto_detect();
1025
59685296 1026 parse_early_param();
8a07dd02
MS
1027#ifdef CONFIG_CRASH_DUMP
1028 /* Deactivate elfcorehdr= kernel parameter */
1029 elfcorehdr_addr = ELFCORE_ADDR_MAX;
1030#endif
1031
4857d4bb 1032 os_info_init();
99ca4e58 1033 setup_ipl();
3f6813b9 1034 setup_task_size();
50be6345
PH
1035
1036 /* Do some memory reservations *before* memory is added to memblock */
1037 reserve_memory_end();
67b5c3ee 1038 reserve_oldmem();
50be6345
PH
1039 reserve_kernel();
1040 reserve_initrd();
6966d604 1041 reserve_mem_detect_info();
50be6345
PH
1042 memblock_allow_resize();
1043
1044 /* Get information about *all* installed memory */
6966d604 1045 memblock_add_mem_detect_info();
50be6345 1046
6966d604 1047 free_mem_detect_info();
50be6345
PH
1048 remove_oldmem();
1049
1050 /*
1051 * Make sure all chunks are MAX_ORDER aligned so we don't need the
1052 * extra checks that HOLES_IN_ZONE would require.
1053 *
1054 * Is this still required?
1055 */
1056 memblock_trim_memory(1UL << (MAX_ORDER - 1 + PAGE_SHIFT));
1057
8b62bc96 1058 setup_memory_end();
c9e37353 1059 setup_memory();
e1231b0e 1060 dma_contiguous_reserve(memory_end);
3f429842 1061 vmcp_cma_reserve();
50be6345
PH
1062
1063 check_initrd();
1064 reserve_crashkernel();
1a36a39e 1065#ifdef CONFIG_CRASH_DUMP
1592a8e4
MH
1066 /*
1067 * Be aware that smp_save_dump_cpus() triggers a system reset.
1068 * Therefore CPU and device initialization should be done afterwards.
1069 */
1070 smp_save_dump_cpus();
1a36a39e 1071#endif
50be6345 1072
c9e37353
HC
1073 setup_resources();
1074 setup_lowcore();
d80512f8 1075 smp_fill_possible_mask();
097a116c 1076 cpu_detect_mhz_feature();
1da177e4 1077 cpu_init();
3a368f74 1078 numa_setup();
af51160e 1079 smp_detect_cpus();
8c910580 1080 topology_init_early();
1da177e4
LT
1081
1082 /*
1083 * Create kernel page tables and switch to virtual addressing.
1084 */
1085 paging_init();
1086
1087 /* Setup default console */
1088 conmode_default();
637952ca 1089 set_preferred_console();
411ed322 1090
686140a1 1091 apply_alternative_instructions();
f19fbd5e
MS
1092 if (IS_ENABLED(CONFIG_EXPOLINE))
1093 nospec_init_branches();
686140a1 1094
411ed322 1095 /* Setup zfcpdump support */
fe72ffba 1096 setup_zfcpdump();
bcfcbb6b
MS
1097
1098 /* Add system specific data to the random pool */
1099 setup_randomness();
1da177e4 1100}