s390: wire up sys_renameat2
[deliverable/linux.git] / arch / s390 / kernel / setup.c
CommitLineData
1da177e4 1/*
1da177e4 2 * S390 version
a53c8fab 3 * Copyright IBM Corp. 1999, 2012
1da177e4
LT
4 * Author(s): Hartmut Penner (hp@de.ibm.com),
5 * Martin Schwidefsky (schwidefsky@de.ibm.com)
6 *
7 * Derived from "arch/i386/kernel/setup.c"
8 * Copyright (C) 1995, Linus Torvalds
9 */
10
11/*
12 * This file handles the architecture-dependent parts of initialization
13 */
14
3b6ed4ab
MS
15#define KMSG_COMPONENT "setup"
16#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
17
1da177e4 18#include <linux/errno.h>
0872922f 19#include <linux/export.h>
1da177e4
LT
20#include <linux/sched.h>
21#include <linux/kernel.h>
ff38df37 22#include <linux/memblock.h>
1da177e4
LT
23#include <linux/mm.h>
24#include <linux/stddef.h>
25#include <linux/unistd.h>
26#include <linux/ptrace.h>
1da177e4 27#include <linux/user.h>
1da177e4
LT
28#include <linux/tty.h>
29#include <linux/ioport.h>
30#include <linux/delay.h>
1da177e4
LT
31#include <linux/init.h>
32#include <linux/initrd.h>
33#include <linux/bootmem.h>
34#include <linux/root_dev.h>
35#include <linux/console.h>
1da177e4 36#include <linux/kernel_stat.h>
1e8e3383 37#include <linux/device.h>
585c3047 38#include <linux/notifier.h>
65912a84 39#include <linux/pfn.h>
fe355b7f 40#include <linux/ctype.h>
2b67fc46 41#include <linux/reboot.h>
dbd70fb4 42#include <linux/topology.h>
dfd9f7ab 43#include <linux/ftrace.h>
60a0c68d
MH
44#include <linux/kexec.h>
45#include <linux/crash_dump.h>
46#include <linux/memory.h>
048cd4e5 47#include <linux/compat.h>
1da177e4 48
46b05d26 49#include <asm/ipl.h>
1e3cab2f 50#include <asm/facility.h>
1da177e4
LT
51#include <asm/smp.h>
52#include <asm/mmu_context.h>
53#include <asm/cpcmd.h>
54#include <asm/lowcore.h>
55#include <asm/irq.h>
0b642ede
PO
56#include <asm/page.h>
57#include <asm/ptrace.h>
cc13ad62 58#include <asm/sections.h>
fe355b7f 59#include <asm/ebcdic.h>
faeba830 60#include <asm/kvm_virtio.h>
60a0c68d 61#include <asm/diag.h>
4857d4bb 62#include <asm/os_info.h>
cd183459 63#include <asm/sclp.h>
8b646bd7 64#include "entry.h"
c1821c2e 65
1da177e4
LT
66/*
67 * Machine setup..
68 */
69unsigned int console_mode = 0;
1485c5c8
HC
70EXPORT_SYMBOL(console_mode);
71
1da177e4 72unsigned int console_devno = -1;
1485c5c8
HC
73EXPORT_SYMBOL(console_devno);
74
1da177e4 75unsigned int console_irq = -1;
1485c5c8
HC
76EXPORT_SYMBOL(console_irq);
77
cf8ba7a9
MS
78unsigned long elf_hwcap = 0;
79char elf_platform[ELF_PLATFORM_SIZE];
36a2bd42 80
23d17421 81struct mem_chunk __initdata memory_chunk[MEMORY_CHUNKS];
23d75d9c
HC
82
83int __initdata memory_end_set;
84unsigned long __initdata memory_end;
1da177e4 85
14045ebf
MS
86unsigned long VMALLOC_START;
87EXPORT_SYMBOL(VMALLOC_START);
88
89unsigned long VMALLOC_END;
90EXPORT_SYMBOL(VMALLOC_END);
91
92struct page *vmemmap;
93EXPORT_SYMBOL(vmemmap);
94
c972cc60
HC
95#ifdef CONFIG_64BIT
96unsigned long MODULES_VADDR;
97unsigned long MODULES_END;
98#endif
99
099b7651
FM
100/* An array with a pointer to the lowcore of every CPU. */
101struct _lowcore *lowcore_ptr[NR_CPUS];
102EXPORT_SYMBOL(lowcore_ptr);
103
1da177e4
LT
/*
 * This is set up by the setup-routine at boot-time.
 * For S390 we need to find out what we have to set up
 * using address 0x10400 ...
 */
109
110#include <asm/setup.h>
111
1da177e4
LT
112/*
113 * condev= and conmode= setup parameter.
114 */
115
116static int __init condev_setup(char *str)
117{
118 int vdev;
119
120 vdev = simple_strtoul(str, &str, 0);
121 if (vdev >= 0 && vdev < 65536) {
122 console_devno = vdev;
123 console_irq = -1;
124 }
125 return 1;
126}
127
128__setup("condev=", condev_setup);
129
637952ca
HB
130static void __init set_preferred_console(void)
131{
cd183459
HG
132 if (MACHINE_IS_KVM) {
133 if (sclp_has_vt220())
134 add_preferred_console("ttyS", 1, NULL);
135 else if (sclp_has_linemode())
136 add_preferred_console("ttyS", 0, NULL);
137 else
138 add_preferred_console("hvc", 0, NULL);
139 } else if (CONSOLE_IS_3215 || CONSOLE_IS_SCLP)
637952ca 140 add_preferred_console("ttyS", 0, NULL);
c4de0c1a 141 else if (CONSOLE_IS_3270)
637952ca
HB
142 add_preferred_console("tty3270", 0, NULL);
143}
144
1da177e4
LT
145static int __init conmode_setup(char *str)
146{
8c0933ee 147#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
1da177e4
LT
148 if (strncmp(str, "hwc", 4) == 0 || strncmp(str, "sclp", 5) == 0)
149 SET_CONSOLE_SCLP;
150#endif
151#if defined(CONFIG_TN3215_CONSOLE)
152 if (strncmp(str, "3215", 5) == 0)
153 SET_CONSOLE_3215;
154#endif
155#if defined(CONFIG_TN3270_CONSOLE)
156 if (strncmp(str, "3270", 5) == 0)
157 SET_CONSOLE_3270;
158#endif
637952ca 159 set_preferred_console();
1da177e4
LT
160 return 1;
161}
162
163__setup("conmode=", conmode_setup);
164
165static void __init conmode_default(void)
166{
167 char query_buffer[1024];
168 char *ptr;
169
170 if (MACHINE_IS_VM) {
740b5706 171 cpcmd("QUERY CONSOLE", query_buffer, 1024, NULL);
1da177e4
LT
172 console_devno = simple_strtoul(query_buffer + 5, NULL, 16);
173 ptr = strstr(query_buffer, "SUBCHANNEL =");
174 console_irq = simple_strtoul(ptr + 13, NULL, 16);
740b5706 175 cpcmd("QUERY TERM", query_buffer, 1024, NULL);
1da177e4
LT
176 ptr = strstr(query_buffer, "CONMODE");
177 /*
178 * Set the conmode to 3215 so that the device recognition
179 * will set the cu_type of the console to 3215. If the
180 * conmode is 3270 and we don't set it back then both
181 * 3215 and the 3270 driver will try to access the console
182 * device (3215 as console and 3270 as normal tty).
183 */
740b5706 184 cpcmd("TERM CONMODE 3215", NULL, 0, NULL);
1da177e4 185 if (ptr == NULL) {
8c0933ee 186#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
1da177e4
LT
187 SET_CONSOLE_SCLP;
188#endif
189 return;
190 }
191 if (strncmp(ptr + 8, "3270", 4) == 0) {
192#if defined(CONFIG_TN3270_CONSOLE)
193 SET_CONSOLE_3270;
194#elif defined(CONFIG_TN3215_CONSOLE)
195 SET_CONSOLE_3215;
8c0933ee 196#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
1da177e4
LT
197 SET_CONSOLE_SCLP;
198#endif
199 } else if (strncmp(ptr + 8, "3215", 4) == 0) {
200#if defined(CONFIG_TN3215_CONSOLE)
201 SET_CONSOLE_3215;
202#elif defined(CONFIG_TN3270_CONSOLE)
203 SET_CONSOLE_3270;
8c0933ee 204#elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
1da177e4
LT
205 SET_CONSOLE_SCLP;
206#endif
207 }
1da177e4 208 } else {
8c0933ee 209#if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
1da177e4
LT
210 SET_CONSOLE_SCLP;
211#endif
212 }
213}
214
#ifdef CONFIG_ZFCPDUMP
/*
 * Prepare the kernel for zfcpdump operation: when IPLed as an FCP dump
 * kernel and OLDMEM_BASE is not set, append a cio_ignore option to the
 * boot command line and lower the console log level to 2.
 */
static void __init setup_zfcpdump(void)
{
	if (ipl_info.type != IPL_TYPE_FCP_DUMP || OLDMEM_BASE)
		return;

	strcat(boot_command_line, " cio_ignore=all,!ipldev,!condev");
	console_loglevel = 2;
}
#else
static inline void setup_zfcpdump(void) {}
#endif /* CONFIG_ZFCPDUMP */
228
1da177e4
LT
229 /*
230 * Reboot, halt and power_off stubs. They just call _machine_restart,
231 * _machine_halt or _machine_power_off.
232 */
233
234void machine_restart(char *command)
235{
7aa8dac7 236 if ((!in_interrupt() && !in_atomic()) || oops_in_progress)
06fa46a2
MS
237 /*
238 * Only unblank the console if we are called in enabled
239 * context or a bust_spinlocks cleared the way for us.
240 */
241 console_unblank();
1da177e4
LT
242 _machine_restart(command);
243}
244
1da177e4
LT
245void machine_halt(void)
246{
06fa46a2
MS
247 if (!in_interrupt() || oops_in_progress)
248 /*
249 * Only unblank the console if we are called in enabled
250 * context or a bust_spinlocks cleared the way for us.
251 */
252 console_unblank();
1da177e4
LT
253 _machine_halt();
254}
255
1da177e4
LT
256void machine_power_off(void)
257{
06fa46a2
MS
258 if (!in_interrupt() || oops_in_progress)
259 /*
260 * Only unblank the console if we are called in enabled
261 * context or a bust_spinlocks cleared the way for us.
262 */
263 console_unblank();
1da177e4
LT
264 _machine_power_off();
265}
266
53df751c
MS
267/*
268 * Dummy power off function.
269 */
270void (*pm_power_off)(void) = machine_power_off;
0872922f 271EXPORT_SYMBOL_GPL(pm_power_off);
53df751c 272
59685296
HC
273static int __init early_parse_mem(char *p)
274{
275 memory_end = memparse(p, &p);
23d75d9c 276 memory_end_set = 1;
59685296
HC
277 return 0;
278}
279early_param("mem", early_parse_mem);
280
14045ebf
MS
281static int __init parse_vmalloc(char *arg)
282{
283 if (!arg)
284 return -EINVAL;
285 VMALLOC_END = (memparse(arg, &arg) + PAGE_SIZE - 1) & PAGE_MASK;
286 return 0;
287}
288early_param("vmalloc", parse_vmalloc);
289
8b646bd7
MS
290void *restart_stack __attribute__((__section__(".data")));
291
292static void __init setup_lowcore(void)
c9e37353
HC
293{
294 struct _lowcore *lc;
c9e37353
HC
295
296 /*
297 * Setup lowcore for boot cpu
298 */
cbb870c8 299 BUILD_BUG_ON(sizeof(struct _lowcore) != LC_PAGES * 4096);
a0878656 300 lc = __alloc_bootmem_low(LC_PAGES * PAGE_SIZE, LC_PAGES * PAGE_SIZE, 0);
e258d719 301 lc->restart_psw.mask = PSW_KERNEL_BITS;
c9e37353 302 lc->restart_psw.addr =
8b646bd7 303 PSW_ADDR_AMODE | (unsigned long) restart_int_handler;
e258d719 304 lc->external_new_psw.mask = PSW_KERNEL_BITS |
b50511e4 305 PSW_MASK_DAT | PSW_MASK_MCHECK;
c9e37353
HC
306 lc->external_new_psw.addr =
307 PSW_ADDR_AMODE | (unsigned long) ext_int_handler;
e258d719 308 lc->svc_new_psw.mask = PSW_KERNEL_BITS |
b50511e4 309 PSW_MASK_DAT | PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK;
c9e37353 310 lc->svc_new_psw.addr = PSW_ADDR_AMODE | (unsigned long) system_call;
e258d719 311 lc->program_new_psw.mask = PSW_KERNEL_BITS |
b50511e4 312 PSW_MASK_DAT | PSW_MASK_MCHECK;
c9e37353 313 lc->program_new_psw.addr =
b50511e4 314 PSW_ADDR_AMODE | (unsigned long) pgm_check_handler;
e258d719 315 lc->mcck_new_psw.mask = PSW_KERNEL_BITS;
c9e37353
HC
316 lc->mcck_new_psw.addr =
317 PSW_ADDR_AMODE | (unsigned long) mcck_int_handler;
e258d719 318 lc->io_new_psw.mask = PSW_KERNEL_BITS |
b50511e4 319 PSW_MASK_DAT | PSW_MASK_MCHECK;
c9e37353 320 lc->io_new_psw.addr = PSW_ADDR_AMODE | (unsigned long) io_int_handler;
5a62b192 321 lc->clock_comparator = -1ULL;
dc7ee00d
MS
322 lc->kernel_stack = ((unsigned long) &init_thread_union)
323 + THREAD_SIZE - STACK_FRAME_OVERHEAD - sizeof(struct pt_regs);
c9e37353 324 lc->async_stack = (unsigned long)
dc7ee00d
MS
325 __alloc_bootmem(ASYNC_SIZE, ASYNC_SIZE, 0)
326 + ASYNC_SIZE - STACK_FRAME_OVERHEAD - sizeof(struct pt_regs);
c9e37353 327 lc->panic_stack = (unsigned long)
dc7ee00d
MS
328 __alloc_bootmem(PAGE_SIZE, PAGE_SIZE, 0)
329 + PAGE_SIZE - STACK_FRAME_OVERHEAD - sizeof(struct pt_regs);
c9e37353
HC
330 lc->current_task = (unsigned long) init_thread_union.thread_info.task;
331 lc->thread_info = (unsigned long) &init_thread_union;
25097bf1 332 lc->machine_flags = S390_lowcore.machine_flags;
14375bc4
MS
333 lc->stfl_fac_list = S390_lowcore.stfl_fac_list;
334 memcpy(lc->stfle_fac_list, S390_lowcore.stfle_fac_list,
335 MAX_FACILITY_BIT/8);
347a8dc3 336#ifndef CONFIG_64BIT
77fa2245
HC
337 if (MACHINE_HAS_IEEE) {
338 lc->extended_save_area_addr = (__u32)
a0878656 339 __alloc_bootmem_low(PAGE_SIZE, PAGE_SIZE, 0);
77fa2245 340 /* enable extended save area */
c4972f33 341 __ctl_set_bit(14, 29);
77fa2245 342 }
c742b31c
MS
343#else
344 lc->vdso_per_cpu_data = (unsigned long) &lc->paste[0];
77fa2245 345#endif
ab96e798
MS
346 lc->sync_enter_timer = S390_lowcore.sync_enter_timer;
347 lc->async_enter_timer = S390_lowcore.async_enter_timer;
348 lc->exit_timer = S390_lowcore.exit_timer;
349 lc->user_timer = S390_lowcore.user_timer;
350 lc->system_timer = S390_lowcore.system_timer;
351 lc->steal_timer = S390_lowcore.steal_timer;
352 lc->last_update_timer = S390_lowcore.last_update_timer;
353 lc->last_update_clock = S390_lowcore.last_update_clock;
dfd9f7ab 354 lc->ftrace_func = S390_lowcore.ftrace_func;
8b646bd7
MS
355
356 restart_stack = __alloc_bootmem(ASYNC_SIZE, ASYNC_SIZE, 0);
357 restart_stack += ASYNC_SIZE;
358
359 /*
360 * Set up PSW restart to call ipl.c:do_restart(). Copy the relevant
b4a96015 361 * restart data to the absolute zero lowcore. This is necessary if
8b646bd7
MS
362 * PSW restart is done on an offline CPU that has lowcore zero.
363 */
364 lc->restart_stack = (unsigned long) restart_stack;
365 lc->restart_fn = (unsigned long) do_restart;
366 lc->restart_data = 0;
367 lc->restart_source = -1UL;
73bf463e
MH
368
369 /* Setup absolute zero lowcore */
fbe76568
HC
370 mem_assign_absolute(S390_lowcore.restart_stack, lc->restart_stack);
371 mem_assign_absolute(S390_lowcore.restart_fn, lc->restart_fn);
372 mem_assign_absolute(S390_lowcore.restart_data, lc->restart_data);
373 mem_assign_absolute(S390_lowcore.restart_source, lc->restart_source);
374 mem_assign_absolute(S390_lowcore.restart_psw, lc->restart_psw);
8b646bd7 375
c9e37353 376 set_prefix((u32)(unsigned long) lc);
099b7651 377 lowcore_ptr[0] = lc;
c9e37353
HC
378}
379
71189284
HC
380static struct resource code_resource = {
381 .name = "Kernel code",
382 .flags = IORESOURCE_BUSY | IORESOURCE_MEM,
383};
384
385static struct resource data_resource = {
386 .name = "Kernel data",
387 .flags = IORESOURCE_BUSY | IORESOURCE_MEM,
388};
389
4cc69531
HC
390static struct resource bss_resource = {
391 .name = "Kernel bss",
392 .flags = IORESOURCE_BUSY | IORESOURCE_MEM,
393};
394
71189284
HC
395static struct resource __initdata *standard_resources[] = {
396 &code_resource,
397 &data_resource,
4cc69531 398 &bss_resource,
71189284
HC
399};
400
401static void __init setup_resources(void)
c9e37353 402{
71189284
HC
403 struct resource *res, *std_res, *sub_res;
404 int i, j;
c9e37353 405
cc13ad62
HC
406 code_resource.start = (unsigned long) &_text;
407 code_resource.end = (unsigned long) &_etext - 1;
408 data_resource.start = (unsigned long) &_etext;
409 data_resource.end = (unsigned long) &_edata - 1;
4cc69531
HC
410 bss_resource.start = (unsigned long) &__bss_start;
411 bss_resource.end = (unsigned long) &__bss_stop - 1;
cc13ad62 412
9f4b0ba8
HC
413 for (i = 0; i < MEMORY_CHUNKS; i++) {
414 if (!memory_chunk[i].size)
415 continue;
71189284 416 res = alloc_bootmem_low(sizeof(*res));
c9e37353
HC
417 res->flags = IORESOURCE_BUSY | IORESOURCE_MEM;
418 switch (memory_chunk[i].type) {
419 case CHUNK_READ_WRITE:
420 res->name = "System RAM";
421 break;
422 case CHUNK_READ_ONLY:
423 res->name = "System ROM";
424 res->flags |= IORESOURCE_READONLY;
425 break;
426 default:
427 res->name = "reserved";
428 }
429 res->start = memory_chunk[i].addr;
71189284 430 res->end = res->start + memory_chunk[i].size - 1;
c9e37353 431 request_resource(&iomem_resource, res);
fe355b7f 432
71189284
HC
433 for (j = 0; j < ARRAY_SIZE(standard_resources); j++) {
434 std_res = standard_resources[j];
435 if (std_res->start < res->start ||
436 std_res->start > res->end)
437 continue;
438 if (std_res->end > res->end) {
439 sub_res = alloc_bootmem_low(sizeof(*sub_res));
440 *sub_res = *std_res;
441 sub_res->end = res->end;
442 std_res->start = res->end + 1;
443 request_resource(res, sub_res);
444 } else {
445 request_resource(res, std_res);
446 }
fe355b7f 447 }
c9e37353
HC
448 }
449}
450
8b62bc96
HC
451static void __init setup_memory_end(void)
452{
14045ebf 453 unsigned long vmax, vmalloc_size, tmp;
118131a2 454 unsigned long real_memory_size = 0;
8b62bc96
HC
455 int i;
456
60a0c68d 457
59f2e69d 458#ifdef CONFIG_ZFCPDUMP
e657d8fe
MH
459 if (ipl_info.type == IPL_TYPE_FCP_DUMP &&
460 !OLDMEM_BASE && sclp_get_hsa_size()) {
461 memory_end = sclp_get_hsa_size();
23d75d9c
HC
462 memory_end_set = 1;
463 }
411ed322 464#endif
8b62bc96
HC
465 memory_end &= PAGE_MASK;
466
9f4b0ba8
HC
467 /*
468 * Make sure all chunks are MAX_ORDER aligned so we don't need the
469 * extra checks that HOLES_IN_ZONE would require.
470 */
471 for (i = 0; i < MEMORY_CHUNKS; i++) {
472 unsigned long start, end;
473 struct mem_chunk *chunk;
474 unsigned long align;
475
476 chunk = &memory_chunk[i];
996b4a7d 477 if (!chunk->size)
67b5c3ee 478 continue;
9f4b0ba8
HC
479 align = 1UL << (MAX_ORDER + PAGE_SHIFT - 1);
480 start = (chunk->addr + align - 1) & ~(align - 1);
481 end = (chunk->addr + chunk->size) & ~(align - 1);
482 if (start >= end)
483 memset(chunk, 0, sizeof(*chunk));
484 else {
485 chunk->addr = start;
486 chunk->size = end - start;
487 }
14045ebf
MS
488 real_memory_size = max(real_memory_size,
489 chunk->addr + chunk->size);
9f4b0ba8
HC
490 }
491
14045ebf
MS
492 /* Choose kernel address space layout: 2, 3, or 4 levels. */
493#ifdef CONFIG_64BIT
c972cc60 494 vmalloc_size = VMALLOC_END ?: (128UL << 30) - MODULES_LEN;
14045ebf
MS
495 tmp = (memory_end ?: real_memory_size) / PAGE_SIZE;
496 tmp = tmp * (sizeof(struct page) + PAGE_SIZE) + vmalloc_size;
497 if (tmp <= (1UL << 42))
498 vmax = 1UL << 42; /* 3-level kernel page table */
499 else
500 vmax = 1UL << 53; /* 4-level kernel page table */
c972cc60
HC
501 /* module area is at the end of the kernel address space. */
502 MODULES_END = vmax;
503 MODULES_VADDR = MODULES_END - MODULES_LEN;
504 VMALLOC_END = MODULES_VADDR;
14045ebf
MS
505#else
506 vmalloc_size = VMALLOC_END ?: 96UL << 20;
507 vmax = 1UL << 31; /* 2-level kernel page table */
14045ebf
MS
508 /* vmalloc area is at the end of the kernel address space. */
509 VMALLOC_END = vmax;
c972cc60 510#endif
14045ebf
MS
511 VMALLOC_START = vmax - vmalloc_size;
512
513 /* Split remaining virtual space between 1:1 mapping & vmemmap array */
514 tmp = VMALLOC_START / (PAGE_SIZE + sizeof(struct page));
a7bb1ae7
HC
515 /* vmemmap contains a multiple of PAGES_PER_SECTION struct pages */
516 tmp = SECTION_ALIGN_UP(tmp);
14045ebf
MS
517 tmp = VMALLOC_START - tmp * sizeof(struct page);
518 tmp &= ~((vmax >> 11) - 1); /* align to page table level */
519 tmp = min(tmp, 1UL << MAX_PHYSMEM_BITS);
520 vmemmap = (struct page *) tmp;
521
522 /* Take care that memory_end is set and <= vmemmap */
523 memory_end = min(memory_end ?: real_memory_size, tmp);
524
525 /* Fixup memory chunk array to fit into 0..memory_end */
8b62bc96
HC
526 for (i = 0; i < MEMORY_CHUNKS; i++) {
527 struct mem_chunk *chunk = &memory_chunk[i];
528
996b4a7d 529 if (!chunk->size)
67b5c3ee 530 continue;
14045ebf 531 if (chunk->addr >= memory_end) {
8b62bc96
HC
532 memset(chunk, 0, sizeof(*chunk));
533 continue;
534 }
14045ebf
MS
535 if (chunk->addr + chunk->size > memory_end)
536 chunk->size = memory_end - chunk->addr;
8b62bc96 537 }
8b62bc96
HC
538}
539
d38593f9
MH
540static void __init setup_vmcoreinfo(void)
541{
fbe76568 542 mem_assign_absolute(S390_lowcore.vmcore_info, paddr_vmcoreinfo_note());
d38593f9
MH
543}
544
60a0c68d
MH
545#ifdef CONFIG_CRASH_DUMP
546
547/*
548 * Find suitable location for crashkernel memory
549 */
550static unsigned long __init find_crash_base(unsigned long crash_size,
551 char **msg)
552{
553 unsigned long crash_base;
554 struct mem_chunk *chunk;
555 int i;
556
557 if (memory_chunk[0].size < crash_size) {
558 *msg = "first memory chunk must be at least crashkernel size";
559 return 0;
560 }
5f894cbb 561 if (OLDMEM_BASE && crash_size == OLDMEM_SIZE)
60a0c68d
MH
562 return OLDMEM_BASE;
563
564 for (i = MEMORY_CHUNKS - 1; i >= 0; i--) {
565 chunk = &memory_chunk[i];
566 if (chunk->size == 0)
567 continue;
568 if (chunk->type != CHUNK_READ_WRITE)
569 continue;
570 if (chunk->size < crash_size)
571 continue;
572 crash_base = (chunk->addr + chunk->size) - crash_size;
573 if (crash_base < crash_size)
574 continue;
e657d8fe 575 if (crash_base < sclp_get_hsa_size())
60a0c68d
MH
576 continue;
577 if (crash_base < (unsigned long) INITRD_START + INITRD_SIZE)
578 continue;
579 return crash_base;
580 }
581 *msg = "no suitable area found";
582 return 0;
583}
584
585/*
586 * Check if crash_base and crash_size is valid
587 */
588static int __init verify_crash_base(unsigned long crash_base,
589 unsigned long crash_size,
590 char **msg)
591{
592 struct mem_chunk *chunk;
593 int i;
594
595 /*
596 * Because we do the swap to zero, we must have at least 'crash_size'
597 * bytes free space before crash_base
598 */
599 if (crash_size > crash_base) {
600 *msg = "crashkernel offset must be greater than size";
601 return -EINVAL;
602 }
603
604 /* First memory chunk must be at least crash_size */
605 if (memory_chunk[0].size < crash_size) {
606 *msg = "first memory chunk must be at least crashkernel size";
607 return -EINVAL;
608 }
609 /* Check if we fit into the respective memory chunk */
610 for (i = 0; i < MEMORY_CHUNKS; i++) {
611 chunk = &memory_chunk[i];
612 if (chunk->size == 0)
613 continue;
614 if (crash_base < chunk->addr)
615 continue;
616 if (crash_base >= chunk->addr + chunk->size)
617 continue;
618 /* we have found the memory chunk */
619 if (crash_base + crash_size > chunk->addr + chunk->size) {
620 *msg = "selected memory chunk is too small for "
621 "crashkernel memory";
622 return -EINVAL;
623 }
624 return 0;
625 }
626 *msg = "invalid memory range specified";
627 return -EINVAL;
628}
629
60a0c68d
MH
630/*
631 * When kdump is enabled, we have to ensure that no memory from
632 * the area [0 - crashkernel memory size] and
633 * [crashk_res.start - crashk_res.end] is set offline.
634 */
635static int kdump_mem_notifier(struct notifier_block *nb,
636 unsigned long action, void *data)
637{
638 struct memory_notify *arg = data;
639
640 if (arg->start_pfn < PFN_DOWN(resource_size(&crashk_res)))
641 return NOTIFY_BAD;
642 if (arg->start_pfn > PFN_DOWN(crashk_res.end))
643 return NOTIFY_OK;
644 if (arg->start_pfn + arg->nr_pages - 1 < PFN_DOWN(crashk_res.start))
645 return NOTIFY_OK;
646 return NOTIFY_BAD;
647}
648
649static struct notifier_block kdump_mem_nb = {
650 .notifier_call = kdump_mem_notifier,
651};
652
653#endif
654
655/*
656 * Make sure that oldmem, where the dump is stored, is protected
657 */
658static void reserve_oldmem(void)
659{
660#ifdef CONFIG_CRASH_DUMP
118131a2
HC
661 unsigned long real_size = 0;
662 int i;
663
60a0c68d
MH
664 if (!OLDMEM_BASE)
665 return;
118131a2
HC
666 for (i = 0; i < MEMORY_CHUNKS; i++) {
667 struct mem_chunk *chunk = &memory_chunk[i];
60a0c68d 668
118131a2
HC
669 real_size = max(real_size, chunk->addr + chunk->size);
670 }
996b4a7d
HC
671 create_mem_hole(memory_chunk, OLDMEM_BASE, OLDMEM_SIZE);
672 create_mem_hole(memory_chunk, OLDMEM_SIZE, real_size - OLDMEM_SIZE);
60a0c68d
MH
673#endif
674}
675
676/*
677 * Reserve memory for kdump kernel to be loaded with kexec
678 */
679static void __init reserve_crashkernel(void)
680{
681#ifdef CONFIG_CRASH_DUMP
682 unsigned long long crash_base, crash_size;
4fdf7f43 683 char *msg = NULL;
60a0c68d
MH
684 int rc;
685
686 rc = parse_crashkernel(boot_command_line, memory_end, &crash_size,
687 &crash_base);
688 if (rc || crash_size == 0)
689 return;
dab7a7b1
MH
690 crash_base = ALIGN(crash_base, KEXEC_CRASH_MEM_ALIGN);
691 crash_size = ALIGN(crash_size, KEXEC_CRASH_MEM_ALIGN);
60a0c68d
MH
692 if (register_memory_notifier(&kdump_mem_nb))
693 return;
694 if (!crash_base)
695 crash_base = find_crash_base(crash_size, &msg);
696 if (!crash_base) {
697 pr_info("crashkernel reservation failed: %s\n", msg);
698 unregister_memory_notifier(&kdump_mem_nb);
699 return;
700 }
701 if (verify_crash_base(crash_base, crash_size, &msg)) {
702 pr_info("crashkernel reservation failed: %s\n", msg);
703 unregister_memory_notifier(&kdump_mem_nb);
704 return;
705 }
706 if (!OLDMEM_BASE && MACHINE_IS_VM)
707 diag10_range(PFN_DOWN(crash_base), PFN_DOWN(crash_size));
708 crashk_res.start = crash_base;
709 crashk_res.end = crash_base + crash_size - 1;
710 insert_resource(&iomem_resource, &crashk_res);
996b4a7d 711 create_mem_hole(memory_chunk, crash_base, crash_size);
60a0c68d
MH
712 pr_info("Reserving %lluMB of memory at %lluMB "
713 "for crashkernel (System RAM: %luMB)\n",
714 crash_size >> 20, crash_base >> 20, memory_end >> 20);
4857d4bb 715 os_info_crashkernel_add(crash_base, crash_size);
60a0c68d
MH
716#endif
717}
718
8b646bd7 719static void __init setup_memory(void)
c9e37353
HC
720{
721 unsigned long bootmap_size;
fe355b7f 722 unsigned long start_pfn, end_pfn;
c9e37353 723 int i;
1da177e4
LT
724
725 /*
726 * partially used pages are not usable - thus
727 * we are rounding upwards:
728 */
65912a84
HC
729 start_pfn = PFN_UP(__pa(&_end));
730 end_pfn = max_pfn = PFN_DOWN(memory_end);
1da177e4 731
65912a84
HC
732#ifdef CONFIG_BLK_DEV_INITRD
733 /*
734 * Move the initrd in case the bitmap of the bootmem allocater
735 * would overwrite it.
736 */
737
738 if (INITRD_START && INITRD_SIZE) {
739 unsigned long bmap_size;
740 unsigned long start;
741
742 bmap_size = bootmem_bootmap_pages(end_pfn - start_pfn + 1);
743 bmap_size = PFN_PHYS(bmap_size);
744
745 if (PFN_PHYS(start_pfn) + bmap_size > INITRD_START) {
746 start = PFN_PHYS(start_pfn) + bmap_size + PAGE_SIZE;
747
60a0c68d
MH
748#ifdef CONFIG_CRASH_DUMP
749 if (OLDMEM_BASE) {
750 /* Move initrd behind kdump oldmem */
751 if (start + INITRD_SIZE > OLDMEM_BASE &&
752 start < OLDMEM_BASE + OLDMEM_SIZE)
753 start = OLDMEM_BASE + OLDMEM_SIZE;
754 }
755#endif
65912a84 756 if (start + INITRD_SIZE > memory_end) {
3b6ed4ab
MS
757 pr_err("initrd extends beyond end of "
758 "memory (0x%08lx > 0x%08lx) "
65912a84
HC
759 "disabling initrd\n",
760 start + INITRD_SIZE, memory_end);
761 INITRD_START = INITRD_SIZE = 0;
762 } else {
3b6ed4ab
MS
763 pr_info("Moving initrd (0x%08lx -> "
764 "0x%08lx, size: %ld)\n",
765 INITRD_START, start, INITRD_SIZE);
65912a84
HC
766 memmove((void *) start, (void *) INITRD_START,
767 INITRD_SIZE);
768 INITRD_START = start;
769 }
770 }
771 }
772#endif
773
1da177e4 774 /*
7676bef9 775 * Initialize the boot-time allocator
1da177e4
LT
776 */
777 bootmap_size = init_bootmem(start_pfn, end_pfn);
778
779 /*
780 * Register RAM areas with the bootmem allocator.
781 */
c9e37353 782
996b4a7d 783 for (i = 0; i < MEMORY_CHUNKS; i++) {
39b742f9 784 unsigned long start_chunk, end_chunk, pfn;
1da177e4 785
996b4a7d 786 if (!memory_chunk[i].size)
1da177e4 787 continue;
39b742f9 788 start_chunk = PFN_DOWN(memory_chunk[i].addr);
fb2e7c5e 789 end_chunk = start_chunk + PFN_DOWN(memory_chunk[i].size);
39b742f9
HC
790 end_chunk = min(end_chunk, end_pfn);
791 if (start_chunk >= end_chunk)
792 continue;
ff38df37
TH
793 memblock_add_node(PFN_PHYS(start_chunk),
794 PFN_PHYS(end_chunk - start_chunk), 0);
39b742f9 795 pfn = max(start_chunk, start_pfn);
6b70a920 796 storage_key_init_range(PFN_PHYS(pfn), PFN_PHYS(end_chunk));
1da177e4
LT
797 }
798
0b642ede
PO
799 psw_set_key(PAGE_DEFAULT_KEY);
800
39b742f9 801 free_bootmem_with_active_regions(0, max_pfn);
c9e37353 802
615b04b3
HC
803 /*
804 * Reserve memory used for lowcore/command line/kernel image.
805 */
72a7fe39 806 reserve_bootmem(0, (unsigned long)_ehead, BOOTMEM_DEFAULT);
615b04b3 807 reserve_bootmem((unsigned long)_stext,
72a7fe39
BW
808 PFN_PHYS(start_pfn) - (unsigned long)_stext,
809 BOOTMEM_DEFAULT);
c9e37353
HC
810 /*
811 * Reserve the bootmem bitmap itself as well. We do this in two
812 * steps (first step was init_bootmem()) because this catches
813 * the (very unlikely) case of us accidentally initializing the
814 * bootmem allocator with an invalid RAM area.
815 */
72a7fe39
BW
816 reserve_bootmem(start_pfn << PAGE_SHIFT, bootmap_size,
817 BOOTMEM_DEFAULT);
1da177e4 818
60a0c68d
MH
819#ifdef CONFIG_CRASH_DUMP
820 if (crashk_res.start)
821 reserve_bootmem(crashk_res.start,
822 crashk_res.end - crashk_res.start + 1,
823 BOOTMEM_DEFAULT);
824 if (is_kdump_kernel())
825 reserve_bootmem(elfcorehdr_addr - OLDMEM_BASE,
826 PAGE_ALIGN(elfcorehdr_size), BOOTMEM_DEFAULT);
827#endif
1da177e4 828#ifdef CONFIG_BLK_DEV_INITRD
65912a84 829 if (INITRD_START && INITRD_SIZE) {
1da177e4 830 if (INITRD_START + INITRD_SIZE <= memory_end) {
72a7fe39
BW
831 reserve_bootmem(INITRD_START, INITRD_SIZE,
832 BOOTMEM_DEFAULT);
1da177e4
LT
833 initrd_start = INITRD_START;
834 initrd_end = initrd_start + INITRD_SIZE;
835 } else {
3b6ed4ab
MS
836 pr_err("initrd extends beyond end of "
837 "memory (0x%08lx > 0x%08lx) "
838 "disabling initrd\n",
c9e37353
HC
839 initrd_start + INITRD_SIZE, memory_end);
840 initrd_start = initrd_end = 0;
1da177e4 841 }
c9e37353 842 }
1da177e4 843#endif
c9e37353 844}
1da177e4 845
cf8ba7a9
MS
846/*
847 * Setup hardware capabilities.
848 */
849static void __init setup_hwcaps(void)
850{
851 static const int stfl_bits[6] = { 0, 2, 7, 17, 19, 21 };
94038a99 852 struct cpuid cpu_id;
cf8ba7a9
MS
853 int i;
854
cf8ba7a9
MS
855 /*
856 * The store facility list bits numbers as found in the principles
857 * of operation are numbered with bit 1UL<<31 as number 0 to
858 * bit 1UL<<0 as number 31.
859 * Bit 0: instructions named N3, "backported" to esa-mode
860 * Bit 2: z/Architecture mode is active
861 * Bit 7: the store-facility-list-extended facility is installed
862 * Bit 17: the message-security assist is installed
863 * Bit 19: the long-displacement facility is installed
864 * Bit 21: the extended-immediate facility is installed
488253ce
AK
865 * Bit 22: extended-translation facility 3 is installed
866 * Bit 30: extended-translation facility 3 enhancement facility
cf8ba7a9
MS
867 * These get translated to:
868 * HWCAP_S390_ESAN3 bit 0, HWCAP_S390_ZARCH bit 1,
869 * HWCAP_S390_STFLE bit 2, HWCAP_S390_MSA bit 3,
488253ce
AK
870 * HWCAP_S390_LDISP bit 4, HWCAP_S390_EIMM bit 5 and
871 * HWCAP_S390_ETF3EH bit 8 (22 && 30).
cf8ba7a9
MS
872 */
873 for (i = 0; i < 6; i++)
14375bc4 874 if (test_facility(stfl_bits[i]))
cf8ba7a9
MS
875 elf_hwcap |= 1UL << i;
876
14375bc4 877 if (test_facility(22) && test_facility(30))
ea2a4d3a 878 elf_hwcap |= HWCAP_S390_ETF3EH;
488253ce 879
cf8ba7a9
MS
880 /*
881 * Check for additional facilities with store-facility-list-extended.
882 * stfle stores doublewords (8 byte) with bit 1ULL<<63 as bit 0
883 * and 1ULL<<0 as bit 63. Bits 0-31 contain the same information
884 * as stored by stfl, bits 32-xxx contain additional facilities.
885 * How many facility words are stored depends on the number of
25985edc 886 * doublewords passed to the instruction. The additional facilities
cf8ba7a9 887 * are:
2ac3307f
CE
888 * Bit 42: decimal floating point facility is installed
889 * Bit 44: perform floating point operation facility is installed
cf8ba7a9 890 * translated to:
488253ce 891 * HWCAP_S390_DFP bit 6 (42 && 44).
cf8ba7a9 892 */
14375bc4
MS
893 if ((elf_hwcap & (1UL << 2)) && test_facility(42) && test_facility(44))
894 elf_hwcap |= HWCAP_S390_DFP;
cf8ba7a9 895
ea2a4d3a
HC
896 /*
897 * Huge page support HWCAP_S390_HPAGE is bit 7.
898 */
53492b1d 899 if (MACHINE_HAS_HPAGE)
ea2a4d3a
HC
900 elf_hwcap |= HWCAP_S390_HPAGE;
901
db2e1f43 902#if defined(CONFIG_64BIT)
ea2a4d3a
HC
903 /*
904 * 64-bit register support for 31-bit processes
905 * HWCAP_S390_HIGH_GPRS is bit 9.
906 */
907 elf_hwcap |= HWCAP_S390_HIGH_GPRS;
d35339a4
MS
908
909 /*
910 * Transactional execution support HWCAP_S390_TE is bit 10.
911 */
912 if (test_facility(50) && test_facility(73))
913 elf_hwcap |= HWCAP_S390_TE;
db2e1f43 914#endif
53492b1d 915
94038a99
MS
916 get_cpu_id(&cpu_id);
917 switch (cpu_id.machine) {
cf8ba7a9
MS
918 case 0x9672:
919#if !defined(CONFIG_64BIT)
920 default: /* Use "g5" as default for 31 bit kernels. */
921#endif
922 strcpy(elf_platform, "g5");
923 break;
924 case 0x2064:
925 case 0x2066:
926#if defined(CONFIG_64BIT)
927 default: /* Use "z900" as default for 64 bit kernels. */
928#endif
929 strcpy(elf_platform, "z900");
930 break;
931 case 0x2084:
932 case 0x2086:
933 strcpy(elf_platform, "z990");
934 break;
935 case 0x2094:
9fee8db2 936 case 0x2096:
cf8ba7a9
MS
937 strcpy(elf_platform, "z9-109");
938 break;
9fee8db2
MS
939 case 0x2097:
940 case 0x2098:
941 strcpy(elf_platform, "z10");
942 break;
c84b9051 943 case 0x2817:
3a81b171 944 case 0x2818:
c84b9051
HC
945 strcpy(elf_platform, "z196");
946 break;
991c1505 947 case 0x2827:
59471227 948 case 0x2828:
991c1505
HC
949 strcpy(elf_platform, "zEC12");
950 break;
cf8ba7a9
MS
951 }
952}
953
c9e37353
HC
954/*
955 * Setup function called from init/main.c just after the banner
956 * was printed.
957 */
1da177e4 958
8b646bd7 959void __init setup_arch(char **cmdline_p)
c9e37353 960{
1da177e4 961 /*
c9e37353 962 * print what head.S has found out about the machine
1da177e4 963 */
347a8dc3 964#ifndef CONFIG_64BIT
3b6ed4ab
MS
965 if (MACHINE_IS_VM)
966 pr_info("Linux is running as a z/VM "
967 "guest operating system in 31-bit mode\n");
27d71602 968 else if (MACHINE_IS_LPAR)
3b6ed4ab
MS
969 pr_info("Linux is running natively in 31-bit mode\n");
970 if (MACHINE_HAS_IEEE)
971 pr_info("The hardware system has IEEE compatible "
972 "floating point units\n");
973 else
974 pr_info("The hardware system has no IEEE compatible "
975 "floating point units\n");
347a8dc3 976#else /* CONFIG_64BIT */
fa587743 977 if (MACHINE_IS_VM)
3b6ed4ab
MS
978 pr_info("Linux is running as a z/VM "
979 "guest operating system in 64-bit mode\n");
637952ca 980 else if (MACHINE_IS_KVM)
3b6ed4ab 981 pr_info("Linux is running under KVM in 64-bit mode\n");
27d71602 982 else if (MACHINE_IS_LPAR)
3b6ed4ab 983 pr_info("Linux is running natively in 64-bit mode\n");
347a8dc3 984#endif /* CONFIG_64BIT */
c9e37353 985
a0443fbb
HB
986 /* Have one command line that is parsed and saved in /proc/cmdline */
987 /* boot_command_line has been already set up in early.c */
988 *cmdline_p = boot_command_line;
59685296 989
c9e37353 990 ROOT_DEV = Root_RAM0;
59685296
HC
991
992 init_mm.start_code = PAGE_OFFSET;
993 init_mm.end_code = (unsigned long) &_etext;
994 init_mm.end_data = (unsigned long) &_edata;
995 init_mm.brk = (unsigned long) &_end;
996
59685296 997 parse_early_param();
df1bd59c 998 detect_memory_layout(memory_chunk, memory_end);
4857d4bb 999 os_info_init();
99ca4e58 1000 setup_ipl();
67b5c3ee 1001 reserve_oldmem();
8b62bc96 1002 setup_memory_end();
60a0c68d 1003 reserve_crashkernel();
c9e37353
HC
1004 setup_memory();
1005 setup_resources();
d38593f9 1006 setup_vmcoreinfo();
c9e37353
HC
1007 setup_lowcore();
1008
d80512f8 1009 smp_fill_possible_mask();
1da177e4 1010 cpu_init();
dbd70fb4 1011 s390_init_cpu_topology();
1da177e4 1012
cf8ba7a9
MS
1013 /*
1014 * Setup capabilities (ELF_HWCAP & ELF_PLATFORM).
1015 */
1016 setup_hwcaps();
1017
1da177e4
LT
1018 /*
1019 * Create kernel page tables and switch to virtual addressing.
1020 */
1021 paging_init();
1022
1023 /* Setup default console */
1024 conmode_default();
637952ca 1025 set_preferred_console();
411ed322
MH
1026
1027 /* Setup zfcpdump support */
fe72ffba 1028 setup_zfcpdump();
1da177e4 1029}
This page took 0.763663 seconds and 5 git commands to generate.