3 * Copyright IBM Corp. 1999, 2012
4 * Author(s): Hartmut Penner (hp@de.ibm.com),
5 * Martin Schwidefsky (schwidefsky@de.ibm.com)
7 * Derived from "arch/i386/kernel/setup.c"
8 * Copyright (C) 1995, Linus Torvalds
12 * This file handles the architecture-dependent parts of initialization
15 #define KMSG_COMPONENT "setup"
16 #define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
18 #include <linux/errno.h>
19 #include <linux/module.h>
20 #include <linux/sched.h>
21 #include <linux/kernel.h>
22 #include <linux/memblock.h>
24 #include <linux/stddef.h>
25 #include <linux/unistd.h>
26 #include <linux/ptrace.h>
27 #include <linux/user.h>
28 #include <linux/tty.h>
29 #include <linux/ioport.h>
30 #include <linux/delay.h>
31 #include <linux/init.h>
32 #include <linux/initrd.h>
33 #include <linux/bootmem.h>
34 #include <linux/root_dev.h>
35 #include <linux/console.h>
36 #include <linux/kernel_stat.h>
37 #include <linux/device.h>
38 #include <linux/notifier.h>
39 #include <linux/pfn.h>
40 #include <linux/ctype.h>
41 #include <linux/reboot.h>
42 #include <linux/topology.h>
43 #include <linux/ftrace.h>
44 #include <linux/kexec.h>
45 #include <linux/crash_dump.h>
46 #include <linux/memory.h>
47 #include <linux/compat.h>
50 #include <asm/uaccess.h>
51 #include <asm/facility.h>
53 #include <asm/mmu_context.h>
54 #include <asm/cpcmd.h>
55 #include <asm/lowcore.h>
58 #include <asm/ptrace.h>
59 #include <asm/sections.h>
60 #include <asm/ebcdic.h>
61 #include <asm/kvm_virtio.h>
63 #include <asm/os_info.h>
67 long psw_kernel_bits
= PSW_DEFAULT_KEY
| PSW_MASK_BASE
| PSW_ASC_PRIMARY
|
68 PSW_MASK_EA
| PSW_MASK_BA
;
69 long psw_user_bits
= PSW_MASK_DAT
| PSW_MASK_IO
| PSW_MASK_EXT
|
70 PSW_DEFAULT_KEY
| PSW_MASK_BASE
| PSW_MASK_MCHECK
|
71 PSW_MASK_PSTATE
| PSW_ASC_HOME
;
74 * User copy operations.
76 struct uaccess_ops uaccess
;
77 EXPORT_SYMBOL(uaccess
);
82 unsigned int console_mode
= 0;
83 EXPORT_SYMBOL(console_mode
);
85 unsigned int console_devno
= -1;
86 EXPORT_SYMBOL(console_devno
);
88 unsigned int console_irq
= -1;
89 EXPORT_SYMBOL(console_irq
);
91 unsigned long elf_hwcap
= 0;
92 char elf_platform
[ELF_PLATFORM_SIZE
];
94 struct mem_chunk __initdata memory_chunk
[MEMORY_CHUNKS
];
96 int __initdata memory_end_set
;
97 unsigned long __initdata memory_end
;
99 unsigned long VMALLOC_START
;
100 EXPORT_SYMBOL(VMALLOC_START
);
102 unsigned long VMALLOC_END
;
103 EXPORT_SYMBOL(VMALLOC_END
);
105 struct page
*vmemmap
;
106 EXPORT_SYMBOL(vmemmap
);
109 unsigned long MODULES_VADDR
;
110 unsigned long MODULES_END
;
113 /* An array with a pointer to the lowcore of every CPU. */
114 struct _lowcore
*lowcore_ptr
[NR_CPUS
];
115 EXPORT_SYMBOL(lowcore_ptr
);
118 * This is set up by the setup-routine at boot-time
119 * for S390 need to find out, what we have to setup
120 * using address 0x10400 ...
123 #include <asm/setup.h>
126 * condev= and conmode= setup parameter.
129 static int __init
condev_setup(char *str
)
133 vdev
= simple_strtoul(str
, &str
, 0);
134 if (vdev
>= 0 && vdev
< 65536) {
135 console_devno
= vdev
;
141 __setup("condev=", condev_setup
);
143 static void __init
set_preferred_console(void)
145 if (MACHINE_IS_KVM
) {
146 if (sclp_has_vt220())
147 add_preferred_console("ttyS", 1, NULL
);
148 else if (sclp_has_linemode())
149 add_preferred_console("ttyS", 0, NULL
);
151 add_preferred_console("hvc", 0, NULL
);
152 } else if (CONSOLE_IS_3215
|| CONSOLE_IS_SCLP
)
153 add_preferred_console("ttyS", 0, NULL
);
154 else if (CONSOLE_IS_3270
)
155 add_preferred_console("tty3270", 0, NULL
);
158 static int __init
conmode_setup(char *str
)
160 #if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
161 if (strncmp(str
, "hwc", 4) == 0 || strncmp(str
, "sclp", 5) == 0)
164 #if defined(CONFIG_TN3215_CONSOLE)
165 if (strncmp(str
, "3215", 5) == 0)
168 #if defined(CONFIG_TN3270_CONSOLE)
169 if (strncmp(str
, "3270", 5) == 0)
172 set_preferred_console();
176 __setup("conmode=", conmode_setup
);
178 static void __init
conmode_default(void)
180 char query_buffer
[1024];
184 cpcmd("QUERY CONSOLE", query_buffer
, 1024, NULL
);
185 console_devno
= simple_strtoul(query_buffer
+ 5, NULL
, 16);
186 ptr
= strstr(query_buffer
, "SUBCHANNEL =");
187 console_irq
= simple_strtoul(ptr
+ 13, NULL
, 16);
188 cpcmd("QUERY TERM", query_buffer
, 1024, NULL
);
189 ptr
= strstr(query_buffer
, "CONMODE");
191 * Set the conmode to 3215 so that the device recognition
192 * will set the cu_type of the console to 3215. If the
193 * conmode is 3270 and we don't set it back then both
194 * 3215 and the 3270 driver will try to access the console
195 * device (3215 as console and 3270 as normal tty).
197 cpcmd("TERM CONMODE 3215", NULL
, 0, NULL
);
199 #if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
204 if (strncmp(ptr
+ 8, "3270", 4) == 0) {
205 #if defined(CONFIG_TN3270_CONSOLE)
207 #elif defined(CONFIG_TN3215_CONSOLE)
209 #elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
212 } else if (strncmp(ptr
+ 8, "3215", 4) == 0) {
213 #if defined(CONFIG_TN3215_CONSOLE)
215 #elif defined(CONFIG_TN3270_CONSOLE)
217 #elif defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
222 #if defined(CONFIG_SCLP_CONSOLE) || defined(CONFIG_SCLP_VT220_CONSOLE)
228 #ifdef CONFIG_ZFCPDUMP
229 static void __init
setup_zfcpdump(unsigned int console_devno
)
233 if (ipl_info
.type
!= IPL_TYPE_FCP_DUMP
)
237 if (console_devno
!= -1)
238 sprintf(str
, " cio_ignore=all,!0.0.%04x,!0.0.%04x",
239 ipl_info
.data
.fcp
.dev_id
.devno
, console_devno
);
241 sprintf(str
, " cio_ignore=all,!0.0.%04x",
242 ipl_info
.data
.fcp
.dev_id
.devno
);
243 strcat(boot_command_line
, str
);
244 console_loglevel
= 2;
247 static inline void setup_zfcpdump(unsigned int console_devno
) {}
248 #endif /* CONFIG_ZFCPDUMP */
251 * Reboot, halt and power_off stubs. They just call _machine_restart,
252 * _machine_halt or _machine_power_off.
255 void machine_restart(char *command
)
257 if ((!in_interrupt() && !in_atomic()) || oops_in_progress
)
259 * Only unblank the console if we are called in enabled
260 * context or a bust_spinlocks cleared the way for us.
263 _machine_restart(command
);
266 void machine_halt(void)
268 if (!in_interrupt() || oops_in_progress
)
270 * Only unblank the console if we are called in enabled
271 * context or a bust_spinlocks cleared the way for us.
277 void machine_power_off(void)
279 if (!in_interrupt() || oops_in_progress
)
281 * Only unblank the console if we are called in enabled
282 * context or a bust_spinlocks cleared the way for us.
285 _machine_power_off();
289 * Dummy power off function.
291 void (*pm_power_off
)(void) = machine_power_off
;
293 static int __init
early_parse_mem(char *p
)
295 memory_end
= memparse(p
, &p
);
299 early_param("mem", early_parse_mem
);
301 static int __init
parse_vmalloc(char *arg
)
305 VMALLOC_END
= (memparse(arg
, &arg
) + PAGE_SIZE
- 1) & PAGE_MASK
;
308 early_param("vmalloc", parse_vmalloc
);
310 unsigned int s390_user_mode
= PRIMARY_SPACE_MODE
;
311 EXPORT_SYMBOL_GPL(s390_user_mode
);
313 static void __init
set_user_mode_primary(void)
315 psw_kernel_bits
= (psw_kernel_bits
& ~PSW_MASK_ASC
) | PSW_ASC_HOME
;
316 psw_user_bits
= (psw_user_bits
& ~PSW_MASK_ASC
) | PSW_ASC_PRIMARY
;
319 (psw32_user_bits
& ~PSW32_MASK_ASC
) | PSW32_ASC_PRIMARY
;
321 uaccess
= MACHINE_HAS_MVCOS
? uaccess_mvcos_switch
: uaccess_pt
;
324 static int __init
early_parse_user_mode(char *p
)
326 if (p
&& strcmp(p
, "primary") == 0)
327 s390_user_mode
= PRIMARY_SPACE_MODE
;
328 else if (!p
|| strcmp(p
, "home") == 0)
329 s390_user_mode
= HOME_SPACE_MODE
;
334 early_param("user_mode", early_parse_user_mode
);
336 static void __init
setup_addressing_mode(void)
338 if (s390_user_mode
!= PRIMARY_SPACE_MODE
)
340 set_user_mode_primary();
341 if (MACHINE_HAS_MVCOS
)
342 pr_info("Address spaces switched, mvcos available\n");
344 pr_info("Address spaces switched, mvcos not available\n");
347 void *restart_stack
__attribute__((__section__(".data")));
349 static void __init
setup_lowcore(void)
354 * Setup lowcore for boot cpu
356 BUILD_BUG_ON(sizeof(struct _lowcore
) != LC_PAGES
* 4096);
357 lc
= __alloc_bootmem_low(LC_PAGES
* PAGE_SIZE
, LC_PAGES
* PAGE_SIZE
, 0);
358 lc
->restart_psw
.mask
= psw_kernel_bits
;
359 lc
->restart_psw
.addr
=
360 PSW_ADDR_AMODE
| (unsigned long) restart_int_handler
;
361 lc
->external_new_psw
.mask
= psw_kernel_bits
|
362 PSW_MASK_DAT
| PSW_MASK_MCHECK
;
363 lc
->external_new_psw
.addr
=
364 PSW_ADDR_AMODE
| (unsigned long) ext_int_handler
;
365 lc
->svc_new_psw
.mask
= psw_kernel_bits
|
366 PSW_MASK_DAT
| PSW_MASK_IO
| PSW_MASK_EXT
| PSW_MASK_MCHECK
;
367 lc
->svc_new_psw
.addr
= PSW_ADDR_AMODE
| (unsigned long) system_call
;
368 lc
->program_new_psw
.mask
= psw_kernel_bits
|
369 PSW_MASK_DAT
| PSW_MASK_MCHECK
;
370 lc
->program_new_psw
.addr
=
371 PSW_ADDR_AMODE
| (unsigned long) pgm_check_handler
;
372 lc
->mcck_new_psw
.mask
= psw_kernel_bits
;
373 lc
->mcck_new_psw
.addr
=
374 PSW_ADDR_AMODE
| (unsigned long) mcck_int_handler
;
375 lc
->io_new_psw
.mask
= psw_kernel_bits
|
376 PSW_MASK_DAT
| PSW_MASK_MCHECK
;
377 lc
->io_new_psw
.addr
= PSW_ADDR_AMODE
| (unsigned long) io_int_handler
;
378 lc
->clock_comparator
= -1ULL;
379 lc
->kernel_stack
= ((unsigned long) &init_thread_union
) + THREAD_SIZE
;
380 lc
->async_stack
= (unsigned long)
381 __alloc_bootmem(ASYNC_SIZE
, ASYNC_SIZE
, 0) + ASYNC_SIZE
;
382 lc
->panic_stack
= (unsigned long)
383 __alloc_bootmem(PAGE_SIZE
, PAGE_SIZE
, 0) + PAGE_SIZE
;
384 lc
->current_task
= (unsigned long) init_thread_union
.thread_info
.task
;
385 lc
->thread_info
= (unsigned long) &init_thread_union
;
386 lc
->machine_flags
= S390_lowcore
.machine_flags
;
387 lc
->stfl_fac_list
= S390_lowcore
.stfl_fac_list
;
388 memcpy(lc
->stfle_fac_list
, S390_lowcore
.stfle_fac_list
,
391 if (MACHINE_HAS_IEEE
) {
392 lc
->extended_save_area_addr
= (__u32
)
393 __alloc_bootmem_low(PAGE_SIZE
, PAGE_SIZE
, 0);
394 /* enable extended save area */
395 __ctl_set_bit(14, 29);
398 lc
->vdso_per_cpu_data
= (unsigned long) &lc
->paste
[0];
400 lc
->sync_enter_timer
= S390_lowcore
.sync_enter_timer
;
401 lc
->async_enter_timer
= S390_lowcore
.async_enter_timer
;
402 lc
->exit_timer
= S390_lowcore
.exit_timer
;
403 lc
->user_timer
= S390_lowcore
.user_timer
;
404 lc
->system_timer
= S390_lowcore
.system_timer
;
405 lc
->steal_timer
= S390_lowcore
.steal_timer
;
406 lc
->last_update_timer
= S390_lowcore
.last_update_timer
;
407 lc
->last_update_clock
= S390_lowcore
.last_update_clock
;
408 lc
->ftrace_func
= S390_lowcore
.ftrace_func
;
410 restart_stack
= __alloc_bootmem(ASYNC_SIZE
, ASYNC_SIZE
, 0);
411 restart_stack
+= ASYNC_SIZE
;
414 * Set up PSW restart to call ipl.c:do_restart(). Copy the relevant
415 * restart data to the absolute zero lowcore. This is necesary if
416 * PSW restart is done on an offline CPU that has lowcore zero.
418 lc
->restart_stack
= (unsigned long) restart_stack
;
419 lc
->restart_fn
= (unsigned long) do_restart
;
420 lc
->restart_data
= 0;
421 lc
->restart_source
= -1UL;
423 /* Setup absolute zero lowcore */
424 mem_assign_absolute(S390_lowcore
.restart_stack
, lc
->restart_stack
);
425 mem_assign_absolute(S390_lowcore
.restart_fn
, lc
->restart_fn
);
426 mem_assign_absolute(S390_lowcore
.restart_data
, lc
->restart_data
);
427 mem_assign_absolute(S390_lowcore
.restart_source
, lc
->restart_source
);
428 mem_assign_absolute(S390_lowcore
.restart_psw
, lc
->restart_psw
);
430 set_prefix((u32
)(unsigned long) lc
);
434 static struct resource code_resource
= {
435 .name
= "Kernel code",
436 .flags
= IORESOURCE_BUSY
| IORESOURCE_MEM
,
439 static struct resource data_resource
= {
440 .name
= "Kernel data",
441 .flags
= IORESOURCE_BUSY
| IORESOURCE_MEM
,
444 static struct resource bss_resource
= {
445 .name
= "Kernel bss",
446 .flags
= IORESOURCE_BUSY
| IORESOURCE_MEM
,
449 static struct resource __initdata
*standard_resources
[] = {
455 static void __init
setup_resources(void)
457 struct resource
*res
, *std_res
, *sub_res
;
460 code_resource
.start
= (unsigned long) &_text
;
461 code_resource
.end
= (unsigned long) &_etext
- 1;
462 data_resource
.start
= (unsigned long) &_etext
;
463 data_resource
.end
= (unsigned long) &_edata
- 1;
464 bss_resource
.start
= (unsigned long) &__bss_start
;
465 bss_resource
.end
= (unsigned long) &__bss_stop
- 1;
467 for (i
= 0; i
< MEMORY_CHUNKS
; i
++) {
468 if (!memory_chunk
[i
].size
)
470 if (memory_chunk
[i
].type
== CHUNK_OLDMEM
||
471 memory_chunk
[i
].type
== CHUNK_CRASHK
)
473 res
= alloc_bootmem_low(sizeof(*res
));
474 res
->flags
= IORESOURCE_BUSY
| IORESOURCE_MEM
;
475 switch (memory_chunk
[i
].type
) {
476 case CHUNK_READ_WRITE
:
478 res
->name
= "System RAM";
480 case CHUNK_READ_ONLY
:
481 res
->name
= "System ROM";
482 res
->flags
|= IORESOURCE_READONLY
;
485 res
->name
= "reserved";
487 res
->start
= memory_chunk
[i
].addr
;
488 res
->end
= res
->start
+ memory_chunk
[i
].size
- 1;
489 request_resource(&iomem_resource
, res
);
491 for (j
= 0; j
< ARRAY_SIZE(standard_resources
); j
++) {
492 std_res
= standard_resources
[j
];
493 if (std_res
->start
< res
->start
||
494 std_res
->start
> res
->end
)
496 if (std_res
->end
> res
->end
) {
497 sub_res
= alloc_bootmem_low(sizeof(*sub_res
));
499 sub_res
->end
= res
->end
;
500 std_res
->start
= res
->end
+ 1;
501 request_resource(res
, sub_res
);
503 request_resource(res
, std_res
);
509 unsigned long real_memory_size
;
510 EXPORT_SYMBOL_GPL(real_memory_size
);
512 static void __init
setup_memory_end(void)
514 unsigned long vmax
, vmalloc_size
, tmp
;
518 #ifdef CONFIG_ZFCPDUMP
519 if (ipl_info
.type
== IPL_TYPE_FCP_DUMP
&& !OLDMEM_BASE
) {
520 memory_end
= ZFCPDUMP_HSA_SIZE
;
524 real_memory_size
= 0;
525 memory_end
&= PAGE_MASK
;
528 * Make sure all chunks are MAX_ORDER aligned so we don't need the
529 * extra checks that HOLES_IN_ZONE would require.
531 for (i
= 0; i
< MEMORY_CHUNKS
; i
++) {
532 unsigned long start
, end
;
533 struct mem_chunk
*chunk
;
536 chunk
= &memory_chunk
[i
];
537 align
= 1UL << (MAX_ORDER
+ PAGE_SHIFT
- 1);
538 start
= (chunk
->addr
+ align
- 1) & ~(align
- 1);
539 end
= (chunk
->addr
+ chunk
->size
) & ~(align
- 1);
541 memset(chunk
, 0, sizeof(*chunk
));
544 chunk
->size
= end
- start
;
546 real_memory_size
= max(real_memory_size
,
547 chunk
->addr
+ chunk
->size
);
550 /* Choose kernel address space layout: 2, 3, or 4 levels. */
552 vmalloc_size
= VMALLOC_END
?: (128UL << 30) - MODULES_LEN
;
553 tmp
= (memory_end
?: real_memory_size
) / PAGE_SIZE
;
554 tmp
= tmp
* (sizeof(struct page
) + PAGE_SIZE
) + vmalloc_size
;
555 if (tmp
<= (1UL << 42))
556 vmax
= 1UL << 42; /* 3-level kernel page table */
558 vmax
= 1UL << 53; /* 4-level kernel page table */
559 /* module area is at the end of the kernel address space. */
561 MODULES_VADDR
= MODULES_END
- MODULES_LEN
;
562 VMALLOC_END
= MODULES_VADDR
;
564 vmalloc_size
= VMALLOC_END
?: 96UL << 20;
565 vmax
= 1UL << 31; /* 2-level kernel page table */
566 /* vmalloc area is at the end of the kernel address space. */
569 VMALLOC_START
= vmax
- vmalloc_size
;
571 /* Split remaining virtual space between 1:1 mapping & vmemmap array */
572 tmp
= VMALLOC_START
/ (PAGE_SIZE
+ sizeof(struct page
));
573 tmp
= VMALLOC_START
- tmp
* sizeof(struct page
);
574 tmp
&= ~((vmax
>> 11) - 1); /* align to page table level */
575 tmp
= min(tmp
, 1UL << MAX_PHYSMEM_BITS
);
576 vmemmap
= (struct page
*) tmp
;
578 /* Take care that memory_end is set and <= vmemmap */
579 memory_end
= min(memory_end
?: real_memory_size
, tmp
);
581 /* Fixup memory chunk array to fit into 0..memory_end */
582 for (i
= 0; i
< MEMORY_CHUNKS
; i
++) {
583 struct mem_chunk
*chunk
= &memory_chunk
[i
];
585 if (chunk
->addr
>= memory_end
) {
586 memset(chunk
, 0, sizeof(*chunk
));
589 if (chunk
->addr
+ chunk
->size
> memory_end
)
590 chunk
->size
= memory_end
- chunk
->addr
;
594 static void __init
setup_vmcoreinfo(void)
596 mem_assign_absolute(S390_lowcore
.vmcore_info
, paddr_vmcoreinfo_note());
599 #ifdef CONFIG_CRASH_DUMP
602 * Find suitable location for crashkernel memory
604 static unsigned long __init
find_crash_base(unsigned long crash_size
,
607 unsigned long crash_base
;
608 struct mem_chunk
*chunk
;
611 if (memory_chunk
[0].size
< crash_size
) {
612 *msg
= "first memory chunk must be at least crashkernel size";
615 if (OLDMEM_BASE
&& crash_size
== OLDMEM_SIZE
)
618 for (i
= MEMORY_CHUNKS
- 1; i
>= 0; i
--) {
619 chunk
= &memory_chunk
[i
];
620 if (chunk
->size
== 0)
622 if (chunk
->type
!= CHUNK_READ_WRITE
)
624 if (chunk
->size
< crash_size
)
626 crash_base
= (chunk
->addr
+ chunk
->size
) - crash_size
;
627 if (crash_base
< crash_size
)
629 if (crash_base
< ZFCPDUMP_HSA_SIZE_MAX
)
631 if (crash_base
< (unsigned long) INITRD_START
+ INITRD_SIZE
)
635 *msg
= "no suitable area found";
640 * Check if crash_base and crash_size is valid
642 static int __init
verify_crash_base(unsigned long crash_base
,
643 unsigned long crash_size
,
646 struct mem_chunk
*chunk
;
650 * Because we do the swap to zero, we must have at least 'crash_size'
651 * bytes free space before crash_base
653 if (crash_size
> crash_base
) {
654 *msg
= "crashkernel offset must be greater than size";
658 /* First memory chunk must be at least crash_size */
659 if (memory_chunk
[0].size
< crash_size
) {
660 *msg
= "first memory chunk must be at least crashkernel size";
663 /* Check if we fit into the respective memory chunk */
664 for (i
= 0; i
< MEMORY_CHUNKS
; i
++) {
665 chunk
= &memory_chunk
[i
];
666 if (chunk
->size
== 0)
668 if (crash_base
< chunk
->addr
)
670 if (crash_base
>= chunk
->addr
+ chunk
->size
)
672 /* we have found the memory chunk */
673 if (crash_base
+ crash_size
> chunk
->addr
+ chunk
->size
) {
674 *msg
= "selected memory chunk is too small for "
675 "crashkernel memory";
680 *msg
= "invalid memory range specified";
685 * Reserve kdump memory by creating a memory hole in the mem_chunk array
687 static void __init
reserve_kdump_bootmem(unsigned long addr
, unsigned long size
,
690 create_mem_hole(memory_chunk
, addr
, size
, type
);
694 * When kdump is enabled, we have to ensure that no memory from
695 * the area [0 - crashkernel memory size] and
696 * [crashk_res.start - crashk_res.end] is set offline.
698 static int kdump_mem_notifier(struct notifier_block
*nb
,
699 unsigned long action
, void *data
)
701 struct memory_notify
*arg
= data
;
703 if (arg
->start_pfn
< PFN_DOWN(resource_size(&crashk_res
)))
705 if (arg
->start_pfn
> PFN_DOWN(crashk_res
.end
))
707 if (arg
->start_pfn
+ arg
->nr_pages
- 1 < PFN_DOWN(crashk_res
.start
))
712 static struct notifier_block kdump_mem_nb
= {
713 .notifier_call
= kdump_mem_notifier
,
719 * Make sure that oldmem, where the dump is stored, is protected
721 static void reserve_oldmem(void)
723 #ifdef CONFIG_CRASH_DUMP
727 reserve_kdump_bootmem(OLDMEM_BASE
, OLDMEM_SIZE
, CHUNK_OLDMEM
);
728 reserve_kdump_bootmem(OLDMEM_SIZE
, memory_end
- OLDMEM_SIZE
,
730 if (OLDMEM_BASE
+ OLDMEM_SIZE
== real_memory_size
)
731 saved_max_pfn
= PFN_DOWN(OLDMEM_BASE
) - 1;
733 saved_max_pfn
= PFN_DOWN(real_memory_size
) - 1;
738 * Reserve memory for kdump kernel to be loaded with kexec
740 static void __init
reserve_crashkernel(void)
742 #ifdef CONFIG_CRASH_DUMP
743 unsigned long long crash_base
, crash_size
;
747 rc
= parse_crashkernel(boot_command_line
, memory_end
, &crash_size
,
749 if (rc
|| crash_size
== 0)
751 crash_base
= ALIGN(crash_base
, KEXEC_CRASH_MEM_ALIGN
);
752 crash_size
= ALIGN(crash_size
, KEXEC_CRASH_MEM_ALIGN
);
753 if (register_memory_notifier(&kdump_mem_nb
))
756 crash_base
= find_crash_base(crash_size
, &msg
);
758 pr_info("crashkernel reservation failed: %s\n", msg
);
759 unregister_memory_notifier(&kdump_mem_nb
);
762 if (verify_crash_base(crash_base
, crash_size
, &msg
)) {
763 pr_info("crashkernel reservation failed: %s\n", msg
);
764 unregister_memory_notifier(&kdump_mem_nb
);
767 if (!OLDMEM_BASE
&& MACHINE_IS_VM
)
768 diag10_range(PFN_DOWN(crash_base
), PFN_DOWN(crash_size
));
769 crashk_res
.start
= crash_base
;
770 crashk_res
.end
= crash_base
+ crash_size
- 1;
771 insert_resource(&iomem_resource
, &crashk_res
);
772 reserve_kdump_bootmem(crash_base
, crash_size
, CHUNK_CRASHK
);
773 pr_info("Reserving %lluMB of memory at %lluMB "
774 "for crashkernel (System RAM: %luMB)\n",
775 crash_size
>> 20, crash_base
>> 20, memory_end
>> 20);
776 os_info_crashkernel_add(crash_base
, crash_size
);
780 static void __init
init_storage_keys(unsigned long start
, unsigned long end
)
782 unsigned long boundary
, function
, size
;
784 while (start
< end
) {
785 if (MACHINE_HAS_EDAT2
) {
786 /* set storage keys for a 2GB frame */
787 function
= 0x22000 | PAGE_DEFAULT_KEY
;
789 boundary
= (start
+ size
) & ~(size
- 1);
790 if (boundary
<= end
) {
792 start
= pfmf(function
, start
);
793 } while (start
< boundary
);
797 if (MACHINE_HAS_EDAT1
) {
798 /* set storage keys for a 1MB frame */
799 function
= 0x21000 | PAGE_DEFAULT_KEY
;
801 boundary
= (start
+ size
) & ~(size
- 1);
802 if (boundary
<= end
) {
804 start
= pfmf(function
, start
);
805 } while (start
< boundary
);
809 page_set_storage_key(start
, PAGE_DEFAULT_KEY
, 0);
814 static void __init
setup_memory(void)
816 unsigned long bootmap_size
;
817 unsigned long start_pfn
, end_pfn
;
821 * partially used pages are not usable - thus
822 * we are rounding upwards:
824 start_pfn
= PFN_UP(__pa(&_end
));
825 end_pfn
= max_pfn
= PFN_DOWN(memory_end
);
827 #ifdef CONFIG_BLK_DEV_INITRD
829 * Move the initrd in case the bitmap of the bootmem allocater
830 * would overwrite it.
833 if (INITRD_START
&& INITRD_SIZE
) {
834 unsigned long bmap_size
;
837 bmap_size
= bootmem_bootmap_pages(end_pfn
- start_pfn
+ 1);
838 bmap_size
= PFN_PHYS(bmap_size
);
840 if (PFN_PHYS(start_pfn
) + bmap_size
> INITRD_START
) {
841 start
= PFN_PHYS(start_pfn
) + bmap_size
+ PAGE_SIZE
;
843 #ifdef CONFIG_CRASH_DUMP
845 /* Move initrd behind kdump oldmem */
846 if (start
+ INITRD_SIZE
> OLDMEM_BASE
&&
847 start
< OLDMEM_BASE
+ OLDMEM_SIZE
)
848 start
= OLDMEM_BASE
+ OLDMEM_SIZE
;
851 if (start
+ INITRD_SIZE
> memory_end
) {
852 pr_err("initrd extends beyond end of "
853 "memory (0x%08lx > 0x%08lx) "
854 "disabling initrd\n",
855 start
+ INITRD_SIZE
, memory_end
);
856 INITRD_START
= INITRD_SIZE
= 0;
858 pr_info("Moving initrd (0x%08lx -> "
859 "0x%08lx, size: %ld)\n",
860 INITRD_START
, start
, INITRD_SIZE
);
861 memmove((void *) start
, (void *) INITRD_START
,
863 INITRD_START
= start
;
870 * Initialize the boot-time allocator
872 bootmap_size
= init_bootmem(start_pfn
, end_pfn
);
875 * Register RAM areas with the bootmem allocator.
878 for (i
= 0; i
< MEMORY_CHUNKS
&& memory_chunk
[i
].size
> 0; i
++) {
879 unsigned long start_chunk
, end_chunk
, pfn
;
881 if (memory_chunk
[i
].type
!= CHUNK_READ_WRITE
&&
882 memory_chunk
[i
].type
!= CHUNK_CRASHK
)
884 start_chunk
= PFN_DOWN(memory_chunk
[i
].addr
);
885 end_chunk
= start_chunk
+ PFN_DOWN(memory_chunk
[i
].size
);
886 end_chunk
= min(end_chunk
, end_pfn
);
887 if (start_chunk
>= end_chunk
)
889 memblock_add_node(PFN_PHYS(start_chunk
),
890 PFN_PHYS(end_chunk
- start_chunk
), 0);
891 pfn
= max(start_chunk
, start_pfn
);
892 init_storage_keys(PFN_PHYS(pfn
), PFN_PHYS(end_chunk
));
895 psw_set_key(PAGE_DEFAULT_KEY
);
897 free_bootmem_with_active_regions(0, max_pfn
);
900 * Reserve memory used for lowcore/command line/kernel image.
902 reserve_bootmem(0, (unsigned long)_ehead
, BOOTMEM_DEFAULT
);
903 reserve_bootmem((unsigned long)_stext
,
904 PFN_PHYS(start_pfn
) - (unsigned long)_stext
,
907 * Reserve the bootmem bitmap itself as well. We do this in two
908 * steps (first step was init_bootmem()) because this catches
909 * the (very unlikely) case of us accidentally initializing the
910 * bootmem allocator with an invalid RAM area.
912 reserve_bootmem(start_pfn
<< PAGE_SHIFT
, bootmap_size
,
915 #ifdef CONFIG_CRASH_DUMP
916 if (crashk_res
.start
)
917 reserve_bootmem(crashk_res
.start
,
918 crashk_res
.end
- crashk_res
.start
+ 1,
920 if (is_kdump_kernel())
921 reserve_bootmem(elfcorehdr_addr
- OLDMEM_BASE
,
922 PAGE_ALIGN(elfcorehdr_size
), BOOTMEM_DEFAULT
);
924 #ifdef CONFIG_BLK_DEV_INITRD
925 if (INITRD_START
&& INITRD_SIZE
) {
926 if (INITRD_START
+ INITRD_SIZE
<= memory_end
) {
927 reserve_bootmem(INITRD_START
, INITRD_SIZE
,
929 initrd_start
= INITRD_START
;
930 initrd_end
= initrd_start
+ INITRD_SIZE
;
932 pr_err("initrd extends beyond end of "
933 "memory (0x%08lx > 0x%08lx) "
934 "disabling initrd\n",
935 initrd_start
+ INITRD_SIZE
, memory_end
);
936 initrd_start
= initrd_end
= 0;
943 * Setup hardware capabilities.
945 static void __init
setup_hwcaps(void)
947 static const int stfl_bits
[6] = { 0, 2, 7, 17, 19, 21 };
952 * The store facility list bits numbers as found in the principles
953 * of operation are numbered with bit 1UL<<31 as number 0 to
954 * bit 1UL<<0 as number 31.
955 * Bit 0: instructions named N3, "backported" to esa-mode
956 * Bit 2: z/Architecture mode is active
957 * Bit 7: the store-facility-list-extended facility is installed
958 * Bit 17: the message-security assist is installed
959 * Bit 19: the long-displacement facility is installed
960 * Bit 21: the extended-immediate facility is installed
961 * Bit 22: extended-translation facility 3 is installed
962 * Bit 30: extended-translation facility 3 enhancement facility
963 * These get translated to:
964 * HWCAP_S390_ESAN3 bit 0, HWCAP_S390_ZARCH bit 1,
965 * HWCAP_S390_STFLE bit 2, HWCAP_S390_MSA bit 3,
966 * HWCAP_S390_LDISP bit 4, HWCAP_S390_EIMM bit 5 and
967 * HWCAP_S390_ETF3EH bit 8 (22 && 30).
969 for (i
= 0; i
< 6; i
++)
970 if (test_facility(stfl_bits
[i
]))
971 elf_hwcap
|= 1UL << i
;
973 if (test_facility(22) && test_facility(30))
974 elf_hwcap
|= HWCAP_S390_ETF3EH
;
977 * Check for additional facilities with store-facility-list-extended.
978 * stfle stores doublewords (8 byte) with bit 1ULL<<63 as bit 0
979 * and 1ULL<<0 as bit 63. Bits 0-31 contain the same information
980 * as stored by stfl, bits 32-xxx contain additional facilities.
981 * How many facility words are stored depends on the number of
982 * doublewords passed to the instruction. The additional facilities
984 * Bit 42: decimal floating point facility is installed
985 * Bit 44: perform floating point operation facility is installed
987 * HWCAP_S390_DFP bit 6 (42 && 44).
989 if ((elf_hwcap
& (1UL << 2)) && test_facility(42) && test_facility(44))
990 elf_hwcap
|= HWCAP_S390_DFP
;
993 * Huge page support HWCAP_S390_HPAGE is bit 7.
995 if (MACHINE_HAS_HPAGE
)
996 elf_hwcap
|= HWCAP_S390_HPAGE
;
998 #if defined(CONFIG_64BIT)
1000 * 64-bit register support for 31-bit processes
1001 * HWCAP_S390_HIGH_GPRS is bit 9.
1003 elf_hwcap
|= HWCAP_S390_HIGH_GPRS
;
1006 * Transactional execution support HWCAP_S390_TE is bit 10.
1008 if (test_facility(50) && test_facility(73))
1009 elf_hwcap
|= HWCAP_S390_TE
;
1012 get_cpu_id(&cpu_id
);
1013 switch (cpu_id
.machine
) {
1015 #if !defined(CONFIG_64BIT)
1016 default: /* Use "g5" as default for 31 bit kernels. */
1018 strcpy(elf_platform
, "g5");
1022 #if defined(CONFIG_64BIT)
1023 default: /* Use "z900" as default for 64 bit kernels. */
1025 strcpy(elf_platform
, "z900");
1029 strcpy(elf_platform
, "z990");
1033 strcpy(elf_platform
, "z9-109");
1037 strcpy(elf_platform
, "z10");
1041 strcpy(elf_platform
, "z196");
1047 * Setup function called from init/main.c just after the banner
1051 void __init
setup_arch(char **cmdline_p
)
1054 * print what head.S has found out about the machine
1056 #ifndef CONFIG_64BIT
1058 pr_info("Linux is running as a z/VM "
1059 "guest operating system in 31-bit mode\n");
1060 else if (MACHINE_IS_LPAR
)
1061 pr_info("Linux is running natively in 31-bit mode\n");
1062 if (MACHINE_HAS_IEEE
)
1063 pr_info("The hardware system has IEEE compatible "
1064 "floating point units\n");
1066 pr_info("The hardware system has no IEEE compatible "
1067 "floating point units\n");
1068 #else /* CONFIG_64BIT */
1070 pr_info("Linux is running as a z/VM "
1071 "guest operating system in 64-bit mode\n");
1072 else if (MACHINE_IS_KVM
)
1073 pr_info("Linux is running under KVM in 64-bit mode\n");
1074 else if (MACHINE_IS_LPAR
)
1075 pr_info("Linux is running natively in 64-bit mode\n");
1076 #endif /* CONFIG_64BIT */
1078 /* Have one command line that is parsed and saved in /proc/cmdline */
1079 /* boot_command_line has been already set up in early.c */
1080 *cmdline_p
= boot_command_line
;
1082 ROOT_DEV
= Root_RAM0
;
1084 init_mm
.start_code
= PAGE_OFFSET
;
1085 init_mm
.end_code
= (unsigned long) &_etext
;
1086 init_mm
.end_data
= (unsigned long) &_edata
;
1087 init_mm
.brk
= (unsigned long) &_end
;
1089 if (MACHINE_HAS_MVCOS
)
1090 memcpy(&uaccess
, &uaccess_mvcos
, sizeof(uaccess
));
1092 memcpy(&uaccess
, &uaccess_std
, sizeof(uaccess
));
1094 parse_early_param();
1099 setup_addressing_mode();
1101 reserve_crashkernel();
1108 s390_init_cpu_topology();
1111 * Setup capabilities (ELF_HWCAP & ELF_PLATFORM).
1116 * Create kernel page tables and switch to virtual addressing.
1120 /* Setup default console */
1122 set_preferred_console();
1124 /* Setup zfcpdump support */
1125 setup_zfcpdump(console_devno
);