1 // SPDX-License-Identifier: GPL-2.0
2 #include <linux/init.h>
3 #include <linux/async.h>
5 #include <linux/slab.h>
6 #include <linux/types.h>
7 #include <linux/fcntl.h>
8 #include <linux/delay.h>
9 #include <linux/string.h>
10 #include <linux/dirent.h>
11 #include <linux/syscalls.h>
12 #include <linux/utime.h>
13 #include <linux/file.h>
14 #include <linux/kstrtox.h>
15 #include <linux/memblock.h>
17 #include <linux/namei.h>
18 #include <linux/init_syscalls.h>
19 #include <linux/umh.h>
20 #include <linux/security.h>
22 #include "do_mounts.h"
/*
 * Checksum bookkeeping for the entry being unpacked.  csum_present is
 * cleared by do_header() for the 070701 magic, and do_copy() compares
 * io_csum against the header value hdr_csum when csum_present is set.
 */
24 static __initdata
bool csum_present
;
25 static __initdata u32 io_csum
;
/*
 * xwrite() - write count bytes from p to file at *pos using kernel_write().
 *
 * Visible on these lines: the kernel_write() result rv is tested against
 * -EINTR and -EAGAIN, the function can return the running total out in
 * preference to rv, and a for loop iterates over the rv bytes just written.
 * NOTE(review): the enclosing loop, the body of the for loop and the brace
 * lines are not present in this listing, so the retry policy and whatever
 * is done per byte (presumably checksum accumulation) must be confirmed
 * against the full file.
 */
27 static ssize_t __init
xwrite(struct file
*file
, const unsigned char *p
,
28 size_t count
, loff_t
*pos
)
32 /* sys_write can write at most MAX_RW_COUNT (aka 2G-4K) bytes per call */
34 ssize_t rv
= kernel_write(file
, p
, count
, pos
);
37 if (rv
== -EINTR
|| rv
== -EAGAIN
)
39 return out
? out
: rv
;
46 for (i
= 0; i
< rv
; i
++)
/*
 * message holds the error text for the current unpack; the loops in
 * flush_buffer() and unpack_to_rootfs() only keep running while it is NULL.
 *
 * error() takes the message string x.
 * NOTE(review): the body of error() is not present in this listing;
 * presumably it stores x in message - confirm.
 */
58 static __initdata
char *message
;
59 static void __init
error(char *x
)
/*
 * panic_show_mem() - call show_mem() and then panic() with the given format
 * and arguments.  Written as a statement expression so it can be used
 * wherever a single statement is expected.
 */
65 #define panic_show_mem(fmt, ...) \
66 ({ show_mem(); panic(fmt, ##__VA_ARGS__); })
/*
 * N_ALIGN(len) - padded length of a name field: (len + 1) rounded down to a
 * multiple of 4, plus 2.  The result is always >= len and congruent to 2
 * modulo 4.
 * NOTE(review): presumably chosen so that the 110-byte header plus the
 * padded name ends on a 4-byte boundary - confirm.
 */
70 #define N_ALIGN(len) ((((len) + 1) & ~3) + 2)
/*
 * Hard-link tracking entry, identified by ino/minor/major, with the path
 * name stored inline in a buffer of N_ALIGN(PATH_MAX) bytes.
 * NOTE(review): find_link() and free_hash() also use ->mode, ->next and a
 * head table; those declarations and the closing brace are on lines that
 * are not present in this listing.
 */
72 static __initdata
struct hash
{
73 int ino
, minor
, major
;
76 char name
[N_ALIGN(PATH_MAX
)];
/*
 * hash() - bucket hash for a (major, minor, ino) triple.  The visible line
 * seeds tmp with ino + minor + (major << 3).
 * NOTE(review): the remaining mixing and the return statement are not
 * present in this listing; free_hash() walks 32 buckets, so the result is
 * presumably reduced to the range 0..31 - confirm.
 */
79 static inline int hash(int major
, int minor
, int ino
)
81 unsigned long tmp
= ino
+ minor
+ (major
<< 3);
/*
 * find_link() - look up an inode in the hard-link table.
 *
 * Walks the chain at head + hash(major, minor, ino).  On the visible lines
 * an entry is tested for a different minor, a different major, and a
 * different file type (S_IFMT bits of mode).  After the walk a new
 * struct hash is allocated with kmalloc() (panic_show_mem() reports
 * allocation failure) and name is copied into it with strcpy().
 *
 * NOTE(review): the ino comparison, the actions taken on each test and all
 * return statements are not present in this listing.  strcpy() is
 * unbounded, so it relies on name fitting in q->name
 * (N_ALIGN(PATH_MAX) bytes) - verify that every caller guarantees this.
 */
86 static char __init
*find_link(int major
, int minor
, int ino
,
87 umode_t mode
, char *name
)
90 for (p
= head
+ hash(major
, minor
, ino
); *p
; p
= &(*p
)->next
) {
93 if ((*p
)->minor
!= minor
)
95 if ((*p
)->major
!= major
)
97 if (((*p
)->mode
^ mode
) & S_IFMT
)
101 q
= kmalloc(sizeof(struct hash
), GFP_KERNEL
);
103 panic_show_mem("can't allocate link hash entry");
108 strcpy(q
->name
, name
);
/*
 * free_hash() - iterate over all 32 buckets of the head table.
 * NOTE(review): the per-bucket statements are not present in this listing;
 * presumably each chain is freed and the bucket reset - confirm.
 */
114 static void __init
free_hash(void)
117 for (p
= head
; p
< head
+ 32; p
++) {
126 #ifdef CONFIG_INITRAMFS_PRESERVE_MTIME
/*
 * do_utime() - set the timestamps of filename from mtime.
 *
 * Builds a two-entry timespec64 array whose tv_sec fields both equal mtime
 * (the other fields are zero-initialised) and passes it to init_utimes().
 */
127 static void __init
do_utime(char *filename
, time64_t mtime
)
129 struct timespec64 t
[2] = { { .tv_sec
= mtime
}, { .tv_sec
= mtime
} };
130 init_utimes(filename
, t
);
/*
 * do_utime_path() - variant of do_utime() that takes a struct path.
 *
 * Builds the same two-entry timespec64 array from mtime.
 * NOTE(review): the call that applies the array to path is not present in
 * this listing.
 */
133 static void __init
do_utime_path(const struct path
*path
, time64_t mtime
)
135 struct timespec64 t
[2] = { { .tv_sec
= mtime
}, { .tv_sec
= mtime
} };
/*
 * dir_list collects the directories recorded by dir_add(); dir_utime()
 * later walks it and calls do_utime() for each entry.
 * The list member below is used as the linkage of struct dir_entry (see
 * dir_add()).
 * NOTE(review): the struct header and its other members (name and mtime
 * are used elsewhere) are not present in this listing.
 */
139 static __initdata
LIST_HEAD(dir_list
);
141 struct list_head list
;
/*
 * dir_add() - remember a directory so its mtime can be applied later.
 *
 * Allocates a struct dir_entry plus strlen(name) + 1 extra bytes so the
 * name is stored inline, reports allocation failure with panic_show_mem(),
 * copies name with strscpy() bounded by that length, and links the entry
 * into dir_list with list_add().
 * NOTE(review): the NULL test on de and the store of mtime into the entry
 * are not present in this listing.
 */
146 static void __init
dir_add(const char *name
, time64_t mtime
)
148 size_t nlen
= strlen(name
) + 1;
149 struct dir_entry
*de
;
151 de
= kmalloc(sizeof(struct dir_entry
) + nlen
, GFP_KERNEL
);
153 panic_show_mem("can't allocate dir_entry buffer");
154 INIT_LIST_HEAD(&de
->list
);
155 strscpy(de
->name
, name
, nlen
);
157 list_add(&de
->list
, &dir_list
);
/*
 * dir_utime() - apply the recorded mtime to every directory on dir_list by
 * calling do_utime(de->name, de->mtime).
 * The _safe list iterator is used.
 * NOTE(review): presumably entries are unlinked and freed inside the loop,
 * but those lines are not present in this listing.
 */
160 static void __init
dir_utime(void)
162 struct dir_entry
*de
, *tmp
;
163 list_for_each_entry_safe(de
, tmp
, &dir_list
, list
) {
165 do_utime(de
->name
, de
->mtime
);
/*
 * Empty versions of the four mtime helpers; each has the same signature as
 * its counterpart above and does nothing.
 * NOTE(review): presumably the alternative branch of the
 * CONFIG_INITRAMFS_PRESERVE_MTIME conditional; the #else and #endif lines
 * are not present in this listing.
 */
170 static void __init
do_utime(char *filename
, time64_t mtime
) {}
171 static void __init
do_utime_path(const struct path
*path
, time64_t mtime
) {}
172 static void __init
dir_add(const char *name
, time64_t mtime
) {}
173 static void __init
dir_utime(void) {}
/*
 * File-scope copies of the fields of the cpio header currently being
 * processed.  parse_header() visibly assigns mtime, body_len, rdev,
 * name_len and hdr_csum.
 * NOTE(review): the assignments of the remaining variables are on lines not
 * present in this listing.
 */
176 static __initdata time64_t mtime
;
178 /* cpio header parsing */
180 static __initdata
unsigned long ino
, major
, minor
, nlink
;
181 static __initdata umode_t mode
;
182 static __initdata
unsigned long body_len
, name_len
;
183 static __initdata uid_t uid
;
184 static __initdata gid_t gid
;
185 static __initdata
unsigned rdev
;
186 static __initdata u32 hdr_csum
;
/*
 * parse_header() - decode the numeric fields of a cpio header.
 *
 * Skips the 6-byte magic (s += 6) and converts 13 consecutive 8-character
 * fields (s += 8 per field) as base-16 numbers with simple_strtoul().  The
 * visible assignments are:
 *   parsed[5]           -> mtime
 *   parsed[6]           -> body_len
 *   parsed[9], [10]     -> rdev, via new_encode_dev(MKDEV())
 *   parsed[11]          -> name_len
 *   parsed[12]          -> hdr_csum
 * NOTE(review): the copy of each field into buf and the assignments from
 * the other parsed[] slots are not present in this listing.
 */
188 static void __init
parse_header(char *s
)
190 unsigned long parsed
[13];
195 for (i
= 0, s
+= 6; i
< 13; i
++, s
+= 8) {
197 parsed
[i
] = simple_strtoul(buf
, NULL
, 16);
204 mtime
= parsed
[5]; /* breaks in y2106 */
205 body_len
= parsed
[6];
208 rdev
= new_encode_dev(MKDEV(parsed
[9], parsed
[10]));
209 name_len
= parsed
[11];
210 hdr_csum
= parsed
[12];
/*
 * Unpacker state.  victim is the read pointer into the input (it is the
 * memcpy() source in do_collect()), byte_count is compared against
 * requested sizes and subtracted from len in write_buffer(), and
 * this_header / next_header are archive offsets used by do_header() and
 * do_skip().
 * NOTE(review): the enumerators of enum state and the variables declared
 * with it are on lines not present in this listing.
 */
215 static __initdata
enum state
{
226 static __initdata
char *victim
;
227 static unsigned long byte_count __initdata
;
228 static __initdata loff_t this_header
, next_header
;
/*
 * eat() - consume n bytes of input.
 * NOTE(review): the body is not present in this listing; presumably it
 * advances victim and this_header and decreases byte_count - confirm.
 */
230 static inline void __init
eat(unsigned n
)
/*
 * Collection state shared by read_into() and do_collect(): collected is the
 * start of the destination buffer, collect is the memcpy() destination, and
 * remains is the count that do_collect() decrements.
 */
237 static __initdata
char *collected
;
238 static long remains __initdata
;
239 static __initdata
char *collect
;
/*
 * read_into() - obtain size bytes of input and continue in state next.
 *
 * Visible here: a test for byte_count >= size (enough input already
 * available) and an assignment pointing both collect and collected at buf.
 * NOTE(review): the statements of both branches, including how next is
 * recorded, are only partly present in this listing.
 */
241 static void __init
read_into(char *buf
, unsigned size
, enum state next
)
243 if (byte_count
>= size
) {
248 collect
= collected
= buf
;
/*
 * Scratch buffers allocated with kmalloc() in unpack_to_rootfs(): header_buf
 * (110 bytes), symlink_buf (PATH_MAX + N_ALIGN(PATH_MAX) + 1 bytes) and
 * name_buf (N_ALIGN(PATH_MAX) bytes).
 */
255 static __initdata
char *header_buf
, *symlink_buf
, *name_buf
;
/*
 * do_start() - state handler that requests the 110-byte header into
 * header_buf and selects GotHeader as the following state.
 * NOTE(review): the return statement is not present in this listing.
 */
257 static int __init
do_start(void)
259 read_into(header_buf
, 110, GotHeader
);
/*
 * do_collect() - state handler that copies input into the collection
 * buffer.
 *
 * Starts from n = remains, copies n bytes from victim to collect with
 * memcpy(), subtracts n from remains and tests whether anything is still
 * outstanding.
 * NOTE(review): the clamp of n to the available input, the cursor updates
 * and the return values are not present in this listing.
 */
263 static int __init
do_collect(void)
265 unsigned long n
= remains
;
268 memcpy(collect
, victim
, n
);
271 if ((remains
-= n
) != 0)
/*
 * do_header() - state handler run once a full header has been collected.
 *
 * Magic check: 070701 clears csum_present; 070702 is accepted as a second
 * variant (its branch body is not visible); 070707 is rejected with the
 * message about the newc option; anything else is rejected as having no
 * cpio magic.
 *
 * After parse_header(), next_header is set to
 * this_header + N_ALIGN(name_len) + body_len and rounded up to a multiple
 * of 4.  name_len is range-checked against PATH_MAX.  One visible path
 * checks body_len against PATH_MAX and then collects
 * N_ALIGN(name_len) + body_len bytes into symlink_buf with GotSymlink as
 * the next state; another reads N_ALIGN(name_len) bytes into name_buf with
 * GotName as the next state when the entry is a regular file or has no
 * body.
 *
 * NOTE(review): name_len is unsigned long, so the name_len <= 0 test can
 * only ever match 0.  The condition selecting the symlink path, the actions
 * taken when a range check fails and the return statements are not present
 * in this listing.
 */
277 static int __init
do_header(void)
279 if (!memcmp(collected
, "070701", 6)) {
280 csum_present
= false;
281 } else if (!memcmp(collected
, "070702", 6)) {
284 if (memcmp(collected
, "070707", 6) == 0)
285 error("incorrect cpio method used: use -H newc option");
287 error("no cpio magic");
290 parse_header(collected
);
291 next_header
= this_header
+ N_ALIGN(name_len
) + body_len
;
292 next_header
= (next_header
+ 3) & ~3;
294 if (name_len
<= 0 || name_len
> PATH_MAX
)
297 if (body_len
> PATH_MAX
)
299 collect
= collected
= symlink_buf
;
300 remains
= N_ALIGN(name_len
) + body_len
;
301 next_state
= GotSymlink
;
305 if (S_ISREG(mode
) || !body_len
)
306 read_into(name_buf
, N_ALIGN(name_len
), GotName
);
/*
 * do_skip() - state handler that advances the input towards next_header.
 *
 * Tests whether the buffered input ends before next_header
 * (this_header + byte_count < next_header); the visible eat() call consumes
 * exactly next_header - this_header bytes.
 * NOTE(review): the statements inside the if branch and the return values
 * are not present in this listing.
 */
310 static int __init
do_skip(void)
312 if (this_header
+ byte_count
< next_header
) {
316 eat(next_header
- this_header
);
/*
 * do_reset() - state handler that loops while input remains and the current
 * byte is NUL, then reports broken padding if input remains and this_header
 * is not a multiple of 4.
 * NOTE(review): the loop body and return statement are not present in this
 * listing.
 */
322 static int __init
do_reset(void)
324 while (byte_count
&& *victim
== '\0')
326 if (byte_count
&& (this_header
& 3))
327 error("broken padding");
/*
 * clean_path() - deal with an existing object at path whose type conflicts
 * with fmode.
 *
 * Acts only when init_stat() with AT_SYMLINK_NOFOLLOW succeeds and the
 * S_IFMT bits of the existing mode differ from those of fmode; directories
 * are distinguished with S_ISDIR().
 * NOTE(review): the removal calls themselves are not present in this
 * listing.
 */
331 static void __init
clean_path(char *path
, umode_t fmode
)
335 if (!init_stat(path
, &st
, AT_SYMLINK_NOFOLLOW
) &&
336 (st
.mode
^ fmode
) & S_IFMT
) {
337 if (S_ISDIR(st
.mode
))
/*
 * maybe_link() - hard-link handling for the current entry.
 *
 * Looks up (major, minor, ino, mode) with collected as the name through
 * find_link().  On the visible linking path it calls
 * clean_path(collected, 0) and then returns -1 if init_link(old, collected)
 * fails and 1 otherwise.  do_name() treats a return of 0 as the case where
 * the node still has to be created.
 * NOTE(review): the conditions guarding these statements and the 0 return
 * are not present in this listing.
 */
344 static int __init
maybe_link(void)
347 char *old
= find_link(major
, minor
, ino
, mode
, collected
);
349 clean_path(collected
, 0);
350 return (init_link(old
, collected
) < 0) ? -1 : 1;
/*
 * Output file for the regular-file entry being written: wfile is opened in
 * do_name() and written by do_copy(), with wfile_pos passed to xwrite() as
 * the file position.
 */
356 static __initdata
struct file
*wfile
;
357 static __initdata loff_t wfile_pos
;
/*
 * do_name() - state handler run once the entry name has been collected.
 *
 * The name TRAILER!!! is special-cased (its handling is not visible).
 * Otherwise clean_path() is applied to the name with the entry mode, then:
 *  - file path: maybe_link() is consulted, the file is opened with
 *    O_WRONLY|O_CREAT|O_LARGEFILE (O_TRUNC is added on one path), ownership
 *    and mode are set with vfs_fchown()/vfs_fchmod(), and the file is sized
 *    to body_len with vfs_truncate();
 *  - directories: init_mkdir(), init_chown(), init_chmod(), then dir_add()
 *    so the mtime can be applied later;
 *  - block/char devices, FIFOs and sockets: only when maybe_link() returns
 *    0, init_mknod() followed by init_chown(), init_chmod() and do_utime().
 * On the visible lines the results of the init_* and vfs_* calls are not
 * checked.
 * NOTE(review): the condition that opens the file branch, the error check
 * after filp_open() and the state transitions are not present in this
 * listing.
 */
359 static int __init
do_name(void)
363 if (strcmp(collected
, "TRAILER!!!") == 0) {
367 clean_path(collected
, mode
);
369 int ml
= maybe_link();
371 int openflags
= O_WRONLY
|O_CREAT
|O_LARGEFILE
;
373 openflags
|= O_TRUNC
;
374 wfile
= filp_open(collected
, openflags
, mode
);
380 vfs_fchown(wfile
, uid
, gid
);
381 vfs_fchmod(wfile
, mode
);
383 vfs_truncate(&wfile
->f_path
, body_len
);
386 } else if (S_ISDIR(mode
)) {
387 init_mkdir(collected
, mode
);
388 init_chown(collected
, uid
, gid
, 0);
389 init_chmod(collected
, mode
);
390 dir_add(collected
, mtime
);
391 } else if (S_ISBLK(mode
) || S_ISCHR(mode
) ||
392 S_ISFIFO(mode
) || S_ISSOCK(mode
)) {
393 if (maybe_link() == 0) {
394 init_mknod(collected
, mode
, rdev
);
395 init_chown(collected
, uid
, gid
, 0);
396 init_chmod(collected
, mode
);
397 do_utime(collected
, mtime
);
/*
 * do_copy() - state handler that writes file data to wfile.
 *
 * When the buffered input covers the rest of the body
 * (byte_count >= body_len) it writes body_len bytes, applies mtime with
 * do_utime_path() and, if csum_present is set, compares io_csum with
 * hdr_csum.  Otherwise it writes all byte_count buffered bytes and reduces
 * body_len by that amount.  A short xwrite() result is reported as a write
 * error in both cases.
 * NOTE(review): closing of wfile, input consumption and the return values
 * are not present in this listing.
 */
403 static int __init
do_copy(void)
405 if (byte_count
>= body_len
) {
406 if (xwrite(wfile
, victim
, body_len
, &wfile_pos
) != body_len
)
407 error("write error");
409 do_utime_path(&wfile
->f_path
, mtime
);
411 if (csum_present
&& io_csum
!= hdr_csum
)
412 error("bad data checksum");
417 if (xwrite(wfile
, victim
, byte_count
, &wfile_pos
) != byte_count
)
418 error("write error");
419 body_len
-= byte_count
;
/*
 * do_symlink() - state handler that creates a symbolic link.
 *
 * The collected buffer holds the padded name followed by the link target.
 * The buffer is NUL-terminated at N_ALIGN(name_len) + body_len, any
 * conflicting object at the name is handled by clean_path(), the link is
 * created with the target at collected + N_ALIGN(name_len) and the link
 * path at collected, ownership is set with AT_SYMLINK_NOFOLLOW, and mtime
 * is applied with do_utime().
 * NOTE(review): the state transition and return statement are not present
 * in this listing.
 */
425 static int __init
do_symlink(void)
427 collected
[N_ALIGN(name_len
) + body_len
] = '\0';
428 clean_path(collected
, 0);
429 init_symlink(collected
+ N_ALIGN(name_len
), collected
);
430 init_chown(collected
, uid
, gid
, AT_SYMLINK_NOFOLLOW
);
431 do_utime(collected
, mtime
);
/*
 * State dispatch table indexed by enum state; write_buffer() calls
 * actions[state]() repeatedly.
 * NOTE(review): only four of the initialisers are present in this listing.
 */
437 static __initdata
int (*actions
[])(void) = {
439 [Collect
] = do_collect
,
440 [GotHeader
] = do_header
,
443 [CopyFile
] = do_copy
,
444 [GotSymlink
] = do_symlink
,
/*
 * write_buffer() - run the state machine over buf.
 *
 * Keeps calling the handler for the current state while it returns 0, then
 * returns len - byte_count.
 * NOTE(review): the setup of victim and byte_count from buf and len is not
 * present in this listing; the return value is presumably the number of
 * bytes consumed - confirm.
 */
448 static long __init
write_buffer(char *buf
, unsigned long len
)
453 while (!actions
[state
]())
455 return len
- byte_count
;
/*
 * flush_buffer() - output callback handed to the decompressor in
 * unpack_to_rootfs().
 *
 * Feeds the data to write_buffer() and, while less than len was consumed
 * and no error message is set, inspects the byte at the stop position.  One
 * outcome is the error about junk within the compressed archive.
 * NOTE(review): the handling of the inspected byte and the return value are
 * not present in this listing.
 */
458 static long __init
flush_buffer(void *bufv
, unsigned long len
)
465 while ((written
= write_buffer(buf
, len
)) < len
&& !message
) {
466 char c
= buf
[written
];
476 error("junk within compressed archive");
/* Added to saved_offset in unpack_to_rootfs() to compute the new this_header. */
481 static unsigned long my_inptr __initdata
; /* index of next byte to be processed in inbuf */
483 #include <linux/decompress/generic.h>
/*
 * unpack_to_rootfs() - unpack the archive data in buf (len bytes).
 *
 * Allocates header_buf, symlink_buf and name_buf and reports failure with
 * panic_show_mem().  The main loop runs while no error message is set and
 * input remains.  Data that starts with the character 0 at a 4-byte aligned
 * offset is passed directly to write_buffer().  Otherwise
 * decompress_method() selects a decompressor, which is run with
 * flush_buffer() as its output callback.  The visible error cases are:
 * decompressor failure, a recognised but unconfigured compression method
 * (message formatted into the static msg_buf), invalid magic at the start
 * of a compressed archive, and junk at its end.  After a compressed
 * segment this_header becomes saved_offset + my_inptr.
 *
 * NOTE(review): buffer release, advancing of buf and len and the return
 * value are not present in this listing; callers treat a non-NULL return
 * as an error string.
 */
485 static char * __init
unpack_to_rootfs(char *buf
, unsigned long len
)
488 decompress_fn decompress
;
489 const char *compress_name
;
490 static __initdata
char msg_buf
[64];
492 header_buf
= kmalloc(110, GFP_KERNEL
);
493 symlink_buf
= kmalloc(PATH_MAX
+ N_ALIGN(PATH_MAX
) + 1, GFP_KERNEL
);
494 name_buf
= kmalloc(N_ALIGN(PATH_MAX
), GFP_KERNEL
);
496 if (!header_buf
|| !symlink_buf
|| !name_buf
)
497 panic_show_mem("can't allocate buffers");
502 while (!message
&& len
) {
503 loff_t saved_offset
= this_header
;
504 if (*buf
== '0' && !(this_header
& 3)) {
506 written
= write_buffer(buf
, len
);
518 decompress
= decompress_method(buf
, len
, &compress_name
);
519 pr_debug("Detected %s compressed data\n", compress_name
);
521 int res
= decompress(buf
, len
, NULL
, flush_buffer
, NULL
,
524 error("decompressor failed");
525 } else if (compress_name
) {
527 snprintf(msg_buf
, sizeof msg_buf
,
528 "compression method %s not configured",
533 error("invalid magic at start of compressed archive");
535 error("junk at the end of compressed archive");
536 this_header
= saved_offset
+ my_inptr
;
/*
 * Handler for the retain_initrd boot parameter: sets do_retain_initrd,
 * which do_populate_rootfs() checks before freeing the initrd memory.
 * NOTE(review): any validation of str and the return value are not present
 * in this listing.
 */
547 static int __initdata do_retain_initrd
;
549 static int __init
retain_initrd_param(char *str
)
553 do_retain_initrd
= 1;
556 __setup("retain_initrd", retain_initrd_param
);
/*
 * Handler for the keepinitrd boot parameter, built only with
 * CONFIG_ARCH_HAS_KEEPINITRD; it sets the same do_retain_initrd flag as
 * retain_initrd.
 * NOTE(review): the return statement and the matching #endif are not
 * present in this listing.
 */
558 #ifdef CONFIG_ARCH_HAS_KEEPINITRD
559 static int __init
keepinitrd_setup(char *__unused
)
561 do_retain_initrd
= 1;
564 __setup("keepinitrd", keepinitrd_setup
);
/*
 * initramfs_async= boot parameter (default true).  The value is parsed with
 * kstrtobool(); the handler returns 1 when parsing succeeds and 0
 * otherwise.  populate_rootfs() waits for unpacking to finish when the flag
 * is false.
 */
567 static bool __initdata initramfs_async
= true;
568 static int __init
initramfs_async_setup(char *str
)
570 return kstrtobool(str
, &initramfs_async
) == 0;
572 __setup("initramfs_async=", initramfs_async_setup
);
/*
 * __initramfs_start and __initramfs_size describe the built-in initramfs
 * passed to unpack_to_rootfs() by do_populate_rootfs().
 * bin_attr_initrd is a mode-0440 binary sysfs attribute named initrd;
 * do_populate_rootfs() fills in its size and private pointer when the
 * initrd is retained.
 */
574 extern char __initramfs_start
[];
575 extern unsigned long __initramfs_size
;
576 #include <linux/initrd.h>
577 #include <linux/kexec.h>
579 static BIN_ATTR(initrd
, 0440, sysfs_bin_attr_simple_read
, NULL
, 0);
/*
 * reserve_initrd_mem() - reserve the memory of an initrd given by physical
 * address.
 *
 * Clears initrd_start and initrd_end, tests for phys_initrd_size being
 * zero, then rounds the region out to page boundaries.  The region must be
 * memory (memblock_is_region_memory) and must not already be reserved
 * (memblock_is_region_reserved); each failure is logged with pr_err().  On
 * success the region is reserved with memblock_reserve(), initrd_start and
 * initrd_end are set to the virtual addresses, and initrd_below_start_ok is
 * set to 1.
 *
 * NOTE(review): the first pr_err() format has no trailing newline while the
 * second one does, yet a single pr_cont() follows; check whether both
 * failure paths reach it.  The early return, the failure-path control flow
 * and the comment delimiters are not present in this listing.
 */
581 void __init
reserve_initrd_mem(void)
586 /* Ignore the virtual address computed during device tree parsing */
587 initrd_start
= initrd_end
= 0;
589 if (!phys_initrd_size
)
592 * Round the memory region to page boundaries as per free_initrd_mem()
593 * This allows us to detect whether the pages overlapping the initrd
594 * are in use, but more importantly, reserves the entire set of pages
595 * as we don't want these pages allocated for other purposes.
597 start
= round_down(phys_initrd_start
, PAGE_SIZE
);
598 size
= phys_initrd_size
+ (phys_initrd_start
- start
);
599 size
= round_up(size
, PAGE_SIZE
);
601 if (!memblock_is_region_memory(start
, size
)) {
602 pr_err("INITRD: 0x%08llx+0x%08lx is not a memory region",
607 if (memblock_is_region_reserved(start
, size
)) {
608 pr_err("INITRD: 0x%08llx+0x%08lx overlaps in-use memory region\n",
613 memblock_reserve(start
, size
);
614 /* Now convert initrd to virtual addresses */
615 initrd_start
= (unsigned long)__va(phys_initrd_start
);
616 initrd_end
= initrd_start
+ phys_initrd_size
;
617 initrd_below_start_ok
= 1;
621 pr_cont(" - disabling initrd\n");
/*
 * free_initrd_mem() - weak default for releasing the initrd range
 * [start, end).
 *
 * With CONFIG_ARCH_KEEP_MEMBLOCK the page-aligned range is first passed to
 * memblock_free().  The range is then handed to free_reserved_area() with
 * POISON_FREE_INITMEM.
 * NOTE(review): the #endif and the final argument of free_reserved_area()
 * are not present in this listing.
 */
626 void __weak __init
free_initrd_mem(unsigned long start
, unsigned long end
)
628 #ifdef CONFIG_ARCH_KEEP_MEMBLOCK
629 unsigned long aligned_start
= ALIGN_DOWN(start
, PAGE_SIZE
);
630 unsigned long aligned_end
= ALIGN(end
, PAGE_SIZE
);
632 memblock_free((void *)aligned_start
, aligned_end
- aligned_start
);
635 free_reserved_area((void *)start
, (void *)end
, POISON_FREE_INITMEM
,
/*
 * kexec_free_initrd() - free the initrd while sparing the crashkernel
 * reservation (built with CONFIG_CRASH_RESERVE).
 *
 * Converts crashk_res.start and crashk_res.end to virtual addresses and
 * tests whether the initrd range lies entirely outside that region.  On the
 * overlapping path the whole initrd range is zeroed with memset(), then
 * only the parts below crashk_start and above crashk_end are passed to
 * free_initrd_mem().
 * NOTE(review): the return statements are not present in this listing;
 * do_populate_rootfs() frees the whole range itself when this function
 * returns false.
 */
639 #ifdef CONFIG_CRASH_RESERVE
640 static bool __init
kexec_free_initrd(void)
642 unsigned long crashk_start
= (unsigned long)__va(crashk_res
.start
);
643 unsigned long crashk_end
= (unsigned long)__va(crashk_res
.end
);
646 * If the initrd region is overlapped with crashkernel reserved region,
647 * free only memory that is not part of crashkernel region.
649 if (initrd_start
>= crashk_end
|| initrd_end
<= crashk_start
)
653 * Initialize initrd memory region since the kexec boot does not do.
655 memset((void *)initrd_start
, 0, initrd_end
- initrd_start
);
656 if (initrd_start
< crashk_start
)
657 free_initrd_mem(initrd_start
, crashk_start
);
658 if (initrd_end
> crashk_end
)
659 free_initrd_mem(crashk_end
, initrd_end
);
/*
 * Inline fallback with the same signature as kexec_free_initrd() above.
 * NOTE(review): the body and the #else line are not present in this
 * listing.  The #endif comment previously named CONFIG_KEXEC_CORE, which
 * does not match the visible #ifdef CONFIG_CRASH_RESERVE.
 */
663 static inline bool kexec_free_initrd(void)
667 #endif /* CONFIG_CRASH_RESERVE */
/*
 * populate_initrd_image() - fallback used when the image is not an
 * initramfs (built with CONFIG_BLK_DEV_RAM).
 *
 * Logs the unpack error err, opens /initrd.image for writing (created with
 * mode 0700) and copies the whole initrd range into it with xwrite().  A
 * short write is logged with pr_err().
 * NOTE(review): the error check after filp_open(), the position argument
 * to xwrite() and the closing of the file are not present in this listing.
 */
669 #ifdef CONFIG_BLK_DEV_RAM
670 static void __init
populate_initrd_image(char *err
)
676 printk(KERN_INFO
"rootfs image is not initramfs (%s); looks like an initrd\n",
678 file
= filp_open("/initrd.image", O_WRONLY
|O_CREAT
|O_LARGEFILE
, 0700);
682 written
= xwrite(file
, (char *)initrd_start
, initrd_end
- initrd_start
,
684 if (written
!= initrd_end
- initrd_start
)
685 pr_err("/initrd.image: incomplete write (%zd != %ld)\n",
686 written
, initrd_end
- initrd_start
);
689 #endif /* CONFIG_BLK_DEV_RAM */
/*
 * do_populate_rootfs() - async worker that fills the root filesystem.
 *
 * 1. Unpacks the built-in initramfs; an error string from that step goes
 *    to panic_show_mem().
 * 2. If an external initrd exists and CONFIG_INITRAMFS_FORCE is not
 *    enabled, unpacks it as well.  On failure, populate_initrd_image() is
 *    called when CONFIG_BLK_DEV_RAM is set, and a KERN_EMERG message is
 *    printed on another path.
 * 3. Calls security_initramfs_populated().
 * 4. Frees the initrd memory unless do_retain_initrd is set (with
 *    kexec_free_initrd() given the first chance); when retained, exposes it
 *    through bin_attr_initrd under firmware_kobj.
 *
 * NOTE(review): the pr_err() message for the sysfs failure has no trailing
 * newline, unlike the other messages in this function; consider a code
 * fix.  Labels, gotos and the preprocessor else branches are not present in
 * this listing.
 */
691 static void __init
do_populate_rootfs(void *unused
, async_cookie_t cookie
)
693 /* Load the built in initramfs */
694 char *err
= unpack_to_rootfs(__initramfs_start
, __initramfs_size
);
696 panic_show_mem("%s", err
); /* Failed to decompress INTERNAL initramfs */
698 if (!initrd_start
|| IS_ENABLED(CONFIG_INITRAMFS_FORCE
))
701 if (IS_ENABLED(CONFIG_BLK_DEV_RAM
))
702 printk(KERN_INFO
"Trying to unpack rootfs image as initramfs...\n");
704 printk(KERN_INFO
"Unpacking initramfs...\n");
706 err
= unpack_to_rootfs((char *)initrd_start
, initrd_end
- initrd_start
);
708 #ifdef CONFIG_BLK_DEV_RAM
709 populate_initrd_image(err
);
711 printk(KERN_EMERG
"Initramfs unpacking failed: %s\n", err
);
716 security_initramfs_populated();
719 * If the initrd region is overlapped with crashkernel reserved region,
720 * free only memory that is not part of crashkernel region.
722 if (!do_retain_initrd
&& initrd_start
&& !kexec_free_initrd()) {
723 free_initrd_mem(initrd_start
, initrd_end
);
724 } else if (do_retain_initrd
&& initrd_start
) {
725 bin_attr_initrd
.size
= initrd_end
- initrd_start
;
726 bin_attr_initrd
.private = (void *)initrd_start
;
727 if (sysfs_create_bin_file(firmware_kobj
, &bin_attr_initrd
))
728 pr_err("Failed to create initrd sysfs file");
/*
 * Async domain and cookie for the unpack job: populate_rootfs() stores the
 * cookie returned by async_schedule_domain() and wait_for_initramfs()
 * synchronises on it.
 */
736 static ASYNC_DOMAIN_EXCLUSIVE(initramfs_domain
);
737 static async_cookie_t initramfs_cookie
;
/*
 * wait_for_initramfs() - block until the unpack job has finished.
 *
 * If no cookie has been recorded yet (the job has not been scheduled), a
 * one-time warning is printed.  Otherwise the function synchronises on
 * initramfs_cookie + 1 within initramfs_domain.  Exported with
 * EXPORT_SYMBOL_GPL.
 * NOTE(review): the early return after the warning is not present in this
 * listing.
 */
739 void wait_for_initramfs(void)
741 if (!initramfs_cookie
) {
743 * Something before rootfs_initcall wants to access
744 * the filesystem/initramfs. Probably a bug. Make a
745 * note, avoid deadlocking the machine, and let the
746 * caller's access fail as it used to.
748 pr_warn_once("wait_for_initramfs() called before rootfs_initcalls\n");
751 async_synchronize_cookie_domain(initramfs_cookie
+ 1, &initramfs_domain
);
753 EXPORT_SYMBOL_GPL(wait_for_initramfs
);
/*
 * populate_rootfs() - rootfs_initcall entry point.
 *
 * Schedules do_populate_rootfs() with async_schedule_domain() and records
 * the cookie, calls usermodehelper_enable(), and waits for the job with
 * wait_for_initramfs() when initramfs_async is false.
 * NOTE(review): the domain argument of the schedule call and the return
 * statement are not present in this listing.
 */
755 static int __init
populate_rootfs(void)
757 initramfs_cookie
= async_schedule_domain(do_populate_rootfs
, NULL
,
759 usermodehelper_enable();
760 if (!initramfs_async
)
761 wait_for_initramfs();
764 rootfs_initcall(populate_rootfs
);