2 #include <asm/e820/types.h>
3 #include <asm/processor.h>
9 * __force_order is used by special_insns.h asm code to force instruction
12 * It is not referenced from the code, but GCC < 5 with -fPIE would fail
13 * due to an undefined symbol. Define it to make these ancient GCCs work.
15 unsigned long __force_order
;
17 #define BIOS_START_MIN 0x20000U /* 128K, less than this is insane */
18 #define BIOS_START_MAX 0x9f000U /* 640K, absolute maximum */
20 struct paging_config
{
21 unsigned long trampoline_start
;
22 unsigned long l5_required
;
25 /* Buffer to preserve trampoline memory */
26 static char trampoline_save
[TRAMPOLINE_32BIT_SIZE
];
29 * Trampoline address will be printed by extract_kernel() for debugging
32 * Avoid putting the pointer into .bss as it will be cleared between
33 * paging_prepare() and extract_kernel().
35 unsigned long *trampoline_32bit
__section(.data
);
37 extern struct boot_params
*boot_params
;
38 int cmdline_find_option_bool(const char *option
);
40 static unsigned long find_trampoline_placement(void)
42 unsigned long bios_start
= 0, ebda_start
= 0;
43 struct boot_e820_entry
*entry
;
48 * Find a suitable spot for the trampoline.
49 * This code is based on reserve_bios_regions().
53 * EFI systems may not provide legacy ROM. The memory may not be mapped
56 * Only look for values in the legacy ROM for non-EFI system.
58 signature
= (char *)&boot_params
->efi_info
.efi_loader_signature
;
59 if (strncmp(signature
, EFI32_LOADER_SIGNATURE
, 4) &&
60 strncmp(signature
, EFI64_LOADER_SIGNATURE
, 4)) {
61 ebda_start
= *(unsigned short *)0x40e << 4;
62 bios_start
= *(unsigned short *)0x413 << 10;
65 if (bios_start
< BIOS_START_MIN
|| bios_start
> BIOS_START_MAX
)
66 bios_start
= BIOS_START_MAX
;
68 if (ebda_start
> BIOS_START_MIN
&& ebda_start
< bios_start
)
69 bios_start
= ebda_start
;
71 bios_start
= round_down(bios_start
, PAGE_SIZE
);
73 /* Find the first usable memory region under bios_start. */
74 for (i
= boot_params
->e820_entries
- 1; i
>= 0; i
--) {
75 unsigned long new = bios_start
;
77 entry
= &boot_params
->e820_table
[i
];
79 /* Skip all entries above bios_start. */
80 if (bios_start
<= entry
->addr
)
83 /* Skip non-RAM entries. */
84 if (entry
->type
!= E820_TYPE_RAM
)
87 /* Adjust bios_start to the end of the entry if needed. */
88 if (bios_start
> entry
->addr
+ entry
->size
)
89 new = entry
->addr
+ entry
->size
;
91 /* Keep bios_start page-aligned. */
92 new = round_down(new, PAGE_SIZE
);
94 /* Skip the entry if it's too small. */
95 if (new - TRAMPOLINE_32BIT_SIZE
< entry
->addr
)
98 /* Protect against underflow. */
99 if (new - TRAMPOLINE_32BIT_SIZE
> bios_start
)
106 /* Place the trampoline just below the end of low memory */
107 return bios_start
- TRAMPOLINE_32BIT_SIZE
;
110 struct paging_config
paging_prepare(void *rmode
)
112 struct paging_config paging_config
= {};
114 /* Initialize boot_params. Required for cmdline_find_option_bool(). */
118 * Check if LA57 is desired and supported.
120 * There are several parts to the check:
121 * - if the kernel supports 5-level paging: CONFIG_X86_5LEVEL=y
122 * - if user asked to disable 5-level paging: no5lvl in cmdline
123 * - if the machine supports 5-level paging:
124 * + CPUID leaf 7 is supported
125 * + the leaf has the feature bit set
127 * That's substitute for boot_cpu_has() in early boot code.
129 if (IS_ENABLED(CONFIG_X86_5LEVEL
) &&
130 !cmdline_find_option_bool("no5lvl") &&
131 native_cpuid_eax(0) >= 7 &&
132 (native_cpuid_ecx(7) & (1 << (X86_FEATURE_LA57
& 31)))) {
133 paging_config
.l5_required
= 1;
136 paging_config
.trampoline_start
= find_trampoline_placement();
138 trampoline_32bit
= (unsigned long *)paging_config
.trampoline_start
;
140 /* Preserve trampoline memory */
141 memcpy(trampoline_save
, trampoline_32bit
, TRAMPOLINE_32BIT_SIZE
);
143 /* Clear trampoline memory first */
144 memset(trampoline_32bit
, 0, TRAMPOLINE_32BIT_SIZE
);
146 /* Copy trampoline code in place */
147 memcpy(trampoline_32bit
+ TRAMPOLINE_32BIT_CODE_OFFSET
/ sizeof(unsigned long),
148 &trampoline_32bit_src
, TRAMPOLINE_32BIT_CODE_SIZE
);
151 * The code below prepares page table in trampoline memory.
153 * The new page table will be used by trampoline code for switching
154 * from 4- to 5-level paging or vice versa.
156 * If switching is not required, the page table is unused: trampoline
157 * code wouldn't touch CR3.
161 * We are not going to use the page table in trampoline memory if we
162 * are already in the desired paging mode.
164 if (paging_config
.l5_required
== !!(native_read_cr4() & X86_CR4_LA57
))
167 if (paging_config
.l5_required
) {
169 * For 4- to 5-level paging transition, set up current CR3 as
170 * the first and the only entry in a new top-level page table.
172 trampoline_32bit
[TRAMPOLINE_32BIT_PGTABLE_OFFSET
] = __native_read_cr3() | _PAGE_TABLE_NOENC
;
177 * For 5- to 4-level paging transition, copy page table pointed
178 * by first entry in the current top-level page table as our
179 * new top-level page table.
181 * We cannot just point to the page table from trampoline as it
184 src
= *(unsigned long *)__native_read_cr3() & PAGE_MASK
;
185 memcpy(trampoline_32bit
+ TRAMPOLINE_32BIT_PGTABLE_OFFSET
/ sizeof(unsigned long),
186 (void *)src
, PAGE_SIZE
);
190 return paging_config
;
193 void cleanup_trampoline(void *pgtable
)
195 void *trampoline_pgtable
;
197 trampoline_pgtable
= trampoline_32bit
+ TRAMPOLINE_32BIT_PGTABLE_OFFSET
/ sizeof(unsigned long);
200 * Move the top level page table out of trampoline memory,
203 if ((void *)__native_read_cr3() == trampoline_pgtable
) {
204 memcpy(pgtable
, trampoline_pgtable
, PAGE_SIZE
);
205 native_write_cr3((unsigned long)pgtable
);
208 /* Restore trampoline memory */
209 memcpy(trampoline_32bit
, trampoline_save
, TRAMPOLINE_32BIT_SIZE
);