1 // SPDX-License-Identifier: GPL-2.0-or-later
3 * Machine check exception handling CPU-side for power7 and power8
5 * Copyright 2013 IBM Corporation
6 * Author: Mahesh Salgaonkar <mahesh@linux.vnet.ibm.com>
10 #define pr_fmt(fmt) "mce_power: " fmt
12 #include <linux/types.h>
13 #include <linux/ptrace.h>
14 #include <linux/extable.h>
17 #include <asm/machdep.h>
18 #include <asm/pgtable.h>
19 #include <asm/pte-walk.h>
20 #include <asm/sstep.h>
21 #include <asm/exception-64s.h>
22 #include <asm/extable.h>
25 * Convert an address related to an mm to a PFN. NOTE: we are in real
26 * mode, we could potentially race with page table updates.
28 unsigned long addr_to_pfn(struct pt_regs
*regs
, unsigned long addr
)
32 unsigned long pfn
, flags
;
40 local_irq_save(flags
);
41 ptep
= __find_linux_pte(mm
->pgd
, addr
, NULL
, &shift
);
43 if (!ptep
|| pte_special(*ptep
)) {
48 if (shift
<= PAGE_SHIFT
)
51 unsigned long rpnmask
= (1ul << shift
) - PAGE_SIZE
;
52 pfn
= pte_pfn(__pte(pte_val(*ptep
) | (addr
& rpnmask
)));
56 local_irq_restore(flags
);
60 /* flush SLBs and reload */
61 #ifdef CONFIG_PPC_BOOK3S_64
62 void flush_and_reload_slb(void)
64 /* Invalidate all SLBs */
65 slb_flush_all_realmode();
67 #ifdef CONFIG_KVM_BOOK3S_HANDLER
69 * If machine check is hit when in guest or in transition, we will
70 * only flush the SLBs and continue.
72 if (get_paca()->kvm_hstate
.in_guest
)
75 if (early_radix_enabled())
79 * This probably shouldn't happen, but it may be possible it's
80 * called in early boot before SLB shadows are allocated.
82 if (!get_slb_shadow())
85 slb_restore_bolted_realmode();
89 static void flush_erat(void)
91 #ifdef CONFIG_PPC_BOOK3S_64
92 if (!early_cpu_has_feature(CPU_FTR_ARCH_300
)) {
93 flush_and_reload_slb();
97 asm volatile(PPC_ISA_3_0_INVALIDATE_ERAT
: : :"memory");
100 #define MCE_FLUSH_SLB 1
101 #define MCE_FLUSH_TLB 2
102 #define MCE_FLUSH_ERAT 3
104 static int mce_flush(int what
)
106 #ifdef CONFIG_PPC_BOOK3S_64
107 if (what
== MCE_FLUSH_SLB
) {
108 flush_and_reload_slb();
112 if (what
== MCE_FLUSH_ERAT
) {
116 if (what
== MCE_FLUSH_TLB
) {
124 #define SRR1_MC_LOADSTORE(srr1) ((srr1) & PPC_BIT(42))
126 struct mce_ierror_table
{
127 unsigned long srr1_mask
;
128 unsigned long srr1_value
;
129 bool nip_valid
; /* nip is a valid indicator of faulting address */
130 unsigned int error_type
;
131 unsigned int error_subtype
;
132 unsigned int error_class
;
133 unsigned int initiator
;
134 unsigned int severity
;
138 static const struct mce_ierror_table mce_p7_ierror_table
[] = {
139 { 0x00000000001c0000, 0x0000000000040000, true,
140 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_IFETCH
, MCE_ECLASS_HARDWARE
,
141 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
142 { 0x00000000001c0000, 0x0000000000080000, true,
143 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_PARITY
, MCE_ECLASS_HARD_INDETERMINATE
,
144 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
145 { 0x00000000001c0000, 0x00000000000c0000, true,
146 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
147 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
148 { 0x00000000001c0000, 0x0000000000100000, true,
149 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_INDETERMINATE
, /* BOTH */
150 MCE_ECLASS_SOFT_INDETERMINATE
,
151 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
152 { 0x00000000001c0000, 0x0000000000140000, true,
153 MCE_ERROR_TYPE_TLB
, MCE_TLB_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
154 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
155 { 0x00000000001c0000, 0x0000000000180000, true,
156 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_PAGE_TABLE_WALK_IFETCH
, MCE_ECLASS_HARDWARE
,
157 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
158 { 0x00000000001c0000, 0x00000000001c0000, true,
159 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_IFETCH
, MCE_ECLASS_HARDWARE
,
160 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
161 { 0, 0, 0, 0, 0, 0, 0 } };
163 static const struct mce_ierror_table mce_p8_ierror_table
[] = {
164 { 0x00000000081c0000, 0x0000000000040000, true,
165 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_IFETCH
, MCE_ECLASS_HARDWARE
,
166 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
167 { 0x00000000081c0000, 0x0000000000080000, true,
168 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_PARITY
, MCE_ECLASS_HARD_INDETERMINATE
,
169 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
170 { 0x00000000081c0000, 0x00000000000c0000, true,
171 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
172 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
173 { 0x00000000081c0000, 0x0000000000100000, true,
174 MCE_ERROR_TYPE_ERAT
, MCE_ERAT_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
175 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
176 { 0x00000000081c0000, 0x0000000000140000, true,
177 MCE_ERROR_TYPE_TLB
, MCE_TLB_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
178 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
179 { 0x00000000081c0000, 0x0000000000180000, true,
180 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_PAGE_TABLE_WALK_IFETCH
,
182 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
183 { 0x00000000081c0000, 0x00000000001c0000, true,
184 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_IFETCH
, MCE_ECLASS_HARDWARE
,
185 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
186 { 0x00000000081c0000, 0x0000000008000000, true,
187 MCE_ERROR_TYPE_LINK
, MCE_LINK_ERROR_IFETCH_TIMEOUT
, MCE_ECLASS_HARDWARE
,
188 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
189 { 0x00000000081c0000, 0x0000000008040000, true,
190 MCE_ERROR_TYPE_LINK
,MCE_LINK_ERROR_PAGE_TABLE_WALK_IFETCH_TIMEOUT
,
192 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
193 { 0, 0, 0, 0, 0, 0, 0 } };
195 static const struct mce_ierror_table mce_p9_ierror_table
[] = {
196 { 0x00000000081c0000, 0x0000000000040000, true,
197 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_IFETCH
, MCE_ECLASS_HARDWARE
,
198 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
199 { 0x00000000081c0000, 0x0000000000080000, true,
200 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_PARITY
, MCE_ECLASS_HARD_INDETERMINATE
,
201 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
202 { 0x00000000081c0000, 0x00000000000c0000, true,
203 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
204 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
205 { 0x00000000081c0000, 0x0000000000100000, true,
206 MCE_ERROR_TYPE_ERAT
, MCE_ERAT_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
207 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
208 { 0x00000000081c0000, 0x0000000000140000, true,
209 MCE_ERROR_TYPE_TLB
, MCE_TLB_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
210 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
211 { 0x00000000081c0000, 0x0000000000180000, true,
212 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_PAGE_TABLE_WALK_IFETCH
, MCE_ECLASS_HARDWARE
,
213 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
214 { 0x00000000081c0000, 0x00000000001c0000, true,
215 MCE_ERROR_TYPE_RA
, MCE_RA_ERROR_IFETCH_FOREIGN
, MCE_ECLASS_SOFTWARE
,
216 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
217 { 0x00000000081c0000, 0x0000000008000000, true,
218 MCE_ERROR_TYPE_LINK
, MCE_LINK_ERROR_IFETCH_TIMEOUT
, MCE_ECLASS_HARDWARE
,
219 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
220 { 0x00000000081c0000, 0x0000000008040000, true,
221 MCE_ERROR_TYPE_LINK
,MCE_LINK_ERROR_PAGE_TABLE_WALK_IFETCH_TIMEOUT
,
223 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
224 { 0x00000000081c0000, 0x00000000080c0000, true,
225 MCE_ERROR_TYPE_RA
, MCE_RA_ERROR_IFETCH
, MCE_ECLASS_SOFTWARE
,
226 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
227 { 0x00000000081c0000, 0x0000000008100000, true,
228 MCE_ERROR_TYPE_RA
, MCE_RA_ERROR_PAGE_TABLE_WALK_IFETCH
, MCE_ECLASS_SOFTWARE
,
229 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
230 { 0x00000000081c0000, 0x0000000008140000, false,
231 MCE_ERROR_TYPE_RA
, MCE_RA_ERROR_STORE
, MCE_ECLASS_HARDWARE
,
232 MCE_INITIATOR_CPU
, MCE_SEV_FATAL
, false }, /* ASYNC is fatal */
233 { 0x00000000081c0000, 0x0000000008180000, false,
234 MCE_ERROR_TYPE_LINK
,MCE_LINK_ERROR_STORE_TIMEOUT
,
235 MCE_INITIATOR_CPU
, MCE_SEV_FATAL
, false }, /* ASYNC is fatal */
236 { 0x00000000081c0000, 0x00000000081c0000, true, MCE_ECLASS_HARDWARE
,
237 MCE_ERROR_TYPE_RA
, MCE_RA_ERROR_PAGE_TABLE_WALK_IFETCH_FOREIGN
,
238 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
239 { 0, 0, 0, 0, 0, 0, 0 } };
241 struct mce_derror_table
{
242 unsigned long dsisr_value
;
243 bool dar_valid
; /* dar is a valid indicator of faulting address */
244 unsigned int error_type
;
245 unsigned int error_subtype
;
246 unsigned int error_class
;
247 unsigned int initiator
;
248 unsigned int severity
;
252 static const struct mce_derror_table mce_p7_derror_table
[] = {
254 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_LOAD_STORE
, MCE_ECLASS_HARDWARE
,
255 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
257 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_PAGE_TABLE_WALK_LOAD_STORE
,
259 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
261 MCE_ERROR_TYPE_ERAT
, MCE_ERAT_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
262 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
264 MCE_ERROR_TYPE_TLB
, MCE_TLB_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
265 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
267 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
268 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
270 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_PARITY
, MCE_ECLASS_HARD_INDETERMINATE
,
271 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
273 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_INDETERMINATE
, /* BOTH */
274 MCE_ECLASS_HARD_INDETERMINATE
,
275 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
276 { 0, false, 0, 0, 0, 0, 0 } };
278 static const struct mce_derror_table mce_p8_derror_table
[] = {
280 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_LOAD_STORE
, MCE_ECLASS_HARDWARE
,
281 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
283 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_PAGE_TABLE_WALK_LOAD_STORE
,
285 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
287 MCE_ERROR_TYPE_LINK
, MCE_LINK_ERROR_LOAD_TIMEOUT
, MCE_ECLASS_HARDWARE
,
288 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
290 MCE_ERROR_TYPE_LINK
, MCE_LINK_ERROR_PAGE_TABLE_WALK_LOAD_STORE_TIMEOUT
,
292 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
294 MCE_ERROR_TYPE_ERAT
, MCE_ERAT_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
295 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
297 MCE_ERROR_TYPE_TLB
, MCE_TLB_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
298 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
300 MCE_ERROR_TYPE_ERAT
, MCE_ERAT_ERROR_MULTIHIT
, /* SECONDARY ERAT */
301 MCE_ECLASS_SOFT_INDETERMINATE
,
302 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
304 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_MULTIHIT
, /* Before PARITY */
305 MCE_ECLASS_SOFT_INDETERMINATE
,
306 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
308 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_PARITY
, MCE_ECLASS_HARD_INDETERMINATE
,
309 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
310 { 0, false, 0, 0, 0, 0, 0 } };
312 static const struct mce_derror_table mce_p9_derror_table
[] = {
314 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_LOAD_STORE
, MCE_ECLASS_HARDWARE
,
315 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
317 MCE_ERROR_TYPE_UE
, MCE_UE_ERROR_PAGE_TABLE_WALK_LOAD_STORE
,
319 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
321 MCE_ERROR_TYPE_LINK
, MCE_LINK_ERROR_LOAD_TIMEOUT
, MCE_ECLASS_HARDWARE
,
322 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
324 MCE_ERROR_TYPE_LINK
, MCE_LINK_ERROR_PAGE_TABLE_WALK_LOAD_STORE_TIMEOUT
,
326 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
328 MCE_ERROR_TYPE_ERAT
, MCE_ERAT_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
329 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
331 MCE_ERROR_TYPE_TLB
, MCE_TLB_ERROR_MULTIHIT
, MCE_ECLASS_SOFT_INDETERMINATE
,
332 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
334 MCE_ERROR_TYPE_USER
, MCE_USER_ERROR_TLBIE
, MCE_ECLASS_SOFTWARE
,
335 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
337 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_MULTIHIT
, /* Before PARITY */
338 MCE_ECLASS_SOFT_INDETERMINATE
,
339 MCE_INITIATOR_CPU
, MCE_SEV_WARNING
, true },
341 MCE_ERROR_TYPE_SLB
, MCE_SLB_ERROR_PARITY
, MCE_ECLASS_HARD_INDETERMINATE
,
342 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
344 MCE_ERROR_TYPE_RA
, MCE_RA_ERROR_LOAD
, MCE_ECLASS_HARDWARE
,
345 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
347 MCE_ERROR_TYPE_RA
, MCE_RA_ERROR_PAGE_TABLE_WALK_LOAD_STORE
,
349 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
351 MCE_ERROR_TYPE_RA
, MCE_RA_ERROR_PAGE_TABLE_WALK_LOAD_STORE_FOREIGN
,
353 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
355 MCE_ERROR_TYPE_RA
, MCE_RA_ERROR_LOAD_STORE_FOREIGN
, MCE_ECLASS_HARDWARE
,
356 MCE_INITIATOR_CPU
, MCE_SEV_SEVERE
, true },
357 { 0, false, 0, 0, 0, 0, 0 } };
359 static int mce_find_instr_ea_and_phys(struct pt_regs
*regs
, uint64_t *addr
,
363 * Carefully look at the NIP to determine
364 * the instruction to analyse. Reading the NIP
365 * in real-mode is tricky and can lead to recursive
369 unsigned long pfn
, instr_addr
;
370 struct instruction_op op
;
371 struct pt_regs tmp
= *regs
;
373 pfn
= addr_to_pfn(regs
, regs
->nip
);
374 if (pfn
!= ULONG_MAX
) {
375 instr_addr
= (pfn
<< PAGE_SHIFT
) + (regs
->nip
& ~PAGE_MASK
);
376 instr
= *(unsigned int *)(instr_addr
);
377 if (!analyse_instr(&op
, &tmp
, instr
)) {
378 pfn
= addr_to_pfn(regs
, op
.ea
);
380 *phys_addr
= (pfn
<< PAGE_SHIFT
);
384 * analyse_instr() might fail if the instruction
385 * is not a load/store, although this is unexpected
386 * for load/store errors or if we got the NIP
394 static int mce_handle_ierror(struct pt_regs
*regs
,
395 const struct mce_ierror_table table
[],
396 struct mce_error_info
*mce_err
, uint64_t *addr
,
399 uint64_t srr1
= regs
->msr
;
405 for (i
= 0; table
[i
].srr1_mask
; i
++) {
406 if ((srr1
& table
[i
].srr1_mask
) != table
[i
].srr1_value
)
409 /* attempt to correct the error */
410 switch (table
[i
].error_type
) {
411 case MCE_ERROR_TYPE_SLB
:
412 if (local_paca
->in_mce
== 1)
413 slb_save_contents(local_paca
->mce_faulty_slbs
);
414 handled
= mce_flush(MCE_FLUSH_SLB
);
416 case MCE_ERROR_TYPE_ERAT
:
417 handled
= mce_flush(MCE_FLUSH_ERAT
);
419 case MCE_ERROR_TYPE_TLB
:
420 handled
= mce_flush(MCE_FLUSH_TLB
);
424 /* now fill in mce_error_info */
425 mce_err
->error_type
= table
[i
].error_type
;
426 mce_err
->error_class
= table
[i
].error_class
;
427 switch (table
[i
].error_type
) {
428 case MCE_ERROR_TYPE_UE
:
429 mce_err
->u
.ue_error_type
= table
[i
].error_subtype
;
431 case MCE_ERROR_TYPE_SLB
:
432 mce_err
->u
.slb_error_type
= table
[i
].error_subtype
;
434 case MCE_ERROR_TYPE_ERAT
:
435 mce_err
->u
.erat_error_type
= table
[i
].error_subtype
;
437 case MCE_ERROR_TYPE_TLB
:
438 mce_err
->u
.tlb_error_type
= table
[i
].error_subtype
;
440 case MCE_ERROR_TYPE_USER
:
441 mce_err
->u
.user_error_type
= table
[i
].error_subtype
;
443 case MCE_ERROR_TYPE_RA
:
444 mce_err
->u
.ra_error_type
= table
[i
].error_subtype
;
446 case MCE_ERROR_TYPE_LINK
:
447 mce_err
->u
.link_error_type
= table
[i
].error_subtype
;
450 mce_err
->sync_error
= table
[i
].sync_error
;
451 mce_err
->severity
= table
[i
].severity
;
452 mce_err
->initiator
= table
[i
].initiator
;
453 if (table
[i
].nip_valid
) {
455 if (mce_err
->sync_error
&&
456 table
[i
].error_type
== MCE_ERROR_TYPE_UE
) {
459 if (get_paca()->in_mce
< MAX_MCE_DEPTH
) {
460 pfn
= addr_to_pfn(regs
, regs
->nip
);
461 if (pfn
!= ULONG_MAX
) {
471 mce_err
->error_type
= MCE_ERROR_TYPE_UNKNOWN
;
472 mce_err
->error_class
= MCE_ECLASS_UNKNOWN
;
473 mce_err
->severity
= MCE_SEV_SEVERE
;
474 mce_err
->initiator
= MCE_INITIATOR_CPU
;
475 mce_err
->sync_error
= true;
480 static int mce_handle_derror(struct pt_regs
*regs
,
481 const struct mce_derror_table table
[],
482 struct mce_error_info
*mce_err
, uint64_t *addr
,
485 uint64_t dsisr
= regs
->dsisr
;
492 for (i
= 0; table
[i
].dsisr_value
; i
++) {
493 if (!(dsisr
& table
[i
].dsisr_value
))
496 /* attempt to correct the error */
497 switch (table
[i
].error_type
) {
498 case MCE_ERROR_TYPE_SLB
:
499 if (local_paca
->in_mce
== 1)
500 slb_save_contents(local_paca
->mce_faulty_slbs
);
501 if (mce_flush(MCE_FLUSH_SLB
))
504 case MCE_ERROR_TYPE_ERAT
:
505 if (mce_flush(MCE_FLUSH_ERAT
))
508 case MCE_ERROR_TYPE_TLB
:
509 if (mce_flush(MCE_FLUSH_TLB
))
515 * Attempt to handle multiple conditions, but only return
516 * one. Ensure uncorrectable errors are first in the table
522 /* now fill in mce_error_info */
523 mce_err
->error_type
= table
[i
].error_type
;
524 mce_err
->error_class
= table
[i
].error_class
;
525 switch (table
[i
].error_type
) {
526 case MCE_ERROR_TYPE_UE
:
527 mce_err
->u
.ue_error_type
= table
[i
].error_subtype
;
529 case MCE_ERROR_TYPE_SLB
:
530 mce_err
->u
.slb_error_type
= table
[i
].error_subtype
;
532 case MCE_ERROR_TYPE_ERAT
:
533 mce_err
->u
.erat_error_type
= table
[i
].error_subtype
;
535 case MCE_ERROR_TYPE_TLB
:
536 mce_err
->u
.tlb_error_type
= table
[i
].error_subtype
;
538 case MCE_ERROR_TYPE_USER
:
539 mce_err
->u
.user_error_type
= table
[i
].error_subtype
;
541 case MCE_ERROR_TYPE_RA
:
542 mce_err
->u
.ra_error_type
= table
[i
].error_subtype
;
544 case MCE_ERROR_TYPE_LINK
:
545 mce_err
->u
.link_error_type
= table
[i
].error_subtype
;
548 mce_err
->sync_error
= table
[i
].sync_error
;
549 mce_err
->severity
= table
[i
].severity
;
550 mce_err
->initiator
= table
[i
].initiator
;
551 if (table
[i
].dar_valid
)
553 else if (mce_err
->sync_error
&&
554 table
[i
].error_type
== MCE_ERROR_TYPE_UE
) {
556 * We do a maximum of 4 nested MCE calls, see
557 * kernel/exception-64s.h
559 if (get_paca()->in_mce
< MAX_MCE_DEPTH
)
560 mce_find_instr_ea_and_phys(regs
, addr
,
569 mce_err
->error_type
= MCE_ERROR_TYPE_UNKNOWN
;
570 mce_err
->error_class
= MCE_ECLASS_UNKNOWN
;
571 mce_err
->severity
= MCE_SEV_SEVERE
;
572 mce_err
->initiator
= MCE_INITIATOR_CPU
;
573 mce_err
->sync_error
= true;
578 static long mce_handle_ue_error(struct pt_regs
*regs
,
579 struct mce_error_info
*mce_err
)
582 const struct exception_table_entry
*entry
;
584 entry
= search_kernel_exception_table(regs
->nip
);
586 mce_err
->ignore_event
= true;
587 regs
->nip
= extable_fixup(entry
);
592 * On specific SCOM read via MMIO we may get a machine check
593 * exception with SRR0 pointing inside opal. If that is the
594 * case OPAL may have recovery address to re-read SCOM data in
595 * different way and hence we can recover from this MC.
598 if (ppc_md
.mce_check_early_recovery
) {
599 if (ppc_md
.mce_check_early_recovery(regs
))
605 static long mce_handle_error(struct pt_regs
*regs
,
606 const struct mce_derror_table dtable
[],
607 const struct mce_ierror_table itable
[])
609 struct mce_error_info mce_err
= { 0 };
610 uint64_t addr
, phys_addr
= ULONG_MAX
;
611 uint64_t srr1
= regs
->msr
;
614 if (SRR1_MC_LOADSTORE(srr1
))
615 handled
= mce_handle_derror(regs
, dtable
, &mce_err
, &addr
,
618 handled
= mce_handle_ierror(regs
, itable
, &mce_err
, &addr
,
621 if (!handled
&& mce_err
.error_type
== MCE_ERROR_TYPE_UE
)
622 handled
= mce_handle_ue_error(regs
, &mce_err
);
624 save_mce_event(regs
, handled
, &mce_err
, regs
->nip
, addr
, phys_addr
);
629 long __machine_check_early_realmode_p7(struct pt_regs
*regs
)
631 /* P7 DD1 leaves top bits of DSISR undefined */
632 regs
->dsisr
&= 0x0000ffff;
634 return mce_handle_error(regs
, mce_p7_derror_table
, mce_p7_ierror_table
);
637 long __machine_check_early_realmode_p8(struct pt_regs
*regs
)
639 return mce_handle_error(regs
, mce_p8_derror_table
, mce_p8_ierror_table
);
642 long __machine_check_early_realmode_p9(struct pt_regs
*regs
)
645 * On POWER9 DD2.1 and below, it's possible to get a machine check
646 * caused by a paste instruction where only DSISR bit 25 is set. This
647 * will result in the MCE handler seeing an unknown event and the kernel
648 * crashing. An MCE that occurs like this is spurious, so we don't need
649 * to do anything in terms of servicing it. If there is something that
650 * needs to be serviced, the CPU will raise the MCE again with the
651 * correct DSISR so that it can be serviced properly. So detect this
652 * case and mark it as handled.
654 if (SRR1_MC_LOADSTORE(regs
->msr
) && regs
->dsisr
== 0x02000000)
657 return mce_handle_error(regs
, mce_p9_derror_table
, mce_p9_ierror_table
);