/*
 * Machine check exception handling CPU-side for power7 and power8
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
 *
 * Copyright 2013 IBM Corporation
 * Author: Mahesh Salgaonkar <mahesh@linux.vnet.ibm.com>
 */

#define pr_fmt(fmt) "mce_power: " fmt

#include <linux/types.h>
#include <linux/ptrace.h>
#include <asm/mmu.h>
#include <asm/mce.h>
#include <asm/machdep.h>

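/*
 * Invalidate the entire TLB on a POWER ISA 2.06 (power7/power8) CPU by
 * issuing one tlbiel per congruence class: RB starts at the invalidation
 * value for set 0 and is stepped by 1 << TLBIEL_INVAL_SET_SHIFT until all
 * num_sets classes have been flushed. 'action' selects whether all
 * translations or only those of the current LPID are invalidated.
 */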
static void flush_tlb_206(unsigned int num_sets, unsigned int action)
{
        unsigned long rb;
        unsigned int i;

        switch (action) {
        case TLB_INVAL_SCOPE_GLOBAL:
                rb = TLBIEL_INVAL_SET;
                break;
        case TLB_INVAL_SCOPE_LPID:
                rb = TLBIEL_INVAL_SET_LPID;
                break;
        default:
                BUG();
                break;
        }

        asm volatile("ptesync" : : : "memory");
        for (i = 0; i < num_sets; i++) {
                asm volatile("tlbiel %0" : : "r" (rb));
                rb += 1 << TLBIEL_INVAL_SET_SHIFT;
        }
        asm volatile("ptesync" : : : "memory");
}

/*
 * Generic routine to flush the TLB on power7. This routine is used as
 * the flush_tlb hook in cpu_spec for the Power7 processor.
 *
 * action => TLB_INVAL_SCOPE_GLOBAL: Invalidate all TLBs.
 *           TLB_INVAL_SCOPE_LPID:   Invalidate TLB for the current LPID.
 */
void __flush_tlb_power7(unsigned int action)
{
        flush_tlb_206(POWER7_TLB_SETS, action);
}

/*
 * Generic routine to flush the TLB on power8. This routine is used as
 * the flush_tlb hook in cpu_spec for the Power8 processor.
 *
 * action => TLB_INVAL_SCOPE_GLOBAL: Invalidate all TLBs.
 *           TLB_INVAL_SCOPE_LPID:   Invalidate TLB for the current LPID.
 */
void __flush_tlb_power8(unsigned int action)
{
        flush_tlb_206(POWER8_TLB_SETS, action);
}

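/*
 * Both routines above are installed as the ->flush_tlb hook of the matching
 * cpu_spec entry; the machine check paths below reach them through
 * cur_cpu_spec->flush_tlb().
 */
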
/* flush SLBs and reload */
static void flush_and_reload_slb(void)
{
        struct slb_shadow *slb;
        unsigned long i, n;

        /* Invalidate all SLBs */
        asm volatile("slbmte %0,%0; slbia" : : "r" (0));

#ifdef CONFIG_KVM_BOOK3S_HANDLER
        /*
         * If the machine check hit while we were in a guest or in
         * transition to/from one, only flush the SLBs and continue.
         */
        if (get_paca()->kvm_hstate.in_guest)
                return;
#endif

        /* For the host kernel, reload the SLBs from the shadow SLB buffer. */
        slb = get_slb_shadow();
        if (!slb)
                return;

        n = min_t(u32, be32_to_cpu(slb->persistent), SLB_MIN_SIZE);

        /* Load up the SLB entries from the shadow SLB */
        for (i = 0; i < n; i++) {
                unsigned long rb = be64_to_cpu(slb->save_area[i].esid);
                unsigned long rs = be64_to_cpu(slb->save_area[i].vsid);

                /* The low 12 bits of RB carry the SLB entry index for slbmte */
                rb = (rb & ~0xFFFul) | i;
                asm volatile("slbmte %0,%1" : : "r" (rs), "r" (rb));
        }
}

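/*
 * Handle a data-side (load/store) machine check described by DSISR.
 * SLB errors are repaired by flushing and reloading the SLB, TLB multihits
 * by a full TLB flush. Returns 1 if every reported error bit was recognized
 * and handled, 0 if any unknown error bits remain.
 */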
static long mce_handle_derror(uint64_t dsisr, uint64_t slb_error_bits)
{
        long handled = 1;

        /*
         * Flush and reload SLBs for SLB errors and flush TLBs for TLB errors.
         * Reset the error bits whenever we handle them so that at the end we
         * can check whether we handled all of them or not.
         */
        if (dsisr & slb_error_bits) {
                flush_and_reload_slb();
                /* reset error bits */
                dsisr &= ~(slb_error_bits);
        }
        if (dsisr & P7_DSISR_MC_TLB_MULTIHIT_MFTLB) {
                if (cur_cpu_spec && cur_cpu_spec->flush_tlb)
                        cur_cpu_spec->flush_tlb(TLB_INVAL_SCOPE_GLOBAL);
                /* reset error bits */
                dsisr &= ~P7_DSISR_MC_TLB_MULTIHIT_MFTLB;
        }
        /* Any other errors we don't understand? */
        if (dsisr & 0xffffffffUL)
                handled = 0;

        return handled;
}

static long mce_handle_derror_p7(uint64_t dsisr)
{
        return mce_handle_derror(dsisr, P7_DSISR_MC_SLB_ERRORS);
}

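/*
 * Handle instruction-side machine checks common to power7 and power8,
 * keyed off the ifetch error code in SRR1. Returns 1 when the error was
 * handled (SLB flush/reload or TLB flush), 0 otherwise.
 */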
static long mce_handle_common_ierror(uint64_t srr1)
{
        long handled = 0;

        switch (P7_SRR1_MC_IFETCH(srr1)) {
        case 0:
                break;
        case P7_SRR1_MC_IFETCH_SLB_PARITY:
        case P7_SRR1_MC_IFETCH_SLB_MULTIHIT:
                /* flush and reload SLBs for SLB errors. */
                flush_and_reload_slb();
                handled = 1;
                break;
        case P7_SRR1_MC_IFETCH_TLB_MULTIHIT:
                if (cur_cpu_spec && cur_cpu_spec->flush_tlb) {
                        cur_cpu_spec->flush_tlb(TLB_INVAL_SCOPE_GLOBAL);
                        handled = 1;
                }
                break;
        default:
                break;
        }

        return handled;
}

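/*
 * power7-specific i-side handling: on top of the common cases this also
 * recovers the combined SLB parity/multihit code (SLB_BOTH) with an SLB
 * flush and reload.
 */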
static long mce_handle_ierror_p7(uint64_t srr1)
{
        long handled = 0;

        handled = mce_handle_common_ierror(srr1);

        if (P7_SRR1_MC_IFETCH(srr1) == P7_SRR1_MC_IFETCH_SLB_BOTH) {
                flush_and_reload_slb();
                handled = 1;
        }

        return handled;
}

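/*
 * Decode the SRR1 ifetch error code into a struct mce_error_info so the
 * event can be reported; this only classifies the error, recovery is done
 * by the handlers above.
 */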
static void mce_get_common_ierror(struct mce_error_info *mce_err, uint64_t srr1)
{
        switch (P7_SRR1_MC_IFETCH(srr1)) {
        case P7_SRR1_MC_IFETCH_SLB_PARITY:
                mce_err->error_type = MCE_ERROR_TYPE_SLB;
                mce_err->u.slb_error_type = MCE_SLB_ERROR_PARITY;
                break;
        case P7_SRR1_MC_IFETCH_SLB_MULTIHIT:
                mce_err->error_type = MCE_ERROR_TYPE_SLB;
                mce_err->u.slb_error_type = MCE_SLB_ERROR_MULTIHIT;
                break;
        case P7_SRR1_MC_IFETCH_TLB_MULTIHIT:
                mce_err->error_type = MCE_ERROR_TYPE_TLB;
                mce_err->u.tlb_error_type = MCE_TLB_ERROR_MULTIHIT;
                break;
        case P7_SRR1_MC_IFETCH_UE:
        case P7_SRR1_MC_IFETCH_UE_IFU_INTERNAL:
                mce_err->error_type = MCE_ERROR_TYPE_UE;
                mce_err->u.ue_error_type = MCE_UE_ERROR_IFETCH;
                break;
        case P7_SRR1_MC_IFETCH_UE_TLB_RELOAD:
                mce_err->error_type = MCE_ERROR_TYPE_UE;
                mce_err->u.ue_error_type =
                                MCE_UE_ERROR_PAGE_TABLE_WALK_IFETCH;
                break;
        }
}

static void mce_get_ierror_p7(struct mce_error_info *mce_err, uint64_t srr1)
{
        mce_get_common_ierror(mce_err, srr1);
        if (P7_SRR1_MC_IFETCH(srr1) == P7_SRR1_MC_IFETCH_SLB_BOTH) {
                mce_err->error_type = MCE_ERROR_TYPE_SLB;
                mce_err->u.slb_error_type = MCE_SLB_ERROR_INDETERMINATE;
        }
}

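/*
 * Decode DSISR for a load/store machine check. The bits are tested in
 * priority order, so an uncorrectable error (UE) is reported in preference
 * to the SLB/ERAT/TLB conditions when several bits are set.
 */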
static void mce_get_derror_p7(struct mce_error_info *mce_err, uint64_t dsisr)
{
        if (dsisr & P7_DSISR_MC_UE) {
                mce_err->error_type = MCE_ERROR_TYPE_UE;
                mce_err->u.ue_error_type = MCE_UE_ERROR_LOAD_STORE;
        } else if (dsisr & P7_DSISR_MC_UE_TABLEWALK) {
                mce_err->error_type = MCE_ERROR_TYPE_UE;
                mce_err->u.ue_error_type =
                                MCE_UE_ERROR_PAGE_TABLE_WALK_LOAD_STORE;
        } else if (dsisr & P7_DSISR_MC_ERAT_MULTIHIT) {
                mce_err->error_type = MCE_ERROR_TYPE_ERAT;
                mce_err->u.erat_error_type = MCE_ERAT_ERROR_MULTIHIT;
        } else if (dsisr & P7_DSISR_MC_SLB_MULTIHIT) {
                mce_err->error_type = MCE_ERROR_TYPE_SLB;
                mce_err->u.slb_error_type = MCE_SLB_ERROR_MULTIHIT;
        } else if (dsisr & P7_DSISR_MC_SLB_PARITY_MFSLB) {
                mce_err->error_type = MCE_ERROR_TYPE_SLB;
                mce_err->u.slb_error_type = MCE_SLB_ERROR_PARITY;
        } else if (dsisr & P7_DSISR_MC_TLB_MULTIHIT_MFTLB) {
                mce_err->error_type = MCE_ERROR_TYPE_TLB;
                mce_err->u.tlb_error_type = MCE_TLB_ERROR_MULTIHIT;
        } else if (dsisr & P7_DSISR_MC_SLB_MULTIHIT_PARITY) {
                mce_err->error_type = MCE_ERROR_TYPE_SLB;
                mce_err->u.slb_error_type = MCE_SLB_ERROR_INDETERMINATE;
        }
}

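/*
 * Uncorrectable errors cannot be fixed by flushing translation structures;
 * the only early recovery path is one supplied by firmware, checked via
 * ppc_md.mce_check_early_recovery(), as described below.
 */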
static long mce_handle_ue_error(struct pt_regs *regs)
{
        long handled = 0;

        /*
         * On a specific SCOM read via MMIO we may get a machine check
         * exception with SRR0 pointing inside OPAL. In that case OPAL may
         * have a recovery address that re-reads the SCOM data in a different
         * way, and hence we can recover from this MC.
         */
        if (ppc_md.mce_check_early_recovery) {
                if (ppc_md.mce_check_early_recovery(regs))
                        handled = 1;
        }
        return handled;
}

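/*
 * Early machine check handler for power7, run in real mode before normal
 * exception processing resumes. It attempts recovery, classifies the error
 * and logs it with save_mce_event().
 */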
long __machine_check_early_realmode_p7(struct pt_regs *regs)
{
        uint64_t srr1, nip, addr;
        long handled = 1;
        struct mce_error_info mce_error_info = { 0 };

        srr1 = regs->msr;
        nip = regs->nip;

        /*
         * Handle memory errors depending on whether this was a load/store or
         * an ifetch exception. Also populate the mce error_type and the
         * type-specific error_type, from either SRR1 or DSISR, depending on
         * which kind of exception it was.
         */
        if (P7_SRR1_MC_LOADSTORE(srr1)) {
                handled = mce_handle_derror_p7(regs->dsisr);
                mce_get_derror_p7(&mce_error_info, regs->dsisr);
                addr = regs->dar;
        } else {
                handled = mce_handle_ierror_p7(srr1);
                mce_get_ierror_p7(&mce_error_info, srr1);
                addr = regs->nip;
        }

        /* Handle UE error. */
        if (mce_error_info.error_type == MCE_ERROR_TYPE_UE)
                handled = mce_handle_ue_error(regs);

        save_mce_event(regs, handled, &mce_error_info, nip, addr);
        return handled;
}

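/*
 * The power8 variants below reuse the power7/common decode and recovery
 * paths and add handling for the P8-specific ERAT multihit conditions.
 */
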
static void mce_get_ierror_p8(struct mce_error_info *mce_err, uint64_t srr1)
{
        mce_get_common_ierror(mce_err, srr1);
        if (P7_SRR1_MC_IFETCH(srr1) == P8_SRR1_MC_IFETCH_ERAT_MULTIHIT) {
                mce_err->error_type = MCE_ERROR_TYPE_ERAT;
                mce_err->u.erat_error_type = MCE_ERAT_ERROR_MULTIHIT;
        }
}

static void mce_get_derror_p8(struct mce_error_info *mce_err, uint64_t dsisr)
{
        mce_get_derror_p7(mce_err, dsisr);
        if (dsisr & P8_DSISR_MC_ERAT_MULTIHIT_SEC) {
                mce_err->error_type = MCE_ERROR_TYPE_ERAT;
                mce_err->u.erat_error_type = MCE_ERAT_ERROR_MULTIHIT;
        }
}

static long mce_handle_ierror_p8(uint64_t srr1)
{
        long handled = 0;

        handled = mce_handle_common_ierror(srr1);
        if (P7_SRR1_MC_IFETCH(srr1) == P8_SRR1_MC_IFETCH_ERAT_MULTIHIT) {
                flush_and_reload_slb();
                handled = 1;
        }
        return handled;
}

static long mce_handle_derror_p8(uint64_t dsisr)
{
        return mce_handle_derror(dsisr, P8_DSISR_MC_SLB_ERRORS);
}

long __machine_check_early_realmode_p8(struct pt_regs *regs)
{
        uint64_t srr1, nip, addr;
        long handled = 1;
        struct mce_error_info mce_error_info = { 0 };

        srr1 = regs->msr;
        nip = regs->nip;

        if (P7_SRR1_MC_LOADSTORE(srr1)) {
                handled = mce_handle_derror_p8(regs->dsisr);
                mce_get_derror_p8(&mce_error_info, regs->dsisr);
                addr = regs->dar;
        } else {
                handled = mce_handle_ierror_p8(srr1);
                mce_get_ierror_p8(&mce_error_info, srr1);
                addr = regs->nip;
        }

        /* Handle UE error. */
        if (mce_error_info.error_type == MCE_ERROR_TYPE_UE)
                handled = mce_handle_ue_error(regs);

        save_mce_event(regs, handled, &mce_error_info, nip, addr);
        return handled;
}

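/*
 * These entry points are wired into the per-CPU cpu_spec (see cputable.c),
 * roughly along these lines (illustrative only, not copied from cputable.c):
 *
 *      .flush_tlb              = __flush_tlb_power8,
 *      .machine_check_early    = __machine_check_early_realmode_p8,
 *
 * so that generic machine check code can reach them through cur_cpu_spec.
 */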