fed up with those stupid warnings
[mmotm.git] / arch / powerpc / platforms / cell / ras.c
blob5e0a191764fc0158b5eb7377af019615c3540767
1 /*
2 * Copyright 2006-2008, IBM Corporation.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
8 */
10 #undef DEBUG
12 #include <linux/types.h>
13 #include <linux/kernel.h>
14 #include <linux/smp.h>
15 #include <linux/reboot.h>
16 #include <linux/kexec.h>
17 #include <linux/crash_dump.h>
19 #include <asm/kexec.h>
20 #include <asm/reg.h>
21 #include <asm/io.h>
22 #include <asm/prom.h>
23 #include <asm/machdep.h>
24 #include <asm/rtas.h>
25 #include <asm/cell-regs.h>
27 #include "ras.h"
30 static void dump_fir(int cpu)
32 struct cbe_pmd_regs __iomem *pregs = cbe_get_cpu_pmd_regs(cpu);
33 struct cbe_iic_regs __iomem *iregs = cbe_get_cpu_iic_regs(cpu);
35 if (pregs == NULL)
36 return;
38 /* Todo: do some nicer parsing of bits and based on them go down
39 * to other sub-units FIRs and not only IIC
41 printk(KERN_ERR "Global Checkstop FIR : 0x%016llx\n",
42 in_be64(&pregs->checkstop_fir));
43 printk(KERN_ERR "Global Recoverable FIR : 0x%016llx\n",
44 in_be64(&pregs->checkstop_fir));
45 printk(KERN_ERR "Global MachineCheck FIR : 0x%016llx\n",
46 in_be64(&pregs->spec_att_mchk_fir));
48 if (iregs == NULL)
49 return;
50 printk(KERN_ERR "IOC FIR : 0x%016llx\n",
51 in_be64(&iregs->ioc_fir));
55 void cbe_system_error_exception(struct pt_regs *regs)
57 int cpu = smp_processor_id();
59 printk(KERN_ERR "System Error Interrupt on CPU %d !\n", cpu);
60 dump_fir(cpu);
61 dump_stack();
64 void cbe_maintenance_exception(struct pt_regs *regs)
66 int cpu = smp_processor_id();
69 * Nothing implemented for the maintenance interrupt at this point
72 printk(KERN_ERR "Unhandled Maintenance interrupt on CPU %d !\n", cpu);
73 dump_stack();
76 void cbe_thermal_exception(struct pt_regs *regs)
78 int cpu = smp_processor_id();
81 * Nothing implemented for the thermal interrupt at this point
84 printk(KERN_ERR "Unhandled Thermal interrupt on CPU %d !\n", cpu);
85 dump_stack();
88 static int cbe_machine_check_handler(struct pt_regs *regs)
90 int cpu = smp_processor_id();
92 printk(KERN_ERR "Machine Check Interrupt on CPU %d !\n", cpu);
93 dump_fir(cpu);
95 /* No recovery from this code now, lets continue */
96 return 0;
99 struct ptcal_area {
100 struct list_head list;
101 int nid;
102 int order;
103 struct page *pages;
106 static LIST_HEAD(ptcal_list);
108 static int ptcal_start_tok, ptcal_stop_tok;
110 static int __init cbe_ptcal_enable_on_node(int nid, int order)
112 struct ptcal_area *area;
113 int ret = -ENOMEM;
114 unsigned long addr;
116 if (is_kdump_kernel())
117 rtas_call(ptcal_stop_tok, 1, 1, NULL, nid);
119 area = kmalloc(sizeof(*area), GFP_KERNEL);
120 if (!area)
121 goto out_err;
123 area->nid = nid;
124 area->order = order;
125 area->pages = alloc_pages_exact_node(area->nid, GFP_KERNEL|GFP_THISNODE,
126 area->order);
128 if (!area->pages) {
129 printk(KERN_WARNING "%s: no page on node %d\n",
130 __func__, area->nid);
131 goto out_free_area;
135 * We move the ptcal area to the middle of the allocated
136 * page, in order to avoid prefetches in memcpy and similar
137 * functions stepping on it.
139 addr = __pa(page_address(area->pages)) + (PAGE_SIZE >> 1);
140 printk(KERN_DEBUG "%s: enabling PTCAL on node %d address=0x%016lx\n",
141 __func__, area->nid, addr);
143 ret = -EIO;
144 if (rtas_call(ptcal_start_tok, 3, 1, NULL, area->nid,
145 (unsigned int)(addr >> 32),
146 (unsigned int)(addr & 0xffffffff))) {
147 printk(KERN_ERR "%s: error enabling PTCAL on node %d!\n",
148 __func__, nid);
149 goto out_free_pages;
152 list_add(&area->list, &ptcal_list);
154 return 0;
156 out_free_pages:
157 __free_pages(area->pages, area->order);
158 out_free_area:
159 kfree(area);
160 out_err:
161 return ret;
164 static int __init cbe_ptcal_enable(void)
166 const u32 *size;
167 struct device_node *np;
168 int order, found_mic = 0;
170 np = of_find_node_by_path("/rtas");
171 if (!np)
172 return -ENODEV;
174 size = of_get_property(np, "ibm,cbe-ptcal-size", NULL);
175 if (!size)
176 return -ENODEV;
178 pr_debug("%s: enabling PTCAL, size = 0x%x\n", __func__, *size);
179 order = get_order(*size);
180 of_node_put(np);
182 /* support for malta device trees, with be@/mic@ nodes */
183 for_each_node_by_type(np, "mic-tm") {
184 cbe_ptcal_enable_on_node(of_node_to_nid(np), order);
185 found_mic = 1;
188 if (found_mic)
189 return 0;
191 /* support for older device tree - use cpu nodes */
192 for_each_node_by_type(np, "cpu") {
193 const u32 *nid = of_get_property(np, "node-id", NULL);
194 if (!nid) {
195 printk(KERN_ERR "%s: node %s is missing node-id?\n",
196 __func__, np->full_name);
197 continue;
199 cbe_ptcal_enable_on_node(*nid, order);
200 found_mic = 1;
203 return found_mic ? 0 : -ENODEV;
206 static int cbe_ptcal_disable(void)
208 struct ptcal_area *area, *tmp;
209 int ret = 0;
211 pr_debug("%s: disabling PTCAL\n", __func__);
213 list_for_each_entry_safe(area, tmp, &ptcal_list, list) {
214 /* disable ptcal on this node */
215 if (rtas_call(ptcal_stop_tok, 1, 1, NULL, area->nid)) {
216 printk(KERN_ERR "%s: error disabling PTCAL "
217 "on node %d!\n", __func__,
218 area->nid);
219 ret = -EIO;
220 continue;
223 /* ensure we can access the PTCAL area */
224 memset(page_address(area->pages), 0,
225 1 << (area->order + PAGE_SHIFT));
227 /* clean up */
228 list_del(&area->list);
229 __free_pages(area->pages, area->order);
230 kfree(area);
233 return ret;
236 static int cbe_ptcal_notify_reboot(struct notifier_block *nb,
237 unsigned long code, void *data)
239 return cbe_ptcal_disable();
242 static void cbe_ptcal_crash_shutdown(void)
244 cbe_ptcal_disable();
247 static struct notifier_block cbe_ptcal_reboot_notifier = {
248 .notifier_call = cbe_ptcal_notify_reboot
251 #ifdef CONFIG_PPC_IBM_CELL_RESETBUTTON
252 static int sysreset_hack;
254 static int __init cbe_sysreset_init(void)
256 struct cbe_pmd_regs __iomem *regs;
258 sysreset_hack = machine_is_compatible("IBM,CBPLUS-1.0");
259 if (!sysreset_hack)
260 return 0;
262 regs = cbe_get_cpu_pmd_regs(0);
263 if (!regs)
264 return 0;
266 /* Enable JTAG system-reset hack */
267 out_be32(&regs->fir_mode_reg,
268 in_be32(&regs->fir_mode_reg) |
269 CBE_PMD_FIR_MODE_M8);
271 return 0;
273 device_initcall(cbe_sysreset_init);
275 int cbe_sysreset_hack(void)
277 struct cbe_pmd_regs __iomem *regs;
280 * The BMC can inject user triggered system reset exceptions,
281 * but cannot set the system reset reason in srr1,
282 * so check an extra register here.
284 if (sysreset_hack && (smp_processor_id() == 0)) {
285 regs = cbe_get_cpu_pmd_regs(0);
286 if (!regs)
287 return 0;
288 if (in_be64(&regs->ras_esc_0) & 0x0000ffff) {
289 out_be64(&regs->ras_esc_0, 0);
290 return 0;
293 return 1;
295 #endif /* CONFIG_PPC_IBM_CELL_RESETBUTTON */
297 int __init cbe_ptcal_init(void)
299 int ret;
300 ptcal_start_tok = rtas_token("ibm,cbe-start-ptcal");
301 ptcal_stop_tok = rtas_token("ibm,cbe-stop-ptcal");
303 if (ptcal_start_tok == RTAS_UNKNOWN_SERVICE
304 || ptcal_stop_tok == RTAS_UNKNOWN_SERVICE)
305 return -ENODEV;
307 ret = register_reboot_notifier(&cbe_ptcal_reboot_notifier);
308 if (ret)
309 goto out1;
311 ret = crash_shutdown_register(&cbe_ptcal_crash_shutdown);
312 if (ret)
313 goto out2;
315 return cbe_ptcal_enable();
317 out2:
318 unregister_reboot_notifier(&cbe_ptcal_reboot_notifier);
319 out1:
320 printk(KERN_ERR "Can't disable PTCAL, so not enabling\n");
321 return ret;
324 arch_initcall(cbe_ptcal_init);
326 void __init cbe_ras_init(void)
328 unsigned long hid0;
331 * Enable System Error & thermal interrupts and wakeup conditions
334 hid0 = mfspr(SPRN_HID0);
335 hid0 |= HID0_CBE_THERM_INT_EN | HID0_CBE_THERM_WAKEUP |
336 HID0_CBE_SYSERR_INT_EN | HID0_CBE_SYSERR_WAKEUP;
337 mtspr(SPRN_HID0, hid0);
338 mb();
341 * Install machine check handler. Leave setting of precise mode to
342 * what the firmware did for now
344 ppc_md.machine_check_exception = cbe_machine_check_handler;
345 mb();
348 * For now, we assume that IOC_FIR is already set to forward some
349 * error conditions to the System Error handler. If that is not true
350 * then it will have to be fixed up here.