2 * PowerNV OPAL high level interfaces
4 * Copyright 2011 IBM Corp.
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
12 #define pr_fmt(fmt) "opal: " fmt
14 #include <linux/printk.h>
15 #include <linux/types.h>
17 #include <linux/of_fdt.h>
18 #include <linux/of_platform.h>
19 #include <linux/interrupt.h>
20 #include <linux/notifier.h>
21 #include <linux/slab.h>
22 #include <linux/sched.h>
23 #include <linux/kobject.h>
24 #include <linux/delay.h>
25 #include <linux/memblock.h>
26 #include <linux/kthread.h>
27 #include <linux/freezer.h>
29 #include <asm/machdep.h>
31 #include <asm/firmware.h>
36 /* /sys/firmware/opal */
37 struct kobject
*opal_kobj
;
45 struct mcheck_recoverable_range
{
51 static struct mcheck_recoverable_range
*mc_recoverable_range
;
52 static int mc_recoverable_range_len
;
54 struct device_node
*opal_node
;
55 static DEFINE_SPINLOCK(opal_write_lock
);
56 static struct atomic_notifier_head opal_msg_notifier_head
[OPAL_MSG_TYPE_MAX
];
57 static uint32_t opal_heartbeat
;
59 static void opal_reinit_cores(void)
61 /* Do the actual re-init. This will clobber all FPRs, VRs, etc...
63 * It will preserve non volatile GPRs and HSPRG0/1. It will
64 * also restore HIDs and other SPRs to their original value
65 * but it might clobber a bunch.
68 opal_reinit_cpus(OPAL_REINIT_CPUS_HILE_BE
);
70 opal_reinit_cpus(OPAL_REINIT_CPUS_HILE_LE
);
74 int __init
early_init_dt_scan_opal(unsigned long node
,
75 const char *uname
, int depth
, void *data
)
77 const void *basep
, *entryp
, *sizep
;
78 int basesz
, entrysz
, runtimesz
;
80 if (depth
!= 1 || strcmp(uname
, "ibm,opal") != 0)
83 basep
= of_get_flat_dt_prop(node
, "opal-base-address", &basesz
);
84 entryp
= of_get_flat_dt_prop(node
, "opal-entry-address", &entrysz
);
85 sizep
= of_get_flat_dt_prop(node
, "opal-runtime-size", &runtimesz
);
87 if (!basep
|| !entryp
|| !sizep
)
90 opal
.base
= of_read_number(basep
, basesz
/4);
91 opal
.entry
= of_read_number(entryp
, entrysz
/4);
92 opal
.size
= of_read_number(sizep
, runtimesz
/4);
94 pr_debug("OPAL Base = 0x%llx (basep=%p basesz=%d)\n",
95 opal
.base
, basep
, basesz
);
96 pr_debug("OPAL Entry = 0x%llx (entryp=%p basesz=%d)\n",
97 opal
.entry
, entryp
, entrysz
);
98 pr_debug("OPAL Entry = 0x%llx (sizep=%p runtimesz=%d)\n",
99 opal
.size
, sizep
, runtimesz
);
101 powerpc_firmware_features
|= FW_FEATURE_OPAL
;
102 if (of_flat_dt_is_compatible(node
, "ibm,opal-v3")) {
103 powerpc_firmware_features
|= FW_FEATURE_OPALv2
;
104 powerpc_firmware_features
|= FW_FEATURE_OPALv3
;
105 pr_info("OPAL V3 detected !\n");
106 } else if (of_flat_dt_is_compatible(node
, "ibm,opal-v2")) {
107 powerpc_firmware_features
|= FW_FEATURE_OPALv2
;
108 pr_info("OPAL V2 detected !\n");
110 pr_info("OPAL V1 detected !\n");
113 /* Reinit all cores with the right endian */
116 /* Restore some bits */
117 if (cur_cpu_spec
->cpu_restore
)
118 cur_cpu_spec
->cpu_restore();
123 int __init
early_init_dt_scan_recoverable_ranges(unsigned long node
,
124 const char *uname
, int depth
, void *data
)
129 if (depth
!= 1 || strcmp(uname
, "ibm,opal") != 0)
132 prop
= of_get_flat_dt_prop(node
, "mcheck-recoverable-ranges", &psize
);
137 pr_debug("Found machine check recoverable ranges.\n");
140 * Calculate number of available entries.
142 * Each recoverable address range entry is (start address, len,
143 * recovery address), 2 cells each for start and recovery address,
144 * 1 cell for len, totalling 5 cells per entry.
146 mc_recoverable_range_len
= psize
/ (sizeof(*prop
) * 5);
149 if (!mc_recoverable_range_len
)
152 /* Size required to hold all the entries. */
153 size
= mc_recoverable_range_len
*
154 sizeof(struct mcheck_recoverable_range
);
157 * Allocate a buffer to hold the MC recoverable ranges. We would be
158 * accessing them in real mode, hence it needs to be within
161 mc_recoverable_range
=__va(memblock_alloc_base(size
, __alignof__(u64
),
163 memset(mc_recoverable_range
, 0, size
);
165 for (i
= 0; i
< mc_recoverable_range_len
; i
++) {
166 mc_recoverable_range
[i
].start_addr
=
167 of_read_number(prop
+ (i
* 5) + 0, 2);
168 mc_recoverable_range
[i
].end_addr
=
169 mc_recoverable_range
[i
].start_addr
+
170 of_read_number(prop
+ (i
* 5) + 2, 1);
171 mc_recoverable_range
[i
].recover_addr
=
172 of_read_number(prop
+ (i
* 5) + 3, 2);
174 pr_debug("Machine check recoverable range: %llx..%llx: %llx\n",
175 mc_recoverable_range
[i
].start_addr
,
176 mc_recoverable_range
[i
].end_addr
,
177 mc_recoverable_range
[i
].recover_addr
);
182 static int __init
opal_register_exception_handlers(void)
184 #ifdef __BIG_ENDIAN__
187 if (!(powerpc_firmware_features
& FW_FEATURE_OPAL
))
190 /* Hookup some exception handlers except machine check. We use the
191 * fwnmi area at 0x7000 to provide the glue space to OPAL
196 * Check if we are running on newer firmware that exports
197 * OPAL_HANDLE_HMI token. If yes, then don't ask OPAL to patch
198 * the HMI interrupt and we catch it directly in Linux.
200 * For older firmware (i.e. currently released POWER8 System Firmware
201 * as of today <= SV810_087), we fallback to old behavior and let OPAL
202 * patch the HMI vector and handle it inside OPAL firmware.
204 * For newer firmware (in development/yet to be released) we will
205 * start catching/handling HMI directly in Linux.
207 if (!opal_check_token(OPAL_HANDLE_HMI
)) {
208 pr_info("Old firmware detected, OPAL handles HMIs.\n");
209 opal_register_exception_handler(
210 OPAL_HYPERVISOR_MAINTENANCE_HANDLER
,
215 opal_register_exception_handler(OPAL_SOFTPATCH_HANDLER
, 0, glue
);
220 machine_early_initcall(powernv
, opal_register_exception_handlers
);
223 * Opal message notifier based on message type. Allow subscribers to get
224 * notified for a specific message type.
226 int opal_message_notifier_register(enum opal_msg_type msg_type
,
227 struct notifier_block
*nb
)
229 if (!nb
|| msg_type
>= OPAL_MSG_TYPE_MAX
) {
230 pr_warning("%s: Invalid arguments, msg_type:%d\n",
235 return atomic_notifier_chain_register(
236 &opal_msg_notifier_head
[msg_type
], nb
);
238 EXPORT_SYMBOL_GPL(opal_message_notifier_register
);
240 int opal_message_notifier_unregister(enum opal_msg_type msg_type
,
241 struct notifier_block
*nb
)
243 return atomic_notifier_chain_unregister(
244 &opal_msg_notifier_head
[msg_type
], nb
);
246 EXPORT_SYMBOL_GPL(opal_message_notifier_unregister
);
248 static void opal_message_do_notify(uint32_t msg_type
, void *msg
)
250 /* notify subscribers */
251 atomic_notifier_call_chain(&opal_msg_notifier_head
[msg_type
],
255 static void opal_handle_message(void)
259 * TODO: pre-allocate a message buffer depending on opal-msg-size
260 * value in /proc/device-tree.
262 static struct opal_msg msg
;
265 ret
= opal_get_msg(__pa(&msg
), sizeof(msg
));
266 /* No opal message pending. */
267 if (ret
== OPAL_RESOURCE
)
270 /* check for errors. */
272 pr_warning("%s: Failed to retrieve opal message, err=%lld\n",
277 type
= be32_to_cpu(msg
.msg_type
);
280 if (type
>= OPAL_MSG_TYPE_MAX
) {
281 pr_warning("%s: Unknown message type: %u\n", __func__
, type
);
284 opal_message_do_notify(type
, (void *)&msg
);
287 static irqreturn_t
opal_message_notify(int irq
, void *data
)
289 opal_handle_message();
293 static int __init
opal_message_init(void)
297 for (i
= 0; i
< OPAL_MSG_TYPE_MAX
; i
++)
298 ATOMIC_INIT_NOTIFIER_HEAD(&opal_msg_notifier_head
[i
]);
300 irq
= opal_event_request(ilog2(OPAL_EVENT_MSG_PENDING
));
302 pr_err("%s: Can't register OPAL event irq (%d)\n",
307 ret
= request_irq(irq
, opal_message_notify
,
308 IRQ_TYPE_LEVEL_HIGH
, "opal-msg", NULL
);
310 pr_err("%s: Can't request OPAL event irq (%d)\n",
318 int opal_get_chars(uint32_t vtermno
, char *buf
, int count
)
325 opal_poll_events(&evt
);
326 if ((be64_to_cpu(evt
) & OPAL_EVENT_CONSOLE_INPUT
) == 0)
328 len
= cpu_to_be64(count
);
329 rc
= opal_console_read(vtermno
, &len
, buf
);
330 if (rc
== OPAL_SUCCESS
)
331 return be64_to_cpu(len
);
335 int opal_put_chars(uint32_t vtermno
, const char *data
, int total_len
)
346 /* We want put_chars to be atomic to avoid mangling of hvsi
347 * packets. To do that, we first test for room and return
348 * -EAGAIN if there isn't enough.
350 * Unfortunately, opal_console_write_buffer_space() doesn't
351 * appear to work on opal v1, so we just assume there is
352 * enough room and be done with it
354 spin_lock_irqsave(&opal_write_lock
, flags
);
355 if (firmware_has_feature(FW_FEATURE_OPALv2
)) {
356 rc
= opal_console_write_buffer_space(vtermno
, &olen
);
357 len
= be64_to_cpu(olen
);
358 if (rc
|| len
< total_len
) {
359 spin_unlock_irqrestore(&opal_write_lock
, flags
);
360 /* Closed -> drop characters */
363 opal_poll_events(NULL
);
368 /* We still try to handle partial completions, though they
369 * should no longer happen.
372 while(total_len
> 0 && (rc
== OPAL_BUSY
||
373 rc
== OPAL_BUSY_EVENT
|| rc
== OPAL_SUCCESS
)) {
374 olen
= cpu_to_be64(total_len
);
375 rc
= opal_console_write(vtermno
, &olen
, data
);
376 len
= be64_to_cpu(olen
);
378 /* Closed or other error drop */
379 if (rc
!= OPAL_SUCCESS
&& rc
!= OPAL_BUSY
&&
380 rc
!= OPAL_BUSY_EVENT
) {
384 if (rc
== OPAL_SUCCESS
) {
389 /* This is a bit nasty but we need that for the console to
390 * flush when there aren't any interrupts. We will clean
391 * things a bit later to limit that to synchronous path
392 * such as the kernel console and xmon/udbg
395 opal_poll_events(&evt
);
396 while(rc
== OPAL_SUCCESS
&&
397 (be64_to_cpu(evt
) & OPAL_EVENT_CONSOLE_OUTPUT
));
399 spin_unlock_irqrestore(&opal_write_lock
, flags
);
403 static int opal_recover_mce(struct pt_regs
*regs
,
404 struct machine_check_event
*evt
)
407 uint64_t ea
= get_mce_fault_addr(evt
);
409 if (!(regs
->msr
& MSR_RI
)) {
410 /* If MSR_RI isn't set, we cannot recover */
412 } else if (evt
->disposition
== MCE_DISPOSITION_RECOVERED
) {
413 /* Platform corrected itself */
415 } else if (ea
&& !is_kernel_addr(ea
)) {
417 * Faulting address is not in kernel text. We should be fine.
418 * We need to find which process uses this address.
419 * For now, kill the task if we have received exception when
422 * TODO: Queue up this address for hwpoisoning later.
424 if (user_mode(regs
) && !is_global_init(current
)) {
425 _exception(SIGBUS
, regs
, BUS_MCEERR_AR
, regs
->nip
);
429 } else if (user_mode(regs
) && !is_global_init(current
) &&
430 evt
->severity
== MCE_SEV_ERROR_SYNC
) {
432 * If we have received a synchronous error when in userspace
435 _exception(SIGBUS
, regs
, BUS_MCEERR_AR
, regs
->nip
);
441 int opal_machine_check(struct pt_regs
*regs
)
443 struct machine_check_event evt
;
445 if (!get_mce_event(&evt
, MCE_EVENT_RELEASE
))
448 /* Print things out */
449 if (evt
.version
!= MCE_V1
) {
450 pr_err("Machine Check Exception, Unknown event version %d !\n",
454 machine_check_print_event_info(&evt
);
456 if (opal_recover_mce(regs
, &evt
))
461 /* Early hmi handler called in real mode. */
462 int opal_hmi_exception_early(struct pt_regs
*regs
)
467 * call opal hmi handler. Pass paca address as token.
468 * The return value OPAL_SUCCESS is an indication that there is
469 * an HMI event generated and waiting to be pulled by Linux.
471 rc
= opal_handle_hmi();
472 if (rc
== OPAL_SUCCESS
) {
473 local_paca
->hmi_event_available
= 1;
479 /* HMI exception handler called in virtual mode during check_irq_replay. */
480 int opal_handle_hmi_exception(struct pt_regs
*regs
)
486 * Check if HMI event is available.
487 * if Yes, then call opal_poll_events to pull opal messages and
490 if (!local_paca
->hmi_event_available
)
493 local_paca
->hmi_event_available
= 0;
494 rc
= opal_poll_events(&evt
);
495 if (rc
== OPAL_SUCCESS
&& evt
)
496 opal_handle_events(be64_to_cpu(evt
));
501 static uint64_t find_recovery_address(uint64_t nip
)
505 for (i
= 0; i
< mc_recoverable_range_len
; i
++)
506 if ((nip
>= mc_recoverable_range
[i
].start_addr
) &&
507 (nip
< mc_recoverable_range
[i
].end_addr
))
508 return mc_recoverable_range
[i
].recover_addr
;
512 bool opal_mce_check_early_recovery(struct pt_regs
*regs
)
514 uint64_t recover_addr
= 0;
516 if (!opal
.base
|| !opal
.size
)
519 if ((regs
->nip
>= opal
.base
) &&
520 (regs
->nip
<= (opal
.base
+ opal
.size
)))
521 recover_addr
= find_recovery_address(regs
->nip
);
524 * Setup regs->nip to rfi into fixup address.
527 regs
->nip
= recover_addr
;
530 return !!recover_addr
;
533 static int opal_sysfs_init(void)
535 opal_kobj
= kobject_create_and_add("opal", firmware_kobj
);
537 pr_warn("kobject_create_and_add opal failed\n");
544 static ssize_t
symbol_map_read(struct file
*fp
, struct kobject
*kobj
,
545 struct bin_attribute
*bin_attr
,
546 char *buf
, loff_t off
, size_t count
)
548 return memory_read_from_buffer(buf
, count
, &off
, bin_attr
->private,
552 static BIN_ATTR_RO(symbol_map
, 0);
554 static void opal_export_symmap(void)
558 struct device_node
*fw
;
561 fw
= of_find_node_by_path("/ibm,opal/firmware");
564 syms
= of_get_property(fw
, "symbol-map", &size
);
565 if (!syms
|| size
!= 2 * sizeof(__be64
))
568 /* Setup attributes */
569 bin_attr_symbol_map
.private = __va(be64_to_cpu(syms
[0]));
570 bin_attr_symbol_map
.size
= be64_to_cpu(syms
[1]);
572 rc
= sysfs_create_bin_file(opal_kobj
, &bin_attr_symbol_map
);
574 pr_warn("Error %d creating OPAL symbols file\n", rc
);
577 static void __init
opal_dump_region_init(void)
583 if (!opal_check_token(OPAL_REGISTER_DUMP_REGION
))
586 /* Register kernel log buffer */
587 addr
= log_buf_addr_get();
591 size
= log_buf_len_get();
595 rc
= opal_register_dump_region(OPAL_DUMP_REGION_LOG_BUF
,
597 /* Don't warn if this is just an older OPAL that doesn't
598 * know about that call
600 if (rc
&& rc
!= OPAL_UNSUPPORTED
)
601 pr_warn("DUMP: Failed to register kernel log buffer. "
605 static void opal_pdev_init(struct device_node
*opal_node
,
606 const char *compatible
)
608 struct device_node
*np
;
610 for_each_child_of_node(opal_node
, np
)
611 if (of_device_is_compatible(np
, compatible
))
612 of_platform_device_create(np
, NULL
, NULL
);
615 static void opal_i2c_create_devs(void)
617 struct device_node
*np
;
619 for_each_compatible_node(np
, NULL
, "ibm,opal-i2c")
620 of_platform_device_create(np
, NULL
, NULL
);
623 static int kopald(void *unused
)
630 opal_poll_events(&events
);
631 opal_handle_events(be64_to_cpu(events
));
632 msleep_interruptible(opal_heartbeat
);
633 } while (!kthread_should_stop());
638 static void opal_init_heartbeat(void)
640 /* Old firmware, we assume the HVC heartbeat is sufficient */
641 if (of_property_read_u32(opal_node
, "ibm,heartbeat-ms",
642 &opal_heartbeat
) != 0)
646 kthread_run(kopald
, NULL
, "kopald");
649 static int __init
opal_init(void)
651 struct device_node
*np
, *consoles
;
654 opal_node
= of_find_node_by_path("/ibm,opal");
656 pr_warn("Device node not found\n");
660 /* Register OPAL consoles if any ports */
661 if (firmware_has_feature(FW_FEATURE_OPALv2
))
662 consoles
= of_find_node_by_path("/ibm,opal/consoles");
664 consoles
= of_node_get(opal_node
);
666 for_each_child_of_node(consoles
, np
) {
667 if (strcmp(np
->name
, "serial"))
669 of_platform_device_create(np
, NULL
, NULL
);
671 of_node_put(consoles
);
674 /* Initialise OPAL messaging system */
677 /* Initialise OPAL asynchronous completion interface */
678 opal_async_comp_init();
680 /* Initialise OPAL sensor interface */
683 /* Initialise OPAL hypervisor maintenance interrupt handling */
684 opal_hmi_handler_init();
686 /* Create i2c platform devices */
687 opal_i2c_create_devs();
689 /* Setup a heartbeat thread if requested by OPAL */
690 opal_init_heartbeat();
692 /* Create "opal" kobject under /sys/firmware */
693 rc
= opal_sysfs_init();
695 /* Export symbol map to userspace */
696 opal_export_symmap();
697 /* Setup dump region interface */
698 opal_dump_region_init();
699 /* Setup error log interface */
700 rc
= opal_elog_init();
701 /* Setup code update interface */
702 opal_flash_update_init();
703 /* Setup platform dump extract interface */
704 opal_platform_dump_init();
705 /* Setup system parameters interface */
706 opal_sys_param_init();
707 /* Setup message log interface. */
711 /* Initialize platform devices: IPMI backend, PRD & flash interface */
712 opal_pdev_init(opal_node
, "ibm,opal-ipmi");
713 opal_pdev_init(opal_node
, "ibm,opal-flash");
714 opal_pdev_init(opal_node
, "ibm,opal-prd");
718 machine_subsys_initcall(powernv
, opal_init
);
720 void opal_shutdown(void)
724 opal_event_shutdown();
727 * Then sync with OPAL, which ensures anything that can
728 * potentially write to our memory has completed such
729 * as an ongoing dump retrieval
731 while (rc
== OPAL_BUSY
|| rc
== OPAL_BUSY_EVENT
) {
732 rc
= opal_sync_host_reboot();
734 opal_poll_events(NULL
);
739 /* Unregister memory dump region */
740 if (opal_check_token(OPAL_UNREGISTER_DUMP_REGION
))
741 opal_unregister_dump_region(OPAL_DUMP_REGION_LOG_BUF
);
744 /* Export this so that test modules can use it */
745 EXPORT_SYMBOL_GPL(opal_invalid_call
);
746 EXPORT_SYMBOL_GPL(opal_xscom_read
);
747 EXPORT_SYMBOL_GPL(opal_xscom_write
);
748 EXPORT_SYMBOL_GPL(opal_ipmi_send
);
749 EXPORT_SYMBOL_GPL(opal_ipmi_recv
);
750 EXPORT_SYMBOL_GPL(opal_flash_read
);
751 EXPORT_SYMBOL_GPL(opal_flash_write
);
752 EXPORT_SYMBOL_GPL(opal_flash_erase
);
753 EXPORT_SYMBOL_GPL(opal_prd_msg
);
755 /* Convert a region of vmalloc memory to an opal sg list */
756 struct opal_sg_list
*opal_vmalloc_to_sg_list(void *vmalloc_addr
,
757 unsigned long vmalloc_size
)
759 struct opal_sg_list
*sg
, *first
= NULL
;
762 sg
= kzalloc(PAGE_SIZE
, GFP_KERNEL
);
768 while (vmalloc_size
> 0) {
769 uint64_t data
= vmalloc_to_pfn(vmalloc_addr
) << PAGE_SHIFT
;
770 uint64_t length
= min(vmalloc_size
, PAGE_SIZE
);
772 sg
->entry
[i
].data
= cpu_to_be64(data
);
773 sg
->entry
[i
].length
= cpu_to_be64(length
);
776 if (i
>= SG_ENTRIES_PER_NODE
) {
777 struct opal_sg_list
*next
;
779 next
= kzalloc(PAGE_SIZE
, GFP_KERNEL
);
783 sg
->length
= cpu_to_be64(
784 i
* sizeof(struct opal_sg_entry
) + 16);
786 sg
->next
= cpu_to_be64(__pa(next
));
790 vmalloc_addr
+= length
;
791 vmalloc_size
-= length
;
794 sg
->length
= cpu_to_be64(i
* sizeof(struct opal_sg_entry
) + 16);
799 pr_err("%s : Failed to allocate memory\n", __func__
);
800 opal_free_sg_list(first
);
804 void opal_free_sg_list(struct opal_sg_list
*sg
)
807 uint64_t next
= be64_to_cpu(sg
->next
);
818 int opal_error_code(int rc
)
821 case OPAL_SUCCESS
: return 0;
823 case OPAL_PARAMETER
: return -EINVAL
;
824 case OPAL_ASYNC_COMPLETION
: return -EINPROGRESS
;
825 case OPAL_BUSY_EVENT
: return -EBUSY
;
826 case OPAL_NO_MEM
: return -ENOMEM
;
827 case OPAL_PERMISSION
: return -EPERM
;
829 case OPAL_UNSUPPORTED
: return -EIO
;
830 case OPAL_HARDWARE
: return -EIO
;
831 case OPAL_INTERNAL_ERROR
: return -EIO
;
833 pr_err("%s: unexpected OPAL error %d\n", __func__
, rc
);
838 EXPORT_SYMBOL_GPL(opal_poll_events
);
839 EXPORT_SYMBOL_GPL(opal_rtc_read
);
840 EXPORT_SYMBOL_GPL(opal_rtc_write
);
841 EXPORT_SYMBOL_GPL(opal_tpo_read
);
842 EXPORT_SYMBOL_GPL(opal_tpo_write
);
843 EXPORT_SYMBOL_GPL(opal_i2c_request
);