]> git.proxmox.com Git - mirror_ubuntu-eoan-kernel.git/blame - arch/powerpc/platforms/powernv/opal.c
powerpc/powernv: Add IMC OPAL APIs
[mirror_ubuntu-eoan-kernel.git] / arch / powerpc / platforms / powernv / opal.c
CommitLineData
14a43e69
BH
1/*
2 * PowerNV OPAL high level interfaces
3 *
4 * Copyright 2011 IBM Corp.
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 */
11
c8742f85 12#define pr_fmt(fmt) "opal: " fmt
14a43e69 13
c8742f85 14#include <linux/printk.h>
14a43e69
BH
15#include <linux/types.h>
16#include <linux/of.h>
26a2056e 17#include <linux/of_fdt.h>
14a43e69 18#include <linux/of_platform.h>
a125e092 19#include <linux/interrupt.h>
1bc98de2 20#include <linux/notifier.h>
73ed148a 21#include <linux/slab.h>
b63a0ffe 22#include <linux/sched.h>
6f68b5e2 23#include <linux/kobject.h>
f7d98d18 24#include <linux/delay.h>
55672ecf 25#include <linux/memblock.h>
3bf57561
BH
26#include <linux/kthread.h>
27#include <linux/freezer.h>
b14726c5
ME
28
29#include <asm/machdep.h>
14a43e69
BH
30#include <asm/opal.h>
31#include <asm/firmware.h>
36df96f8 32#include <asm/mce.h>
14a43e69
BH
33
34#include "powernv.h"
35
6f68b5e2
VH
36/* /sys/firmware/opal */
37struct kobject *opal_kobj;
38
14a43e69
BH
39struct opal {
40 u64 base;
41 u64 entry;
55672ecf 42 u64 size;
14a43e69
BH
43} opal;
44
55672ecf
MS
45struct mcheck_recoverable_range {
46 u64 start_addr;
47 u64 end_addr;
48 u64 recover_addr;
49};
50
51static struct mcheck_recoverable_range *mc_recoverable_range;
52static int mc_recoverable_range_len;
53
bfc36894 54struct device_node *opal_node;
14a43e69 55static DEFINE_SPINLOCK(opal_write_lock);
24366360 56static struct atomic_notifier_head opal_msg_notifier_head[OPAL_MSG_TYPE_MAX];
3bf57561 57static uint32_t opal_heartbeat;
a203658b 58static struct task_struct *kopald_tsk;
14a43e69 59
d3cbff1b 60void opal_configure_cores(void)
4926616c 61{
1c0eaf0f
BH
62 u64 reinit_flags = 0;
63
4926616c
BH
64 /* Do the actual re-init, This will clobber all FPRs, VRs, etc...
65 *
66 * It will preserve non volatile GPRs and HSPRG0/1. It will
67 * also restore HIDs and other SPRs to their original value
68 * but it might clobber a bunch.
69 */
70#ifdef __BIG_ENDIAN__
1c0eaf0f 71 reinit_flags |= OPAL_REINIT_CPUS_HILE_BE;
4926616c 72#else
1c0eaf0f 73 reinit_flags |= OPAL_REINIT_CPUS_HILE_LE;
4926616c 74#endif
d3cbff1b 75
1c0eaf0f
BH
76 /*
77 * POWER9 always support running hash:
78 * ie. Host hash supports hash guests
79 * Host radix supports hash/radix guests
80 */
a70b487b 81 if (early_cpu_has_feature(CPU_FTR_ARCH_300)) {
1c0eaf0f
BH
82 reinit_flags |= OPAL_REINIT_CPUS_MMU_HASH;
83 if (early_radix_enabled())
84 reinit_flags |= OPAL_REINIT_CPUS_MMU_RADIX;
85 }
86
87 opal_reinit_cpus(reinit_flags);
88
d3cbff1b
BH
89 /* Restore some bits */
90 if (cur_cpu_spec->cpu_restore)
91 cur_cpu_spec->cpu_restore();
4926616c
BH
92}
93
14a43e69
BH
94int __init early_init_dt_scan_opal(unsigned long node,
95 const char *uname, int depth, void *data)
96{
55672ecf 97 const void *basep, *entryp, *sizep;
9d0c4dfe 98 int basesz, entrysz, runtimesz;
14a43e69
BH
99
100 if (depth != 1 || strcmp(uname, "ibm,opal") != 0)
101 return 0;
102
103 basep = of_get_flat_dt_prop(node, "opal-base-address", &basesz);
104 entryp = of_get_flat_dt_prop(node, "opal-entry-address", &entrysz);
55672ecf 105 sizep = of_get_flat_dt_prop(node, "opal-runtime-size", &runtimesz);
14a43e69 106
55672ecf 107 if (!basep || !entryp || !sizep)
14a43e69
BH
108 return 1;
109
110 opal.base = of_read_number(basep, basesz/4);
111 opal.entry = of_read_number(entryp, entrysz/4);
55672ecf 112 opal.size = of_read_number(sizep, runtimesz/4);
14a43e69 113
9d0c4dfe 114 pr_debug("OPAL Base = 0x%llx (basep=%p basesz=%d)\n",
14a43e69 115 opal.base, basep, basesz);
9d0c4dfe 116 pr_debug("OPAL Entry = 0x%llx (entryp=%p basesz=%d)\n",
14a43e69 117 opal.entry, entryp, entrysz);
9d0c4dfe 118 pr_debug("OPAL Entry = 0x%llx (sizep=%p runtimesz=%d)\n",
55672ecf 119 opal.size, sizep, runtimesz);
14a43e69 120
75b93da4 121 if (of_flat_dt_is_compatible(node, "ibm,opal-v3")) {
e4d54f71
SS
122 powerpc_firmware_features |= FW_FEATURE_OPAL;
123 pr_info("OPAL detected !\n");
14a43e69 124 } else {
786842b6 125 panic("OPAL != V3 detected, no longer supported.\n");
14a43e69
BH
126 }
127
c4463b37
JK
128 return 1;
129}
130
55672ecf
MS
131int __init early_init_dt_scan_recoverable_ranges(unsigned long node,
132 const char *uname, int depth, void *data)
133{
9d0c4dfe 134 int i, psize, size;
55672ecf
MS
135 const __be32 *prop;
136
137 if (depth != 1 || strcmp(uname, "ibm,opal") != 0)
138 return 0;
139
6e556b47 140 prop = of_get_flat_dt_prop(node, "mcheck-recoverable-ranges", &psize);
55672ecf
MS
141
142 if (!prop)
143 return 1;
144
145 pr_debug("Found machine check recoverable ranges.\n");
146
6e556b47
MS
147 /*
148 * Calculate number of available entries.
149 *
150 * Each recoverable address range entry is (start address, len,
151 * recovery address), 2 cells each for start and recovery address,
152 * 1 cell for len, totalling 5 cells per entry.
153 */
154 mc_recoverable_range_len = psize / (sizeof(*prop) * 5);
155
156 /* Sanity check */
157 if (!mc_recoverable_range_len)
158 return 1;
159
160 /* Size required to hold all the entries. */
161 size = mc_recoverable_range_len *
162 sizeof(struct mcheck_recoverable_range);
163
55672ecf
MS
164 /*
165 * Allocate a buffer to hold the MC recoverable ranges. We would be
166 * accessing them in real mode, hence it needs to be within
167 * RMO region.
168 */
169 mc_recoverable_range =__va(memblock_alloc_base(size, __alignof__(u64),
170 ppc64_rma_size));
171 memset(mc_recoverable_range, 0, size);
172
6e556b47 173 for (i = 0; i < mc_recoverable_range_len; i++) {
55672ecf
MS
174 mc_recoverable_range[i].start_addr =
175 of_read_number(prop + (i * 5) + 0, 2);
176 mc_recoverable_range[i].end_addr =
177 mc_recoverable_range[i].start_addr +
178 of_read_number(prop + (i * 5) + 2, 1);
179 mc_recoverable_range[i].recover_addr =
180 of_read_number(prop + (i * 5) + 3, 2);
181
182 pr_debug("Machine check recoverable range: %llx..%llx: %llx\n",
183 mc_recoverable_range[i].start_addr,
184 mc_recoverable_range[i].end_addr,
185 mc_recoverable_range[i].recover_addr);
186 }
55672ecf
MS
187 return 1;
188}
189
c4463b37
JK
190static int __init opal_register_exception_handlers(void)
191{
29186097 192#ifdef __BIG_ENDIAN__
c4463b37
JK
193 u64 glue;
194
195 if (!(powerpc_firmware_features & FW_FEATURE_OPAL))
196 return -ENODEV;
197
28446de2
MS
198 /* Hookup some exception handlers except machine check. We use the
199 * fwnmi area at 0x7000 to provide the glue space to OPAL
ed79ba9e
BH
200 */
201 glue = 0x7000;
6507955c
MS
202
203 /*
204 * Check if we are running on newer firmware that exports
205 * OPAL_HANDLE_HMI token. If yes, then don't ask OPAL to patch
206 * the HMI interrupt and we catch it directly in Linux.
207 *
208 * For older firmware (i.e currently released POWER8 System Firmware
209 * as of today <= SV810_087), we fallback to old behavior and let OPAL
210 * patch the HMI vector and handle it inside OPAL firmware.
211 *
212 * For newer firmware (in development/yet to be released) we will
213 * start catching/handling HMI directly in Linux.
214 */
215 if (!opal_check_token(OPAL_HANDLE_HMI)) {
08135139 216 pr_info("Old firmware detected, OPAL handles HMIs.\n");
6507955c
MS
217 opal_register_exception_handler(
218 OPAL_HYPERVISOR_MAINTENANCE_HANDLER,
219 0, glue);
220 glue += 128;
221 }
222
ed79ba9e 223 opal_register_exception_handler(OPAL_SOFTPATCH_HANDLER, 0, glue);
29186097 224#endif
ed79ba9e 225
c4463b37 226 return 0;
14a43e69 227}
b14726c5 228machine_early_initcall(powernv, opal_register_exception_handlers);
c4463b37 229
24366360
MS
230/*
231 * Opal message notifier based on message type. Allow subscribers to get
232 * notified for specific messgae type.
233 */
d7cf83fc 234int opal_message_notifier_register(enum opal_msg_type msg_type,
24366360
MS
235 struct notifier_block *nb)
236{
792f96e9
NG
237 if (!nb || msg_type >= OPAL_MSG_TYPE_MAX) {
238 pr_warning("%s: Invalid arguments, msg_type:%d\n",
24366360
MS
239 __func__, msg_type);
240 return -EINVAL;
241 }
792f96e9 242
24366360
MS
243 return atomic_notifier_chain_register(
244 &opal_msg_notifier_head[msg_type], nb);
245}
594fcb9e 246EXPORT_SYMBOL_GPL(opal_message_notifier_register);
24366360 247
df60f576 248int opal_message_notifier_unregister(enum opal_msg_type msg_type,
b921e902
NG
249 struct notifier_block *nb)
250{
251 return atomic_notifier_chain_unregister(
252 &opal_msg_notifier_head[msg_type], nb);
253}
594fcb9e 254EXPORT_SYMBOL_GPL(opal_message_notifier_unregister);
b921e902 255
24366360
MS
256static void opal_message_do_notify(uint32_t msg_type, void *msg)
257{
258 /* notify subscribers */
259 atomic_notifier_call_chain(&opal_msg_notifier_head[msg_type],
260 msg_type, msg);
261}
262
263static void opal_handle_message(void)
264{
265 s64 ret;
266 /*
267 * TODO: pre-allocate a message buffer depending on opal-msg-size
268 * value in /proc/device-tree.
269 */
270 static struct opal_msg msg;
bb4398e1 271 u32 type;
24366360
MS
272
273 ret = opal_get_msg(__pa(&msg), sizeof(msg));
274 /* No opal message pending. */
275 if (ret == OPAL_RESOURCE)
276 return;
277
278 /* check for errors. */
279 if (ret) {
1a84db56 280 pr_warning("%s: Failed to retrieve opal message, err=%lld\n",
24366360
MS
281 __func__, ret);
282 return;
283 }
284
bb4398e1
AB
285 type = be32_to_cpu(msg.msg_type);
286
24366360 287 /* Sanity check */
792f96e9 288 if (type >= OPAL_MSG_TYPE_MAX) {
98da62b7 289 pr_warn_once("%s: Unknown message type: %u\n", __func__, type);
24366360
MS
290 return;
291 }
bb4398e1 292 opal_message_do_notify(type, (void *)&msg);
24366360
MS
293}
294
a295af24 295static irqreturn_t opal_message_notify(int irq, void *data)
24366360 296{
a295af24
AP
297 opal_handle_message();
298 return IRQ_HANDLED;
24366360
MS
299}
300
24366360
MS
301static int __init opal_message_init(void)
302{
a295af24 303 int ret, i, irq;
24366360
MS
304
305 for (i = 0; i < OPAL_MSG_TYPE_MAX; i++)
306 ATOMIC_INIT_NOTIFIER_HEAD(&opal_msg_notifier_head[i]);
307
a295af24
AP
308 irq = opal_event_request(ilog2(OPAL_EVENT_MSG_PENDING));
309 if (!irq) {
310 pr_err("%s: Can't register OPAL event irq (%d)\n",
311 __func__, irq);
312 return irq;
313 }
314
315 ret = request_irq(irq, opal_message_notify,
316 IRQ_TYPE_LEVEL_HIGH, "opal-msg", NULL);
24366360 317 if (ret) {
a295af24 318 pr_err("%s: Can't request OPAL event irq (%d)\n",
24366360
MS
319 __func__, ret);
320 return ret;
321 }
a295af24 322
24366360
MS
323 return 0;
324}
24366360 325
14a43e69
BH
326int opal_get_chars(uint32_t vtermno, char *buf, int count)
327{
4f89363b
BH
328 s64 rc;
329 __be64 evt, len;
14a43e69
BH
330
331 if (!opal.entry)
daea1175 332 return -ENODEV;
14a43e69 333 opal_poll_events(&evt);
4f89363b 334 if ((be64_to_cpu(evt) & OPAL_EVENT_CONSOLE_INPUT) == 0)
14a43e69 335 return 0;
4f89363b 336 len = cpu_to_be64(count);
9d0c4dfe 337 rc = opal_console_read(vtermno, &len, buf);
14a43e69 338 if (rc == OPAL_SUCCESS)
4f89363b 339 return be64_to_cpu(len);
14a43e69
BH
340 return 0;
341}
342
343int opal_put_chars(uint32_t vtermno, const char *data, int total_len)
344{
345 int written = 0;
4f89363b 346 __be64 olen;
daea1175 347 s64 len, rc;
14a43e69 348 unsigned long flags;
4f89363b 349 __be64 evt;
14a43e69
BH
350
351 if (!opal.entry)
daea1175 352 return -ENODEV;
14a43e69
BH
353
354 /* We want put_chars to be atomic to avoid mangling of hvsi
355 * packets. To do that, we first test for room and return
daea1175
BH
356 * -EAGAIN if there isn't enough.
357 *
358 * Unfortunately, opal_console_write_buffer_space() doesn't
359 * appear to work on opal v1, so we just assume there is
360 * enough room and be done with it
14a43e69
BH
361 */
362 spin_lock_irqsave(&opal_write_lock, flags);
e4d54f71
SS
363 rc = opal_console_write_buffer_space(vtermno, &olen);
364 len = be64_to_cpu(olen);
365 if (rc || len < total_len) {
366 spin_unlock_irqrestore(&opal_write_lock, flags);
367 /* Closed -> drop characters */
368 if (rc)
369 return total_len;
370 opal_poll_events(NULL);
371 return -EAGAIN;
14a43e69
BH
372 }
373
374 /* We still try to handle partial completions, though they
375 * should no longer happen.
376 */
daea1175 377 rc = OPAL_BUSY;
14a43e69
BH
378 while(total_len > 0 && (rc == OPAL_BUSY ||
379 rc == OPAL_BUSY_EVENT || rc == OPAL_SUCCESS)) {
4f89363b
BH
380 olen = cpu_to_be64(total_len);
381 rc = opal_console_write(vtermno, &olen, data);
382 len = be64_to_cpu(olen);
1de1455f
BH
383
384 /* Closed or other error drop */
385 if (rc != OPAL_SUCCESS && rc != OPAL_BUSY &&
386 rc != OPAL_BUSY_EVENT) {
387 written = total_len;
388 break;
389 }
14a43e69
BH
390 if (rc == OPAL_SUCCESS) {
391 total_len -= len;
392 data += len;
393 written += len;
394 }
395 /* This is a bit nasty but we need that for the console to
396 * flush when there aren't any interrupts. We will clean
397 * things a bit later to limit that to synchronous path
398 * such as the kernel console and xmon/udbg
399 */
400 do
401 opal_poll_events(&evt);
4f89363b
BH
402 while(rc == OPAL_SUCCESS &&
403 (be64_to_cpu(evt) & OPAL_EVENT_CONSOLE_OUTPUT));
14a43e69
BH
404 }
405 spin_unlock_irqrestore(&opal_write_lock, flags);
406 return written;
407}
408
b63a0ffe
MS
409static int opal_recover_mce(struct pt_regs *regs,
410 struct machine_check_event *evt)
411{
412 int recovered = 0;
b63a0ffe
MS
413
414 if (!(regs->msr & MSR_RI)) {
415 /* If MSR_RI isn't set, we cannot recover */
c74dd88e 416 pr_err("Machine check interrupt unrecoverable: MSR(RI=0)\n");
b63a0ffe
MS
417 recovered = 0;
418 } else if (evt->disposition == MCE_DISPOSITION_RECOVERED) {
419 /* Platform corrected itself */
420 recovered = 1;
1363875b
NP
421 } else if (evt->severity == MCE_SEV_FATAL) {
422 /* Fatal machine check */
423 pr_err("Machine check interrupt is fatal\n");
424 recovered = 0;
425 } else if ((evt->severity == MCE_SEV_ERROR_SYNC) &&
426 (user_mode(regs) && !is_global_init(current))) {
b63a0ffe 427 /*
b63a0ffe
MS
428 * For now, kill the task if we have received exception when
429 * in userspace.
430 *
431 * TODO: Queue up this address for hwpoisioning later.
432 */
b63a0ffe
MS
433 _exception(SIGBUS, regs, BUS_MCEERR_AR, regs->nip);
434 recovered = 1;
435 }
436 return recovered;
437}
438
ed79ba9e
BH
439int opal_machine_check(struct pt_regs *regs)
440{
36df96f8 441 struct machine_check_event evt;
e784b649 442 int ret;
ed79ba9e 443
36df96f8
MS
444 if (!get_mce_event(&evt, MCE_EVENT_RELEASE))
445 return 0;
ed79ba9e
BH
446
447 /* Print things out */
36df96f8 448 if (evt.version != MCE_V1) {
ed79ba9e
BH
449 pr_err("Machine Check Exception, Unknown event version %d !\n",
450 evt.version);
451 return 0;
452 }
63f44d65 453 machine_check_print_event_info(&evt, user_mode(regs));
ed79ba9e 454
b63a0ffe
MS
455 if (opal_recover_mce(regs, &evt))
456 return 1;
e784b649
MS
457
458 /*
459 * Unrecovered machine check, we are heading to panic path.
460 *
461 * We may have hit this MCE in very early stage of kernel
462 * initialization even before opal-prd has started running. If
463 * this is the case then this MCE error may go un-noticed or
464 * un-analyzed if we go down panic path. We need to inform
465 * BMC/OCC about this error so that they can collect relevant
466 * data for error analysis before rebooting.
467 * Use opal_cec_reboot2(OPAL_REBOOT_PLATFORM_ERROR) to do so.
468 * This function may not return on BMC based system.
469 */
470 ret = opal_cec_reboot2(OPAL_REBOOT_PLATFORM_ERROR,
471 "Unrecoverable Machine Check exception");
472 if (ret == OPAL_UNSUPPORTED) {
473 pr_emerg("Reboot type %d not supported\n",
474 OPAL_REBOOT_PLATFORM_ERROR);
475 }
476
477 /*
478 * We reached here. There can be three possibilities:
479 * 1. We are running on a firmware level that do not support
480 * opal_cec_reboot2()
481 * 2. We are running on a firmware level that do not support
482 * OPAL_REBOOT_PLATFORM_ERROR reboot type.
483 * 3. We are running on FSP based system that does not need opal
484 * to trigger checkstop explicitly for error analysis. The FSP
485 * PRD component would have already got notified about this
486 * error through other channels.
487 *
f2dd80ec
DA
488 * If hardware marked this as an unrecoverable MCE, we are
489 * going to panic anyway. Even if it didn't, it's not safe to
490 * continue at this point, so we should explicitly panic.
e784b649 491 */
f2dd80ec
DA
492
493 panic("PowerNV Unrecovered Machine Check");
b63a0ffe 494 return 0;
ed79ba9e
BH
495}
496
0869b6fd
MS
497/* Early hmi handler called in real mode. */
498int opal_hmi_exception_early(struct pt_regs *regs)
499{
0ef95b41
MS
500 s64 rc;
501
502 /*
503 * call opal hmi handler. Pass paca address as token.
504 * The return value OPAL_SUCCESS is an indication that there is
505 * an HMI event generated waiting to pull by Linux.
506 */
507 rc = opal_handle_hmi();
508 if (rc == OPAL_SUCCESS) {
509 local_paca->hmi_event_available = 1;
510 return 1;
511 }
0869b6fd
MS
512 return 0;
513}
514
515/* HMI exception handler called in virtual mode during check_irq_replay. */
516int opal_handle_hmi_exception(struct pt_regs *regs)
517{
0ef95b41
MS
518 s64 rc;
519 __be64 evt = 0;
520
521 /*
522 * Check if HMI event is available.
523 * if Yes, then call opal_poll_events to pull opal messages and
524 * process them.
525 */
526 if (!local_paca->hmi_event_available)
527 return 0;
528
529 local_paca->hmi_event_available = 0;
530 rc = opal_poll_events(&evt);
81f2f7ce 531 if (rc == OPAL_SUCCESS && evt)
9f0fd049 532 opal_handle_events(be64_to_cpu(evt));
0ef95b41
MS
533
534 return 1;
0869b6fd
MS
535}
536
55672ecf
MS
537static uint64_t find_recovery_address(uint64_t nip)
538{
539 int i;
540
541 for (i = 0; i < mc_recoverable_range_len; i++)
542 if ((nip >= mc_recoverable_range[i].start_addr) &&
543 (nip < mc_recoverable_range[i].end_addr))
544 return mc_recoverable_range[i].recover_addr;
545 return 0;
546}
547
548bool opal_mce_check_early_recovery(struct pt_regs *regs)
549{
550 uint64_t recover_addr = 0;
551
552 if (!opal.base || !opal.size)
553 goto out;
554
555 if ((regs->nip >= opal.base) &&
dc3799bb 556 (regs->nip < (opal.base + opal.size)))
55672ecf
MS
557 recover_addr = find_recovery_address(regs->nip);
558
559 /*
560 * Setup regs->nip to rfi into fixup address.
561 */
562 if (recover_addr)
563 regs->nip = recover_addr;
564
565out:
566 return !!recover_addr;
567}
568
6f68b5e2
VH
569static int opal_sysfs_init(void)
570{
571 opal_kobj = kobject_create_and_add("opal", firmware_kobj);
572 if (!opal_kobj) {
573 pr_warn("kobject_create_and_add opal failed\n");
574 return -ENOMEM;
575 }
576
577 return 0;
578}
579
c8742f85
BH
580static ssize_t symbol_map_read(struct file *fp, struct kobject *kobj,
581 struct bin_attribute *bin_attr,
582 char *buf, loff_t off, size_t count)
583{
584 return memory_read_from_buffer(buf, count, &off, bin_attr->private,
585 bin_attr->size);
586}
587
588static BIN_ATTR_RO(symbol_map, 0);
589
590static void opal_export_symmap(void)
591{
592 const __be64 *syms;
593 unsigned int size;
594 struct device_node *fw;
595 int rc;
596
597 fw = of_find_node_by_path("/ibm,opal/firmware");
598 if (!fw)
599 return;
600 syms = of_get_property(fw, "symbol-map", &size);
601 if (!syms || size != 2 * sizeof(__be64))
602 return;
603
604 /* Setup attributes */
605 bin_attr_symbol_map.private = __va(be64_to_cpu(syms[0]));
606 bin_attr_symbol_map.size = be64_to_cpu(syms[1]);
607
608 rc = sysfs_create_bin_file(opal_kobj, &bin_attr_symbol_map);
609 if (rc)
610 pr_warn("Error %d creating OPAL symbols file\n", rc);
611}
612
11fe909d
MB
613static ssize_t export_attr_read(struct file *fp, struct kobject *kobj,
614 struct bin_attribute *bin_attr, char *buf,
615 loff_t off, size_t count)
616{
617 return memory_read_from_buffer(buf, count, &off, bin_attr->private,
618 bin_attr->size);
619}
620
621/*
622 * opal_export_attrs: creates a sysfs node for each property listed in
623 * the device-tree under /ibm,opal/firmware/exports/
624 * All new sysfs nodes are created under /opal/exports/.
625 * This allows for reserved memory regions (e.g. HDAT) to be read.
626 * The new sysfs nodes are only readable by root.
627 */
628static void opal_export_attrs(void)
629{
630 struct bin_attribute *attr;
631 struct device_node *np;
632 struct property *prop;
633 struct kobject *kobj;
634 u64 vals[2];
635 int rc;
636
637 np = of_find_node_by_path("/ibm,opal/firmware/exports");
638 if (!np)
639 return;
640
641 /* Create new 'exports' directory - /sys/firmware/opal/exports */
642 kobj = kobject_create_and_add("exports", opal_kobj);
643 if (!kobj) {
644 pr_warn("kobject_create_and_add() of exports failed\n");
645 return;
646 }
647
648 for_each_property_of_node(np, prop) {
649 if (!strcmp(prop->name, "name") || !strcmp(prop->name, "phandle"))
650 continue;
651
652 if (of_property_read_u64_array(np, prop->name, &vals[0], 2))
653 continue;
654
83c49190 655 attr = kzalloc(sizeof(*attr), GFP_KERNEL);
11fe909d
MB
656
657 if (attr == NULL) {
658 pr_warn("Failed kmalloc for bin_attribute!");
659 continue;
660 }
661
83c49190 662 sysfs_bin_attr_init(attr);
11fe909d
MB
663 attr->attr.name = kstrdup(prop->name, GFP_KERNEL);
664 attr->attr.mode = 0400;
665 attr->read = export_attr_read;
666 attr->private = __va(vals[0]);
667 attr->size = vals[1];
668
669 if (attr->attr.name == NULL) {
670 pr_warn("Failed kstrdup for bin_attribute attr.name");
671 kfree(attr);
672 continue;
673 }
674
675 rc = sysfs_create_bin_file(kobj, attr);
676 if (rc) {
677 pr_warn("Error %d creating OPAL sysfs exports/%s file\n",
678 rc, prop->name);
679 kfree(attr->attr.name);
680 kfree(attr);
681 }
682 }
683
684 of_node_put(np);
685}
686
b09c2ec4
VH
687static void __init opal_dump_region_init(void)
688{
689 void *addr;
690 uint64_t size;
691 int rc;
692
b962f5a4
SS
693 if (!opal_check_token(OPAL_REGISTER_DUMP_REGION))
694 return;
695
b09c2ec4
VH
696 /* Register kernel log buffer */
697 addr = log_buf_addr_get();
6501ab5e
PK
698 if (addr == NULL)
699 return;
700
b09c2ec4 701 size = log_buf_len_get();
6501ab5e
PK
702 if (size == 0)
703 return;
704
b09c2ec4
VH
705 rc = opal_register_dump_region(OPAL_DUMP_REGION_LOG_BUF,
706 __pa(addr), size);
707 /* Don't warn if this is just an older OPAL that doesn't
708 * know about that call
709 */
710 if (rc && rc != OPAL_UNSUPPORTED)
711 pr_warn("DUMP: Failed to register kernel log buffer. "
712 "rc = %d\n", rc);
713}
608b286d 714
9e4f51bd 715static void opal_pdev_init(const char *compatible)
ed59190e
CB
716{
717 struct device_node *np;
718
9e4f51bd 719 for_each_compatible_node(np, NULL, compatible)
47083450
NG
720 of_platform_device_create(np, NULL, NULL);
721}
722
3bf57561
BH
723static int kopald(void *unused)
724{
a203658b 725 unsigned long timeout = msecs_to_jiffies(opal_heartbeat) + 1;
9f0fd049
AP
726 __be64 events;
727
3bf57561
BH
728 set_freezable();
729 do {
730 try_to_freeze();
9f0fd049
AP
731 opal_poll_events(&events);
732 opal_handle_events(be64_to_cpu(events));
a203658b 733 schedule_timeout_interruptible(timeout);
3bf57561
BH
734 } while (!kthread_should_stop());
735
736 return 0;
737}
738
a203658b
BH
739void opal_wake_poller(void)
740{
741 if (kopald_tsk)
742 wake_up_process(kopald_tsk);
743}
744
3bf57561
BH
745static void opal_init_heartbeat(void)
746{
747 /* Old firwmware, we assume the HVC heartbeat is sufficient */
748 if (of_property_read_u32(opal_node, "ibm,heartbeat-ms",
749 &opal_heartbeat) != 0)
750 opal_heartbeat = 0;
751
752 if (opal_heartbeat)
a203658b 753 kopald_tsk = kthread_run(kopald, NULL, "kopald");
3bf57561
BH
754}
755
14a43e69
BH
756static int __init opal_init(void)
757{
c159b596 758 struct device_node *np, *consoles, *leds;
c1c3a526 759 int rc;
14a43e69
BH
760
761 opal_node = of_find_node_by_path("/ibm,opal");
762 if (!opal_node) {
08135139 763 pr_warn("Device node not found\n");
14a43e69
BH
764 return -ENODEV;
765 }
2db29d28
BH
766
767 /* Register OPAL consoles if any ports */
7261aafc 768 consoles = of_find_node_by_path("/ibm,opal/consoles");
2db29d28
BH
769 if (consoles) {
770 for_each_child_of_node(consoles, np) {
771 if (strcmp(np->name, "serial"))
772 continue;
773 of_platform_device_create(np, NULL, NULL);
774 }
775 of_node_put(consoles);
14a43e69 776 }
a125e092 777
96e023e7
AP
778 /* Initialise OPAL messaging system */
779 opal_message_init();
780
781 /* Initialise OPAL asynchronous completion interface */
782 opal_async_comp_init();
783
784 /* Initialise OPAL sensor interface */
785 opal_sensor_init();
786
787 /* Initialise OPAL hypervisor maintainence interrupt handling */
788 opal_hmi_handler_init();
789
47083450 790 /* Create i2c platform devices */
9e4f51bd 791 opal_pdev_init("ibm,opal-i2c");
47083450 792
3bf57561
BH
793 /* Setup a heatbeat thread if requested by OPAL */
794 opal_init_heartbeat();
795
c159b596
VH
796 /* Create leds platform devices */
797 leds = of_find_node_by_path("/ibm,opal/leds");
798 if (leds) {
799 of_platform_device_create(leds, "opal_leds", NULL);
800 of_node_put(leds);
801 }
802
9b4fffa1
AD
803 /* Initialise OPAL message log interface */
804 opal_msglog_init();
805
6f68b5e2
VH
806 /* Create "opal" kobject under /sys/firmware */
807 rc = opal_sysfs_init();
50bd6153 808 if (rc == 0) {
c8742f85
BH
809 /* Export symbol map to userspace */
810 opal_export_symmap();
b09c2ec4
VH
811 /* Setup dump region interface */
812 opal_dump_region_init();
774fea1a
SS
813 /* Setup error log interface */
814 rc = opal_elog_init();
50bd6153 815 /* Setup code update interface */
ed59190e 816 opal_flash_update_init();
c7e64b9c
SS
817 /* Setup platform dump extract interface */
818 opal_platform_dump_init();
4029cd66
NG
819 /* Setup system parameters interface */
820 opal_sys_param_init();
9b4fffa1
AD
821 /* Setup message log sysfs interface. */
822 opal_msglog_sysfs_init();
50bd6153 823 }
6f68b5e2 824
11fe909d
MB
825 /* Export all properties */
826 opal_export_attrs();
827
0d7cd855 828 /* Initialize platform devices: IPMI backend, PRD & flash interface */
9e4f51bd
JM
829 opal_pdev_init("ibm,opal-ipmi");
830 opal_pdev_init("ibm,opal-flash");
831 opal_pdev_init("ibm,opal-prd");
ed59190e 832
43a1dd9b 833 /* Initialise platform device: oppanel interface */
9e4f51bd 834 opal_pdev_init("ibm,opal-oppanel");
43a1dd9b 835
affddff6
RC
836 /* Initialise OPAL kmsg dumper for flushing console on panic */
837 opal_kmsg_init();
838
14a43e69
BH
839 return 0;
840}
b14726c5 841machine_subsys_initcall(powernv, opal_init);
73ed148a
BH
842
843void opal_shutdown(void)
844{
f7d98d18 845 long rc = OPAL_BUSY;
73ed148a 846
9f0fd049 847 opal_event_shutdown();
f7d98d18
VH
848
849 /*
850 * Then sync with OPAL which ensure anything that can
851 * potentially write to our memory has completed such
852 * as an ongoing dump retrieval
853 */
854 while (rc == OPAL_BUSY || rc == OPAL_BUSY_EVENT) {
855 rc = opal_sync_host_reboot();
856 if (rc == OPAL_BUSY)
857 opal_poll_events(NULL);
858 else
859 mdelay(10);
860 }
b09c2ec4
VH
861
862 /* Unregister memory dump region */
b962f5a4
SS
863 if (opal_check_token(OPAL_UNREGISTER_DUMP_REGION))
864 opal_unregister_dump_region(OPAL_DUMP_REGION_LOG_BUF);
73ed148a 865}
e28b05e7
JS
866
/* Export this so that test modules can use it */
EXPORT_SYMBOL_GPL(opal_invalid_call);
EXPORT_SYMBOL_GPL(opal_xscom_read);
EXPORT_SYMBOL_GPL(opal_xscom_write);
EXPORT_SYMBOL_GPL(opal_ipmi_send);
EXPORT_SYMBOL_GPL(opal_ipmi_recv);
EXPORT_SYMBOL_GPL(opal_flash_read);
EXPORT_SYMBOL_GPL(opal_flash_write);
EXPORT_SYMBOL_GPL(opal_flash_erase);
EXPORT_SYMBOL_GPL(opal_prd_msg);
3441f04b
AB
877
878/* Convert a region of vmalloc memory to an opal sg list */
879struct opal_sg_list *opal_vmalloc_to_sg_list(void *vmalloc_addr,
880 unsigned long vmalloc_size)
881{
882 struct opal_sg_list *sg, *first = NULL;
883 unsigned long i = 0;
884
885 sg = kzalloc(PAGE_SIZE, GFP_KERNEL);
886 if (!sg)
887 goto nomem;
888
889 first = sg;
890
891 while (vmalloc_size > 0) {
892 uint64_t data = vmalloc_to_pfn(vmalloc_addr) << PAGE_SHIFT;
893 uint64_t length = min(vmalloc_size, PAGE_SIZE);
894
895 sg->entry[i].data = cpu_to_be64(data);
896 sg->entry[i].length = cpu_to_be64(length);
897 i++;
898
899 if (i >= SG_ENTRIES_PER_NODE) {
900 struct opal_sg_list *next;
901
902 next = kzalloc(PAGE_SIZE, GFP_KERNEL);
903 if (!next)
904 goto nomem;
905
906 sg->length = cpu_to_be64(
907 i * sizeof(struct opal_sg_entry) + 16);
908 i = 0;
909 sg->next = cpu_to_be64(__pa(next));
910 sg = next;
911 }
912
913 vmalloc_addr += length;
914 vmalloc_size -= length;
915 }
916
917 sg->length = cpu_to_be64(i * sizeof(struct opal_sg_entry) + 16);
918
919 return first;
920
921nomem:
922 pr_err("%s : Failed to allocate memory\n", __func__);
923 opal_free_sg_list(first);
924 return NULL;
925}
926
927void opal_free_sg_list(struct opal_sg_list *sg)
928{
929 while (sg) {
930 uint64_t next = be64_to_cpu(sg->next);
931
932 kfree(sg);
933
934 if (next)
935 sg = __va(next);
936 else
937 sg = NULL;
938 }
939}
16b1d26e 940
e3c5c2e0
CLG
941int opal_error_code(int rc)
942{
943 switch (rc) {
944 case OPAL_SUCCESS: return 0;
945
946 case OPAL_PARAMETER: return -EINVAL;
947 case OPAL_ASYNC_COMPLETION: return -EINPROGRESS;
948 case OPAL_BUSY_EVENT: return -EBUSY;
949 case OPAL_NO_MEM: return -ENOMEM;
14aae78f 950 case OPAL_PERMISSION: return -EPERM;
e3c5c2e0
CLG
951
952 case OPAL_UNSUPPORTED: return -EIO;
953 case OPAL_HARDWARE: return -EIO;
954 case OPAL_INTERNAL_ERROR: return -EIO;
955 default:
956 pr_err("%s: unexpected OPAL error %d\n", __func__, rc);
957 return -EIO;
958 }
959}
960
1d0761d2
AP
961void powernv_set_nmmu_ptcr(unsigned long ptcr)
962{
963 int rc;
964
965 if (firmware_has_feature(FW_FEATURE_OPAL)) {
966 rc = opal_nmmu_set_ptcr(-1UL, ptcr);
967 if (rc != OPAL_SUCCESS && rc != OPAL_UNSUPPORTED)
968 pr_warn("%s: Unable to set nest mmu ptcr\n", __func__);
969 }
970}
971
16b1d26e
NG
EXPORT_SYMBOL_GPL(opal_poll_events);
EXPORT_SYMBOL_GPL(opal_rtc_read);
EXPORT_SYMBOL_GPL(opal_rtc_write);
EXPORT_SYMBOL_GPL(opal_tpo_read);
EXPORT_SYMBOL_GPL(opal_tpo_write);
EXPORT_SYMBOL_GPL(opal_i2c_request);
/* Export these symbols for PowerNV LED class driver */
EXPORT_SYMBOL_GPL(opal_leds_get_ind);
EXPORT_SYMBOL_GPL(opal_leds_set_ind);
/* Export this symbol for PowerNV Operator Panel class driver */
EXPORT_SYMBOL_GPL(opal_write_oppanel_async);
/* Export this for KVM */
EXPORT_SYMBOL_GPL(opal_int_set_mfrr);
EXPORT_SYMBOL_GPL(opal_int_eoi);