Commit | Line | Data |
---|---|---|
14a43e69 BH |
1 | /* |
2 | * PowerNV OPAL high level interfaces | |
3 | * | |
4 | * Copyright 2011 IBM Corp. | |
5 | * | |
6 | * This program is free software; you can redistribute it and/or | |
7 | * modify it under the terms of the GNU General Public License | |
8 | * as published by the Free Software Foundation; either version | |
9 | * 2 of the License, or (at your option) any later version. | |
10 | */ | |
11 | ||
c8742f85 | 12 | #define pr_fmt(fmt) "opal: " fmt |
14a43e69 | 13 | |
c8742f85 | 14 | #include <linux/printk.h> |
14a43e69 BH |
15 | #include <linux/types.h> |
16 | #include <linux/of.h> | |
26a2056e | 17 | #include <linux/of_fdt.h> |
14a43e69 | 18 | #include <linux/of_platform.h> |
a125e092 | 19 | #include <linux/interrupt.h> |
1bc98de2 | 20 | #include <linux/notifier.h> |
73ed148a | 21 | #include <linux/slab.h> |
b63a0ffe | 22 | #include <linux/sched.h> |
6f68b5e2 | 23 | #include <linux/kobject.h> |
f7d98d18 | 24 | #include <linux/delay.h> |
55672ecf | 25 | #include <linux/memblock.h> |
3bf57561 BH |
26 | #include <linux/kthread.h> |
27 | #include <linux/freezer.h> | |
b14726c5 ME |
28 | |
29 | #include <asm/machdep.h> | |
14a43e69 BH |
30 | #include <asm/opal.h> |
31 | #include <asm/firmware.h> | |
36df96f8 | 32 | #include <asm/mce.h> |
14a43e69 BH |
33 | |
34 | #include "powernv.h" | |
35 | ||
6f68b5e2 VH |
36 | /* /sys/firmware/opal */ |
37 | struct kobject *opal_kobj; | |
38 | ||
14a43e69 BH |
39 | struct opal { |
40 | u64 base; | |
41 | u64 entry; | |
55672ecf | 42 | u64 size; |
14a43e69 BH |
43 | } opal; |
44 | ||
55672ecf MS |
45 | struct mcheck_recoverable_range { |
46 | u64 start_addr; | |
47 | u64 end_addr; | |
48 | u64 recover_addr; | |
49 | }; | |
50 | ||
51 | static struct mcheck_recoverable_range *mc_recoverable_range; | |
52 | static int mc_recoverable_range_len; | |
53 | ||
bfc36894 | 54 | struct device_node *opal_node; |
14a43e69 | 55 | static DEFINE_SPINLOCK(opal_write_lock); |
73ed148a BH |
56 | static unsigned int *opal_irqs; |
57 | static unsigned int opal_irq_count; | |
1bc98de2 | 58 | static ATOMIC_NOTIFIER_HEAD(opal_notifier_head); |
24366360 | 59 | static struct atomic_notifier_head opal_msg_notifier_head[OPAL_MSG_TYPE_MAX]; |
1bc98de2 GS |
60 | static DEFINE_SPINLOCK(opal_notifier_lock); |
61 | static uint64_t last_notified_mask = 0x0ul; | |
62 | static atomic_t opal_notifier_hold = ATOMIC_INIT(0); | |
3bf57561 | 63 | static uint32_t opal_heartbeat; |
14a43e69 | 64 | |
4926616c BH |
65 | static void opal_reinit_cores(void) |
66 | { | |
67 | /* Do the actual re-init, This will clobber all FPRs, VRs, etc... | |
68 | * | |
69 | * It will preserve non volatile GPRs and HSPRG0/1. It will | |
70 | * also restore HIDs and other SPRs to their original value | |
71 | * but it might clobber a bunch. | |
72 | */ | |
73 | #ifdef __BIG_ENDIAN__ | |
74 | opal_reinit_cpus(OPAL_REINIT_CPUS_HILE_BE); | |
75 | #else | |
76 | opal_reinit_cpus(OPAL_REINIT_CPUS_HILE_LE); | |
77 | #endif | |
78 | } | |
79 | ||
14a43e69 BH |
80 | int __init early_init_dt_scan_opal(unsigned long node, |
81 | const char *uname, int depth, void *data) | |
82 | { | |
55672ecf | 83 | const void *basep, *entryp, *sizep; |
9d0c4dfe | 84 | int basesz, entrysz, runtimesz; |
14a43e69 BH |
85 | |
86 | if (depth != 1 || strcmp(uname, "ibm,opal") != 0) | |
87 | return 0; | |
88 | ||
89 | basep = of_get_flat_dt_prop(node, "opal-base-address", &basesz); | |
90 | entryp = of_get_flat_dt_prop(node, "opal-entry-address", &entrysz); | |
55672ecf | 91 | sizep = of_get_flat_dt_prop(node, "opal-runtime-size", &runtimesz); |
14a43e69 | 92 | |
55672ecf | 93 | if (!basep || !entryp || !sizep) |
14a43e69 BH |
94 | return 1; |
95 | ||
96 | opal.base = of_read_number(basep, basesz/4); | |
97 | opal.entry = of_read_number(entryp, entrysz/4); | |
55672ecf | 98 | opal.size = of_read_number(sizep, runtimesz/4); |
14a43e69 | 99 | |
9d0c4dfe | 100 | pr_debug("OPAL Base = 0x%llx (basep=%p basesz=%d)\n", |
14a43e69 | 101 | opal.base, basep, basesz); |
9d0c4dfe | 102 | pr_debug("OPAL Entry = 0x%llx (entryp=%p basesz=%d)\n", |
14a43e69 | 103 | opal.entry, entryp, entrysz); |
9d0c4dfe | 104 | pr_debug("OPAL Entry = 0x%llx (sizep=%p runtimesz=%d)\n", |
55672ecf | 105 | opal.size, sizep, runtimesz); |
14a43e69 BH |
106 | |
107 | powerpc_firmware_features |= FW_FEATURE_OPAL; | |
75b93da4 BH |
108 | if (of_flat_dt_is_compatible(node, "ibm,opal-v3")) { |
109 | powerpc_firmware_features |= FW_FEATURE_OPALv2; | |
110 | powerpc_firmware_features |= FW_FEATURE_OPALv3; | |
9a4f5cd0 | 111 | pr_info("OPAL V3 detected !\n"); |
75b93da4 | 112 | } else if (of_flat_dt_is_compatible(node, "ibm,opal-v2")) { |
14a43e69 | 113 | powerpc_firmware_features |= FW_FEATURE_OPALv2; |
9a4f5cd0 | 114 | pr_info("OPAL V2 detected !\n"); |
14a43e69 | 115 | } else { |
9a4f5cd0 | 116 | pr_info("OPAL V1 detected !\n"); |
14a43e69 BH |
117 | } |
118 | ||
4926616c BH |
119 | /* Reinit all cores with the right endian */ |
120 | opal_reinit_cores(); | |
121 | ||
122 | /* Restore some bits */ | |
123 | if (cur_cpu_spec->cpu_restore) | |
124 | cur_cpu_spec->cpu_restore(); | |
125 | ||
c4463b37 JK |
126 | return 1; |
127 | } | |
128 | ||
55672ecf MS |
129 | int __init early_init_dt_scan_recoverable_ranges(unsigned long node, |
130 | const char *uname, int depth, void *data) | |
131 | { | |
9d0c4dfe | 132 | int i, psize, size; |
55672ecf MS |
133 | const __be32 *prop; |
134 | ||
135 | if (depth != 1 || strcmp(uname, "ibm,opal") != 0) | |
136 | return 0; | |
137 | ||
6e556b47 | 138 | prop = of_get_flat_dt_prop(node, "mcheck-recoverable-ranges", &psize); |
55672ecf MS |
139 | |
140 | if (!prop) | |
141 | return 1; | |
142 | ||
143 | pr_debug("Found machine check recoverable ranges.\n"); | |
144 | ||
6e556b47 MS |
145 | /* |
146 | * Calculate number of available entries. | |
147 | * | |
148 | * Each recoverable address range entry is (start address, len, | |
149 | * recovery address), 2 cells each for start and recovery address, | |
150 | * 1 cell for len, totalling 5 cells per entry. | |
151 | */ | |
152 | mc_recoverable_range_len = psize / (sizeof(*prop) * 5); | |
153 | ||
154 | /* Sanity check */ | |
155 | if (!mc_recoverable_range_len) | |
156 | return 1; | |
157 | ||
158 | /* Size required to hold all the entries. */ | |
159 | size = mc_recoverable_range_len * | |
160 | sizeof(struct mcheck_recoverable_range); | |
161 | ||
55672ecf MS |
162 | /* |
163 | * Allocate a buffer to hold the MC recoverable ranges. We would be | |
164 | * accessing them in real mode, hence it needs to be within | |
165 | * RMO region. | |
166 | */ | |
167 | mc_recoverable_range =__va(memblock_alloc_base(size, __alignof__(u64), | |
168 | ppc64_rma_size)); | |
169 | memset(mc_recoverable_range, 0, size); | |
170 | ||
6e556b47 | 171 | for (i = 0; i < mc_recoverable_range_len; i++) { |
55672ecf MS |
172 | mc_recoverable_range[i].start_addr = |
173 | of_read_number(prop + (i * 5) + 0, 2); | |
174 | mc_recoverable_range[i].end_addr = | |
175 | mc_recoverable_range[i].start_addr + | |
176 | of_read_number(prop + (i * 5) + 2, 1); | |
177 | mc_recoverable_range[i].recover_addr = | |
178 | of_read_number(prop + (i * 5) + 3, 2); | |
179 | ||
180 | pr_debug("Machine check recoverable range: %llx..%llx: %llx\n", | |
181 | mc_recoverable_range[i].start_addr, | |
182 | mc_recoverable_range[i].end_addr, | |
183 | mc_recoverable_range[i].recover_addr); | |
184 | } | |
55672ecf MS |
185 | return 1; |
186 | } | |
187 | ||
c4463b37 JK |
188 | static int __init opal_register_exception_handlers(void) |
189 | { | |
29186097 | 190 | #ifdef __BIG_ENDIAN__ |
c4463b37 JK |
191 | u64 glue; |
192 | ||
193 | if (!(powerpc_firmware_features & FW_FEATURE_OPAL)) | |
194 | return -ENODEV; | |
195 | ||
28446de2 MS |
196 | /* Hookup some exception handlers except machine check. We use the |
197 | * fwnmi area at 0x7000 to provide the glue space to OPAL | |
ed79ba9e BH |
198 | */ |
199 | glue = 0x7000; | |
6507955c MS |
200 | |
201 | /* | |
202 | * Check if we are running on newer firmware that exports | |
203 | * OPAL_HANDLE_HMI token. If yes, then don't ask OPAL to patch | |
204 | * the HMI interrupt and we catch it directly in Linux. | |
205 | * | |
206 | * For older firmware (i.e currently released POWER8 System Firmware | |
207 | * as of today <= SV810_087), we fallback to old behavior and let OPAL | |
208 | * patch the HMI vector and handle it inside OPAL firmware. | |
209 | * | |
210 | * For newer firmware (in development/yet to be released) we will | |
211 | * start catching/handling HMI directly in Linux. | |
212 | */ | |
213 | if (!opal_check_token(OPAL_HANDLE_HMI)) { | |
08135139 | 214 | pr_info("Old firmware detected, OPAL handles HMIs.\n"); |
6507955c MS |
215 | opal_register_exception_handler( |
216 | OPAL_HYPERVISOR_MAINTENANCE_HANDLER, | |
217 | 0, glue); | |
218 | glue += 128; | |
219 | } | |
220 | ||
ed79ba9e | 221 | opal_register_exception_handler(OPAL_SOFTPATCH_HANDLER, 0, glue); |
29186097 | 222 | #endif |
ed79ba9e | 223 | |
c4463b37 | 224 | return 0; |
14a43e69 | 225 | } |
b14726c5 | 226 | machine_early_initcall(powernv, opal_register_exception_handlers); |
c4463b37 | 227 | |
1bc98de2 GS |
228 | int opal_notifier_register(struct notifier_block *nb) |
229 | { | |
230 | if (!nb) { | |
231 | pr_warning("%s: Invalid argument (%p)\n", | |
232 | __func__, nb); | |
233 | return -EINVAL; | |
234 | } | |
235 | ||
236 | atomic_notifier_chain_register(&opal_notifier_head, nb); | |
237 | return 0; | |
238 | } | |
798af00c BH |
239 | EXPORT_SYMBOL_GPL(opal_notifier_register); |
240 | ||
241 | int opal_notifier_unregister(struct notifier_block *nb) | |
242 | { | |
243 | if (!nb) { | |
244 | pr_warning("%s: Invalid argument (%p)\n", | |
245 | __func__, nb); | |
246 | return -EINVAL; | |
247 | } | |
248 | ||
249 | atomic_notifier_chain_unregister(&opal_notifier_head, nb); | |
250 | return 0; | |
251 | } | |
252 | EXPORT_SYMBOL_GPL(opal_notifier_unregister); | |
1bc98de2 GS |
253 | |
254 | static void opal_do_notifier(uint64_t events) | |
255 | { | |
256 | unsigned long flags; | |
257 | uint64_t changed_mask; | |
258 | ||
259 | if (atomic_read(&opal_notifier_hold)) | |
260 | return; | |
261 | ||
262 | spin_lock_irqsave(&opal_notifier_lock, flags); | |
263 | changed_mask = last_notified_mask ^ events; | |
264 | last_notified_mask = events; | |
265 | spin_unlock_irqrestore(&opal_notifier_lock, flags); | |
266 | ||
267 | /* | |
268 | * We feed with the event bits and changed bits for | |
269 | * enough information to the callback. | |
270 | */ | |
271 | atomic_notifier_call_chain(&opal_notifier_head, | |
272 | events, (void *)changed_mask); | |
273 | } | |
274 | ||
275 | void opal_notifier_update_evt(uint64_t evt_mask, | |
276 | uint64_t evt_val) | |
277 | { | |
278 | unsigned long flags; | |
279 | ||
280 | spin_lock_irqsave(&opal_notifier_lock, flags); | |
281 | last_notified_mask &= ~evt_mask; | |
282 | last_notified_mask |= evt_val; | |
283 | spin_unlock_irqrestore(&opal_notifier_lock, flags); | |
284 | } | |
285 | ||
286 | void opal_notifier_enable(void) | |
287 | { | |
288 | int64_t rc; | |
56b4c993 | 289 | __be64 evt = 0; |
1bc98de2 GS |
290 | |
291 | atomic_set(&opal_notifier_hold, 0); | |
292 | ||
293 | /* Process pending events */ | |
294 | rc = opal_poll_events(&evt); | |
295 | if (rc == OPAL_SUCCESS && evt) | |
56b4c993 | 296 | opal_do_notifier(be64_to_cpu(evt)); |
1bc98de2 GS |
297 | } |
298 | ||
299 | void opal_notifier_disable(void) | |
300 | { | |
301 | atomic_set(&opal_notifier_hold, 1); | |
302 | } | |
303 | ||
24366360 MS |
304 | /* |
305 | * Opal message notifier based on message type. Allow subscribers to get | |
306 | * notified for specific messgae type. | |
307 | */ | |
d7cf83fc | 308 | int opal_message_notifier_register(enum opal_msg_type msg_type, |
24366360 MS |
309 | struct notifier_block *nb) |
310 | { | |
792f96e9 NG |
311 | if (!nb || msg_type >= OPAL_MSG_TYPE_MAX) { |
312 | pr_warning("%s: Invalid arguments, msg_type:%d\n", | |
24366360 MS |
313 | __func__, msg_type); |
314 | return -EINVAL; | |
315 | } | |
792f96e9 | 316 | |
24366360 MS |
317 | return atomic_notifier_chain_register( |
318 | &opal_msg_notifier_head[msg_type], nb); | |
319 | } | |
320 | ||
df60f576 | 321 | int opal_message_notifier_unregister(enum opal_msg_type msg_type, |
b921e902 NG |
322 | struct notifier_block *nb) |
323 | { | |
324 | return atomic_notifier_chain_unregister( | |
325 | &opal_msg_notifier_head[msg_type], nb); | |
326 | } | |
327 | ||
24366360 MS |
328 | static void opal_message_do_notify(uint32_t msg_type, void *msg) |
329 | { | |
330 | /* notify subscribers */ | |
331 | atomic_notifier_call_chain(&opal_msg_notifier_head[msg_type], | |
332 | msg_type, msg); | |
333 | } | |
334 | ||
335 | static void opal_handle_message(void) | |
336 | { | |
337 | s64 ret; | |
338 | /* | |
339 | * TODO: pre-allocate a message buffer depending on opal-msg-size | |
340 | * value in /proc/device-tree. | |
341 | */ | |
342 | static struct opal_msg msg; | |
bb4398e1 | 343 | u32 type; |
24366360 MS |
344 | |
345 | ret = opal_get_msg(__pa(&msg), sizeof(msg)); | |
346 | /* No opal message pending. */ | |
347 | if (ret == OPAL_RESOURCE) | |
348 | return; | |
349 | ||
350 | /* check for errors. */ | |
351 | if (ret) { | |
1a84db56 | 352 | pr_warning("%s: Failed to retrieve opal message, err=%lld\n", |
24366360 MS |
353 | __func__, ret); |
354 | return; | |
355 | } | |
356 | ||
bb4398e1 AB |
357 | type = be32_to_cpu(msg.msg_type); |
358 | ||
24366360 | 359 | /* Sanity check */ |
792f96e9 | 360 | if (type >= OPAL_MSG_TYPE_MAX) { |
bb4398e1 | 361 | pr_warning("%s: Unknown message type: %u\n", __func__, type); |
24366360 MS |
362 | return; |
363 | } | |
bb4398e1 | 364 | opal_message_do_notify(type, (void *)&msg); |
24366360 MS |
365 | } |
366 | ||
367 | static int opal_message_notify(struct notifier_block *nb, | |
368 | unsigned long events, void *change) | |
369 | { | |
370 | if (events & OPAL_EVENT_MSG_PENDING) | |
371 | opal_handle_message(); | |
372 | return 0; | |
373 | } | |
374 | ||
375 | static struct notifier_block opal_message_nb = { | |
376 | .notifier_call = opal_message_notify, | |
377 | .next = NULL, | |
378 | .priority = 0, | |
379 | }; | |
380 | ||
381 | static int __init opal_message_init(void) | |
382 | { | |
383 | int ret, i; | |
384 | ||
385 | for (i = 0; i < OPAL_MSG_TYPE_MAX; i++) | |
386 | ATOMIC_INIT_NOTIFIER_HEAD(&opal_msg_notifier_head[i]); | |
387 | ||
388 | ret = opal_notifier_register(&opal_message_nb); | |
389 | if (ret) { | |
390 | pr_err("%s: Can't register OPAL event notifier (%d)\n", | |
391 | __func__, ret); | |
392 | return ret; | |
393 | } | |
394 | return 0; | |
395 | } | |
b14726c5 | 396 | machine_early_initcall(powernv, opal_message_init); |
24366360 | 397 | |
14a43e69 BH |
398 | int opal_get_chars(uint32_t vtermno, char *buf, int count) |
399 | { | |
4f89363b BH |
400 | s64 rc; |
401 | __be64 evt, len; | |
14a43e69 BH |
402 | |
403 | if (!opal.entry) | |
daea1175 | 404 | return -ENODEV; |
14a43e69 | 405 | opal_poll_events(&evt); |
4f89363b | 406 | if ((be64_to_cpu(evt) & OPAL_EVENT_CONSOLE_INPUT) == 0) |
14a43e69 | 407 | return 0; |
4f89363b | 408 | len = cpu_to_be64(count); |
9d0c4dfe | 409 | rc = opal_console_read(vtermno, &len, buf); |
14a43e69 | 410 | if (rc == OPAL_SUCCESS) |
4f89363b | 411 | return be64_to_cpu(len); |
14a43e69 BH |
412 | return 0; |
413 | } | |
414 | ||
415 | int opal_put_chars(uint32_t vtermno, const char *data, int total_len) | |
416 | { | |
417 | int written = 0; | |
4f89363b | 418 | __be64 olen; |
daea1175 | 419 | s64 len, rc; |
14a43e69 | 420 | unsigned long flags; |
4f89363b | 421 | __be64 evt; |
14a43e69 BH |
422 | |
423 | if (!opal.entry) | |
daea1175 | 424 | return -ENODEV; |
14a43e69 BH |
425 | |
426 | /* We want put_chars to be atomic to avoid mangling of hvsi | |
427 | * packets. To do that, we first test for room and return | |
daea1175 BH |
428 | * -EAGAIN if there isn't enough. |
429 | * | |
430 | * Unfortunately, opal_console_write_buffer_space() doesn't | |
431 | * appear to work on opal v1, so we just assume there is | |
432 | * enough room and be done with it | |
14a43e69 BH |
433 | */ |
434 | spin_lock_irqsave(&opal_write_lock, flags); | |
daea1175 | 435 | if (firmware_has_feature(FW_FEATURE_OPALv2)) { |
4f89363b BH |
436 | rc = opal_console_write_buffer_space(vtermno, &olen); |
437 | len = be64_to_cpu(olen); | |
daea1175 BH |
438 | if (rc || len < total_len) { |
439 | spin_unlock_irqrestore(&opal_write_lock, flags); | |
440 | /* Closed -> drop characters */ | |
441 | if (rc) | |
442 | return total_len; | |
4f89363b | 443 | opal_poll_events(NULL); |
daea1175 BH |
444 | return -EAGAIN; |
445 | } | |
14a43e69 BH |
446 | } |
447 | ||
448 | /* We still try to handle partial completions, though they | |
449 | * should no longer happen. | |
450 | */ | |
daea1175 | 451 | rc = OPAL_BUSY; |
14a43e69 BH |
452 | while(total_len > 0 && (rc == OPAL_BUSY || |
453 | rc == OPAL_BUSY_EVENT || rc == OPAL_SUCCESS)) { | |
4f89363b BH |
454 | olen = cpu_to_be64(total_len); |
455 | rc = opal_console_write(vtermno, &olen, data); | |
456 | len = be64_to_cpu(olen); | |
1de1455f BH |
457 | |
458 | /* Closed or other error drop */ | |
459 | if (rc != OPAL_SUCCESS && rc != OPAL_BUSY && | |
460 | rc != OPAL_BUSY_EVENT) { | |
461 | written = total_len; | |
462 | break; | |
463 | } | |
14a43e69 BH |
464 | if (rc == OPAL_SUCCESS) { |
465 | total_len -= len; | |
466 | data += len; | |
467 | written += len; | |
468 | } | |
469 | /* This is a bit nasty but we need that for the console to | |
470 | * flush when there aren't any interrupts. We will clean | |
471 | * things a bit later to limit that to synchronous path | |
472 | * such as the kernel console and xmon/udbg | |
473 | */ | |
474 | do | |
475 | opal_poll_events(&evt); | |
4f89363b BH |
476 | while(rc == OPAL_SUCCESS && |
477 | (be64_to_cpu(evt) & OPAL_EVENT_CONSOLE_OUTPUT)); | |
14a43e69 BH |
478 | } |
479 | spin_unlock_irqrestore(&opal_write_lock, flags); | |
480 | return written; | |
481 | } | |
482 | ||
b63a0ffe MS |
483 | static int opal_recover_mce(struct pt_regs *regs, |
484 | struct machine_check_event *evt) | |
485 | { | |
486 | int recovered = 0; | |
487 | uint64_t ea = get_mce_fault_addr(evt); | |
488 | ||
489 | if (!(regs->msr & MSR_RI)) { | |
490 | /* If MSR_RI isn't set, we cannot recover */ | |
491 | recovered = 0; | |
492 | } else if (evt->disposition == MCE_DISPOSITION_RECOVERED) { | |
493 | /* Platform corrected itself */ | |
494 | recovered = 1; | |
495 | } else if (ea && !is_kernel_addr(ea)) { | |
496 | /* | |
497 | * Faulting address is not in kernel text. We should be fine. | |
498 | * We need to find which process uses this address. | |
499 | * For now, kill the task if we have received exception when | |
500 | * in userspace. | |
501 | * | |
502 | * TODO: Queue up this address for hwpoisioning later. | |
503 | */ | |
504 | if (user_mode(regs) && !is_global_init(current)) { | |
505 | _exception(SIGBUS, regs, BUS_MCEERR_AR, regs->nip); | |
506 | recovered = 1; | |
507 | } else | |
508 | recovered = 0; | |
509 | } else if (user_mode(regs) && !is_global_init(current) && | |
510 | evt->severity == MCE_SEV_ERROR_SYNC) { | |
511 | /* | |
512 | * If we have received a synchronous error when in userspace | |
513 | * kill the task. | |
514 | */ | |
515 | _exception(SIGBUS, regs, BUS_MCEERR_AR, regs->nip); | |
516 | recovered = 1; | |
517 | } | |
518 | return recovered; | |
519 | } | |
520 | ||
ed79ba9e BH |
521 | int opal_machine_check(struct pt_regs *regs) |
522 | { | |
36df96f8 | 523 | struct machine_check_event evt; |
ed79ba9e | 524 | |
36df96f8 MS |
525 | if (!get_mce_event(&evt, MCE_EVENT_RELEASE)) |
526 | return 0; | |
ed79ba9e BH |
527 | |
528 | /* Print things out */ | |
36df96f8 | 529 | if (evt.version != MCE_V1) { |
ed79ba9e BH |
530 | pr_err("Machine Check Exception, Unknown event version %d !\n", |
531 | evt.version); | |
532 | return 0; | |
533 | } | |
b5ff4211 | 534 | machine_check_print_event_info(&evt); |
ed79ba9e | 535 | |
b63a0ffe MS |
536 | if (opal_recover_mce(regs, &evt)) |
537 | return 1; | |
538 | return 0; | |
ed79ba9e BH |
539 | } |
540 | ||
0869b6fd MS |
541 | /* Early hmi handler called in real mode. */ |
542 | int opal_hmi_exception_early(struct pt_regs *regs) | |
543 | { | |
0ef95b41 MS |
544 | s64 rc; |
545 | ||
546 | /* | |
547 | * call opal hmi handler. Pass paca address as token. | |
548 | * The return value OPAL_SUCCESS is an indication that there is | |
549 | * an HMI event generated waiting to pull by Linux. | |
550 | */ | |
551 | rc = opal_handle_hmi(); | |
552 | if (rc == OPAL_SUCCESS) { | |
553 | local_paca->hmi_event_available = 1; | |
554 | return 1; | |
555 | } | |
0869b6fd MS |
556 | return 0; |
557 | } | |
558 | ||
559 | /* HMI exception handler called in virtual mode during check_irq_replay. */ | |
560 | int opal_handle_hmi_exception(struct pt_regs *regs) | |
561 | { | |
0ef95b41 MS |
562 | s64 rc; |
563 | __be64 evt = 0; | |
564 | ||
565 | /* | |
566 | * Check if HMI event is available. | |
567 | * if Yes, then call opal_poll_events to pull opal messages and | |
568 | * process them. | |
569 | */ | |
570 | if (!local_paca->hmi_event_available) | |
571 | return 0; | |
572 | ||
573 | local_paca->hmi_event_available = 0; | |
574 | rc = opal_poll_events(&evt); | |
575 | if (rc == OPAL_SUCCESS && evt) | |
576 | opal_do_notifier(be64_to_cpu(evt)); | |
577 | ||
578 | return 1; | |
0869b6fd MS |
579 | } |
580 | ||
55672ecf MS |
581 | static uint64_t find_recovery_address(uint64_t nip) |
582 | { | |
583 | int i; | |
584 | ||
585 | for (i = 0; i < mc_recoverable_range_len; i++) | |
586 | if ((nip >= mc_recoverable_range[i].start_addr) && | |
587 | (nip < mc_recoverable_range[i].end_addr)) | |
588 | return mc_recoverable_range[i].recover_addr; | |
589 | return 0; | |
590 | } | |
591 | ||
592 | bool opal_mce_check_early_recovery(struct pt_regs *regs) | |
593 | { | |
594 | uint64_t recover_addr = 0; | |
595 | ||
596 | if (!opal.base || !opal.size) | |
597 | goto out; | |
598 | ||
599 | if ((regs->nip >= opal.base) && | |
600 | (regs->nip <= (opal.base + opal.size))) | |
601 | recover_addr = find_recovery_address(regs->nip); | |
602 | ||
603 | /* | |
604 | * Setup regs->nip to rfi into fixup address. | |
605 | */ | |
606 | if (recover_addr) | |
607 | regs->nip = recover_addr; | |
608 | ||
609 | out: | |
610 | return !!recover_addr; | |
611 | } | |
612 | ||
a125e092 BH |
613 | static irqreturn_t opal_interrupt(int irq, void *data) |
614 | { | |
5e4da530 | 615 | __be64 events; |
a125e092 BH |
616 | |
617 | opal_handle_interrupt(virq_to_hw(irq), &events); | |
618 | ||
56b4c993 | 619 | opal_do_notifier(be64_to_cpu(events)); |
a125e092 BH |
620 | |
621 | return IRQ_HANDLED; | |
622 | } | |
623 | ||
6f68b5e2 VH |
624 | static int opal_sysfs_init(void) |
625 | { | |
626 | opal_kobj = kobject_create_and_add("opal", firmware_kobj); | |
627 | if (!opal_kobj) { | |
628 | pr_warn("kobject_create_and_add opal failed\n"); | |
629 | return -ENOMEM; | |
630 | } | |
631 | ||
632 | return 0; | |
633 | } | |
634 | ||
c8742f85 BH |
635 | static ssize_t symbol_map_read(struct file *fp, struct kobject *kobj, |
636 | struct bin_attribute *bin_attr, | |
637 | char *buf, loff_t off, size_t count) | |
638 | { | |
639 | return memory_read_from_buffer(buf, count, &off, bin_attr->private, | |
640 | bin_attr->size); | |
641 | } | |
642 | ||
643 | static BIN_ATTR_RO(symbol_map, 0); | |
644 | ||
645 | static void opal_export_symmap(void) | |
646 | { | |
647 | const __be64 *syms; | |
648 | unsigned int size; | |
649 | struct device_node *fw; | |
650 | int rc; | |
651 | ||
652 | fw = of_find_node_by_path("/ibm,opal/firmware"); | |
653 | if (!fw) | |
654 | return; | |
655 | syms = of_get_property(fw, "symbol-map", &size); | |
656 | if (!syms || size != 2 * sizeof(__be64)) | |
657 | return; | |
658 | ||
659 | /* Setup attributes */ | |
660 | bin_attr_symbol_map.private = __va(be64_to_cpu(syms[0])); | |
661 | bin_attr_symbol_map.size = be64_to_cpu(syms[1]); | |
662 | ||
663 | rc = sysfs_create_bin_file(opal_kobj, &bin_attr_symbol_map); | |
664 | if (rc) | |
665 | pr_warn("Error %d creating OPAL symbols file\n", rc); | |
666 | } | |
667 | ||
b09c2ec4 VH |
668 | static void __init opal_dump_region_init(void) |
669 | { | |
670 | void *addr; | |
671 | uint64_t size; | |
672 | int rc; | |
673 | ||
b962f5a4 SS |
674 | if (!opal_check_token(OPAL_REGISTER_DUMP_REGION)) |
675 | return; | |
676 | ||
b09c2ec4 VH |
677 | /* Register kernel log buffer */ |
678 | addr = log_buf_addr_get(); | |
6501ab5e PK |
679 | if (addr == NULL) |
680 | return; | |
681 | ||
b09c2ec4 | 682 | size = log_buf_len_get(); |
6501ab5e PK |
683 | if (size == 0) |
684 | return; | |
685 | ||
b09c2ec4 VH |
686 | rc = opal_register_dump_region(OPAL_DUMP_REGION_LOG_BUF, |
687 | __pa(addr), size); | |
688 | /* Don't warn if this is just an older OPAL that doesn't | |
689 | * know about that call | |
690 | */ | |
691 | if (rc && rc != OPAL_UNSUPPORTED) | |
692 | pr_warn("DUMP: Failed to register kernel log buffer. " | |
693 | "rc = %d\n", rc); | |
694 | } | |
608b286d JK |
695 | |
696 | static void opal_ipmi_init(struct device_node *opal_node) | |
697 | { | |
698 | struct device_node *np; | |
699 | ||
700 | for_each_child_of_node(opal_node, np) | |
701 | if (of_device_is_compatible(np, "ibm,opal-ipmi")) | |
702 | of_platform_device_create(np, NULL, NULL); | |
703 | } | |
704 | ||
47083450 NG |
705 | static void opal_i2c_create_devs(void) |
706 | { | |
707 | struct device_node *np; | |
708 | ||
709 | for_each_compatible_node(np, NULL, "ibm,opal-i2c") | |
710 | of_platform_device_create(np, NULL, NULL); | |
711 | } | |
712 | ||
c1c3a526 GS |
713 | static void __init opal_irq_init(struct device_node *dn) |
714 | { | |
715 | const __be32 *irqs; | |
716 | int i, irqlen; | |
717 | ||
718 | /* Get interrupt property */ | |
719 | irqs = of_get_property(opal_node, "opal-interrupts", &irqlen); | |
31494cf3 GS |
720 | opal_irq_count = irqs ? (irqlen / 4) : 0; |
721 | pr_debug("Found %d interrupts reserved for OPAL\n", opal_irq_count); | |
722 | if (!opal_irq_count) | |
723 | return; | |
c1c3a526 GS |
724 | |
725 | /* Install interrupt handlers */ | |
c1c3a526 GS |
726 | opal_irqs = kzalloc(opal_irq_count * sizeof(unsigned int), GFP_KERNEL); |
727 | for (i = 0; irqs && i < opal_irq_count; i++, irqs++) { | |
728 | unsigned int irq, virq; | |
729 | int rc; | |
730 | ||
731 | /* Get hardware and virtual IRQ */ | |
732 | irq = be32_to_cpup(irqs); | |
733 | virq = irq_create_mapping(NULL, irq); | |
734 | if (virq == NO_IRQ) { | |
735 | pr_warn("Failed to map irq 0x%x\n", irq); | |
736 | continue; | |
737 | } | |
738 | ||
739 | /* Install interrupt handler */ | |
740 | rc = request_irq(virq, opal_interrupt, 0, "opal", NULL); | |
741 | if (rc) { | |
742 | irq_dispose_mapping(virq); | |
743 | pr_warn("Error %d requesting irq %d (0x%x)\n", | |
744 | rc, virq, irq); | |
745 | continue; | |
746 | } | |
747 | ||
748 | /* Cache IRQ */ | |
749 | opal_irqs[i] = virq; | |
750 | } | |
751 | } | |
752 | ||
3bf57561 BH |
753 | static int kopald(void *unused) |
754 | { | |
755 | set_freezable(); | |
756 | do { | |
757 | try_to_freeze(); | |
758 | opal_poll_events(NULL); | |
759 | msleep_interruptible(opal_heartbeat); | |
760 | } while (!kthread_should_stop()); | |
761 | ||
762 | return 0; | |
763 | } | |
764 | ||
765 | static void opal_init_heartbeat(void) | |
766 | { | |
767 | /* Old firwmware, we assume the HVC heartbeat is sufficient */ | |
768 | if (of_property_read_u32(opal_node, "ibm,heartbeat-ms", | |
769 | &opal_heartbeat) != 0) | |
770 | opal_heartbeat = 0; | |
771 | ||
772 | if (opal_heartbeat) | |
773 | kthread_run(kopald, NULL, "kopald"); | |
774 | } | |
775 | ||
14a43e69 BH |
776 | static int __init opal_init(void) |
777 | { | |
778 | struct device_node *np, *consoles; | |
c1c3a526 | 779 | int rc; |
14a43e69 BH |
780 | |
781 | opal_node = of_find_node_by_path("/ibm,opal"); | |
782 | if (!opal_node) { | |
08135139 | 783 | pr_warn("Device node not found\n"); |
14a43e69 BH |
784 | return -ENODEV; |
785 | } | |
2db29d28 BH |
786 | |
787 | /* Register OPAL consoles if any ports */ | |
14a43e69 BH |
788 | if (firmware_has_feature(FW_FEATURE_OPALv2)) |
789 | consoles = of_find_node_by_path("/ibm,opal/consoles"); | |
790 | else | |
791 | consoles = of_node_get(opal_node); | |
2db29d28 BH |
792 | if (consoles) { |
793 | for_each_child_of_node(consoles, np) { | |
794 | if (strcmp(np->name, "serial")) | |
795 | continue; | |
796 | of_platform_device_create(np, NULL, NULL); | |
797 | } | |
798 | of_node_put(consoles); | |
14a43e69 | 799 | } |
a125e092 | 800 | |
47083450 NG |
801 | /* Create i2c platform devices */ |
802 | opal_i2c_create_devs(); | |
803 | ||
3bf57561 BH |
804 | /* Setup a heatbeat thread if requested by OPAL */ |
805 | opal_init_heartbeat(); | |
806 | ||
a125e092 | 807 | /* Find all OPAL interrupts and request them */ |
c1c3a526 | 808 | opal_irq_init(opal_node); |
6f68b5e2 VH |
809 | |
810 | /* Create "opal" kobject under /sys/firmware */ | |
811 | rc = opal_sysfs_init(); | |
50bd6153 | 812 | if (rc == 0) { |
c8742f85 BH |
813 | /* Export symbol map to userspace */ |
814 | opal_export_symmap(); | |
b09c2ec4 VH |
815 | /* Setup dump region interface */ |
816 | opal_dump_region_init(); | |
774fea1a SS |
817 | /* Setup error log interface */ |
818 | rc = opal_elog_init(); | |
50bd6153 VH |
819 | /* Setup code update interface */ |
820 | opal_flash_init(); | |
c7e64b9c SS |
821 | /* Setup platform dump extract interface */ |
822 | opal_platform_dump_init(); | |
4029cd66 NG |
823 | /* Setup system parameters interface */ |
824 | opal_sys_param_init(); | |
bfc36894 JS |
825 | /* Setup message log interface. */ |
826 | opal_msglog_init(); | |
50bd6153 | 827 | } |
6f68b5e2 | 828 | |
3bf57561 | 829 | /* Initialize OPAL IPMI backend */ |
608b286d JK |
830 | opal_ipmi_init(opal_node); |
831 | ||
14a43e69 BH |
832 | return 0; |
833 | } | |
b14726c5 | 834 | machine_subsys_initcall(powernv, opal_init); |
73ed148a BH |
835 | |
836 | void opal_shutdown(void) | |
837 | { | |
838 | unsigned int i; | |
f7d98d18 | 839 | long rc = OPAL_BUSY; |
73ed148a | 840 | |
f7d98d18 | 841 | /* First free interrupts, which will also mask them */ |
73ed148a BH |
842 | for (i = 0; i < opal_irq_count; i++) { |
843 | if (opal_irqs[i]) | |
b0d436c7 | 844 | free_irq(opal_irqs[i], NULL); |
73ed148a BH |
845 | opal_irqs[i] = 0; |
846 | } | |
f7d98d18 VH |
847 | |
848 | /* | |
849 | * Then sync with OPAL which ensure anything that can | |
850 | * potentially write to our memory has completed such | |
851 | * as an ongoing dump retrieval | |
852 | */ | |
853 | while (rc == OPAL_BUSY || rc == OPAL_BUSY_EVENT) { | |
854 | rc = opal_sync_host_reboot(); | |
855 | if (rc == OPAL_BUSY) | |
856 | opal_poll_events(NULL); | |
857 | else | |
858 | mdelay(10); | |
859 | } | |
b09c2ec4 VH |
860 | |
861 | /* Unregister memory dump region */ | |
b962f5a4 SS |
862 | if (opal_check_token(OPAL_UNREGISTER_DUMP_REGION)) |
863 | opal_unregister_dump_region(OPAL_DUMP_REGION_LOG_BUF); | |
73ed148a | 864 | } |
e28b05e7 JS |
865 | |
866 | /* Export this so that test modules can use it */ | |
867 | EXPORT_SYMBOL_GPL(opal_invalid_call); | |
608b286d JK |
868 | EXPORT_SYMBOL_GPL(opal_ipmi_send); |
869 | EXPORT_SYMBOL_GPL(opal_ipmi_recv); | |
3441f04b AB |
870 | |
871 | /* Convert a region of vmalloc memory to an opal sg list */ | |
872 | struct opal_sg_list *opal_vmalloc_to_sg_list(void *vmalloc_addr, | |
873 | unsigned long vmalloc_size) | |
874 | { | |
875 | struct opal_sg_list *sg, *first = NULL; | |
876 | unsigned long i = 0; | |
877 | ||
878 | sg = kzalloc(PAGE_SIZE, GFP_KERNEL); | |
879 | if (!sg) | |
880 | goto nomem; | |
881 | ||
882 | first = sg; | |
883 | ||
884 | while (vmalloc_size > 0) { | |
885 | uint64_t data = vmalloc_to_pfn(vmalloc_addr) << PAGE_SHIFT; | |
886 | uint64_t length = min(vmalloc_size, PAGE_SIZE); | |
887 | ||
888 | sg->entry[i].data = cpu_to_be64(data); | |
889 | sg->entry[i].length = cpu_to_be64(length); | |
890 | i++; | |
891 | ||
892 | if (i >= SG_ENTRIES_PER_NODE) { | |
893 | struct opal_sg_list *next; | |
894 | ||
895 | next = kzalloc(PAGE_SIZE, GFP_KERNEL); | |
896 | if (!next) | |
897 | goto nomem; | |
898 | ||
899 | sg->length = cpu_to_be64( | |
900 | i * sizeof(struct opal_sg_entry) + 16); | |
901 | i = 0; | |
902 | sg->next = cpu_to_be64(__pa(next)); | |
903 | sg = next; | |
904 | } | |
905 | ||
906 | vmalloc_addr += length; | |
907 | vmalloc_size -= length; | |
908 | } | |
909 | ||
910 | sg->length = cpu_to_be64(i * sizeof(struct opal_sg_entry) + 16); | |
911 | ||
912 | return first; | |
913 | ||
914 | nomem: | |
915 | pr_err("%s : Failed to allocate memory\n", __func__); | |
916 | opal_free_sg_list(first); | |
917 | return NULL; | |
918 | } | |
919 | ||
920 | void opal_free_sg_list(struct opal_sg_list *sg) | |
921 | { | |
922 | while (sg) { | |
923 | uint64_t next = be64_to_cpu(sg->next); | |
924 | ||
925 | kfree(sg); | |
926 | ||
927 | if (next) | |
928 | sg = __va(next); | |
929 | else | |
930 | sg = NULL; | |
931 | } | |
932 | } | |
16b1d26e NG |
933 | |
934 | EXPORT_SYMBOL_GPL(opal_poll_events); | |
935 | EXPORT_SYMBOL_GPL(opal_rtc_read); | |
936 | EXPORT_SYMBOL_GPL(opal_rtc_write); | |
937 | EXPORT_SYMBOL_GPL(opal_tpo_read); | |
938 | EXPORT_SYMBOL_GPL(opal_tpo_write); | |
47083450 | 939 | EXPORT_SYMBOL_GPL(opal_i2c_request); |