]>
Commit | Line | Data |
---|---|---|
d334a491 HY |
1 | /* |
2 | * APEI Generic Hardware Error Source support | |
3 | * | |
4 | * Generic Hardware Error Source provides a way to report platform | |
5 | * hardware errors (such as that from chipset). It works in so called | |
6 | * "Firmware First" mode, that is, hardware errors are reported to | |
7 | * firmware firstly, then reported to Linux by firmware. This way, | |
8 | * some non-standard hardware error registers or non-standard hardware | |
9 | * link can be checked by firmware to produce more hardware error | |
10 | * information for Linux. | |
11 | * | |
12 | * For more information about Generic Hardware Error Source, please | |
13 | * refer to ACPI Specification version 4.0, section 17.3.2.6 | |
14 | * | |
67eb2e99 | 15 | * Copyright 2010,2011 Intel Corp. |
d334a491 HY |
16 | * Author: Huang Ying <ying.huang@intel.com> |
17 | * | |
18 | * This program is free software; you can redistribute it and/or | |
19 | * modify it under the terms of the GNU General Public License version | |
20 | * 2 as published by the Free Software Foundation; | |
21 | * | |
22 | * This program is distributed in the hope that it will be useful, | |
23 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
24 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
25 | * GNU General Public License for more details. | |
26 | * | |
27 | * You should have received a copy of the GNU General Public License | |
28 | * along with this program; if not, write to the Free Software | |
29 | * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA | |
30 | */ | |
31 | ||
32 | #include <linux/kernel.h> | |
33 | #include <linux/module.h> | |
34 | #include <linux/init.h> | |
35 | #include <linux/acpi.h> | |
36 | #include <linux/io.h> | |
37 | #include <linux/interrupt.h> | |
81e88fdc | 38 | #include <linux/timer.h> |
d334a491 HY |
39 | #include <linux/cper.h> |
40 | #include <linux/kdebug.h> | |
7ad6e943 HY |
41 | #include <linux/platform_device.h> |
42 | #include <linux/mutex.h> | |
32c361f5 | 43 | #include <linux/ratelimit.h> |
81e88fdc | 44 | #include <linux/vmalloc.h> |
67eb2e99 HY |
45 | #include <linux/irq_work.h> |
46 | #include <linux/llist.h> | |
47 | #include <linux/genalloc.h> | |
a654e5ee HY |
48 | #include <linux/pci.h> |
49 | #include <linux/aer.h> | |
44a69f61 | 50 | #include <linux/nmi.h> |
40e06415 MCC |
51 | |
52 | #include <acpi/ghes.h> | |
9dae3d0d | 53 | #include <acpi/apei.h> |
81e88fdc | 54 | #include <asm/tlbflush.h> |
d334a491 HY |
55 | |
56 | #include "apei-internal.h" | |
57 | ||
58 | #define GHES_PFX "GHES: " | |
59 | ||
60 | #define GHES_ESTATUS_MAX_SIZE 65536 | |
67eb2e99 HY |
61 | #define GHES_ESOURCE_PREALLOC_MAX_SIZE 65536 |
62 | ||
63 | #define GHES_ESTATUS_POOL_MIN_ALLOC_ORDER 3 | |
64 | ||
152cef40 HY |
65 | /* This is just an estimation for memory pool allocation */ |
66 | #define GHES_ESTATUS_CACHE_AVG_SIZE 512 | |
67 | ||
68 | #define GHES_ESTATUS_CACHES_SIZE 4 | |
69 | ||
70cb6e1d | 70 | #define GHES_ESTATUS_IN_CACHE_MAX_NSEC 10000000000ULL |
152cef40 HY |
71 | /* Prevent too many caches from being allocated because of RCU */ |
72 | #define GHES_ESTATUS_CACHE_ALLOCED_MAX (GHES_ESTATUS_CACHES_SIZE * 3 / 2) | |
73 | ||
74 | #define GHES_ESTATUS_CACHE_LEN(estatus_len) \ | |
75 | (sizeof(struct ghes_estatus_cache) + (estatus_len)) | |
76 | #define GHES_ESTATUS_FROM_CACHE(estatus_cache) \ | |
0a00fd5e | 77 | ((struct acpi_hest_generic_status *) \ |
152cef40 HY |
78 | ((struct ghes_estatus_cache *)(estatus_cache) + 1)) |
79 | ||
67eb2e99 HY |
80 | #define GHES_ESTATUS_NODE_LEN(estatus_len) \ |
81 | (sizeof(struct ghes_estatus_node) + (estatus_len)) | |
88f074f4 | 82 | #define GHES_ESTATUS_FROM_NODE(estatus_node) \ |
0a00fd5e | 83 | ((struct acpi_hest_generic_status *) \ |
67eb2e99 | 84 | ((struct ghes_estatus_node *)(estatus_node) + 1)) |
d334a491 | 85 | |
90ab5ee9 | 86 | bool ghes_disable; |
b6a95016 HY |
87 | module_param_named(disable, ghes_disable, bool, 0); |
88 | ||
d334a491 | 89 | /* |
81e88fdc HY |
90 | * All error sources notified with SCI share one notifier function, |
91 | * so they need to be linked and checked one by one. This is applied | |
92 | * to NMI too. | |
d334a491 | 93 | * |
81e88fdc HY |
94 | * RCU is used for these lists, so ghes_list_mutex is only used for |
95 | * list changing, not for traversing. | |
d334a491 HY |
96 | */ |
97 | static LIST_HEAD(ghes_sci); | |
7ad6e943 | 98 | static DEFINE_MUTEX(ghes_list_mutex); |
d334a491 | 99 | |
81e88fdc HY |
100 | /* |
101 | * The memory area used to transfer hardware error information from | |
102 | * BIOS to Linux can be determined only in an NMI, IRQ or timer | |
103 | * handler, and the general ioremap cannot be used in atomic context, | |
104 | * so a special atomic version of ioremap is implemented for that. | |
105 | */ | |
106 | ||
107 | /* | |
594c7255 TN |
108 | * Two virtual pages are used, one for IRQ/PROCESS context, the other for |
109 | * NMI context (optionally). | |
81e88fdc | 110 | */ |
594c7255 TN |
111 | #ifdef CONFIG_HAVE_ACPI_APEI_NMI |
112 | #define GHES_IOREMAP_PAGES 2 | |
113 | #else | |
114 | #define GHES_IOREMAP_PAGES 1 | |
115 | #endif | |
116 | #define GHES_IOREMAP_IRQ_PAGE(base) (base) | |
117 | #define GHES_IOREMAP_NMI_PAGE(base) ((base) + PAGE_SIZE) | |
81e88fdc HY |
118 | |
119 | /* virtual memory area for atomic ioremap */ | |
120 | static struct vm_struct *ghes_ioremap_area; | |
121 | /* | |
122 | * These two spinlocks prevent the atomic ioremap virtual memory | |
123 | * area from being mapped simultaneously. | |
124 | */ | |
125 | static DEFINE_RAW_SPINLOCK(ghes_ioremap_lock_nmi); | |
126 | static DEFINE_SPINLOCK(ghes_ioremap_lock_irq); | |
127 | ||
67eb2e99 HY |
128 | static struct gen_pool *ghes_estatus_pool; |
129 | static unsigned long ghes_estatus_pool_size_request; | |
67eb2e99 | 130 | |
8f7c31f6 | 131 | static struct ghes_estatus_cache *ghes_estatus_caches[GHES_ESTATUS_CACHES_SIZE]; |
152cef40 HY |
132 | static atomic_t ghes_estatus_cache_alloced; |
133 | ||
81e88fdc HY |
134 | static int ghes_ioremap_init(void) |
135 | { | |
136 | ghes_ioremap_area = __get_vm_area(PAGE_SIZE * GHES_IOREMAP_PAGES, | |
137 | VM_IOREMAP, VMALLOC_START, VMALLOC_END); | |
138 | if (!ghes_ioremap_area) { | |
139 | pr_err(GHES_PFX "Failed to allocate virtual memory area for atomic ioremap.\n"); | |
140 | return -ENOMEM; | |
141 | } | |
142 | ||
143 | return 0; | |
144 | } | |
145 | ||
146 | static void ghes_ioremap_exit(void) | |
147 | { | |
148 | free_vm_area(ghes_ioremap_area); | |
149 | } | |
150 | ||
151 | static void __iomem *ghes_ioremap_pfn_nmi(u64 pfn) | |
152 | { | |
153 | unsigned long vaddr; | |
154 | ||
155 | vaddr = (unsigned long)GHES_IOREMAP_NMI_PAGE(ghes_ioremap_area->addr); | |
156 | ioremap_page_range(vaddr, vaddr + PAGE_SIZE, | |
157 | pfn << PAGE_SHIFT, PAGE_KERNEL); | |
158 | ||
159 | return (void __iomem *)vaddr; | |
160 | } | |
161 | ||
162 | static void __iomem *ghes_ioremap_pfn_irq(u64 pfn) | |
163 | { | |
164 | unsigned long vaddr; | |
165 | ||
166 | vaddr = (unsigned long)GHES_IOREMAP_IRQ_PAGE(ghes_ioremap_area->addr); | |
167 | ioremap_page_range(vaddr, vaddr + PAGE_SIZE, | |
168 | pfn << PAGE_SHIFT, PAGE_KERNEL); | |
169 | ||
170 | return (void __iomem *)vaddr; | |
171 | } | |
172 | ||
173 | static void ghes_iounmap_nmi(void __iomem *vaddr_ptr) | |
174 | { | |
175 | unsigned long vaddr = (unsigned long __force)vaddr_ptr; | |
176 | void *base = ghes_ioremap_area->addr; | |
177 | ||
178 | BUG_ON(vaddr != (unsigned long)GHES_IOREMAP_NMI_PAGE(base)); | |
179 | unmap_kernel_range_noflush(vaddr, PAGE_SIZE); | |
594c7255 | 180 | arch_apei_flush_tlb_one(vaddr); |
81e88fdc HY |
181 | } |
182 | ||
183 | static void ghes_iounmap_irq(void __iomem *vaddr_ptr) | |
184 | { | |
185 | unsigned long vaddr = (unsigned long __force)vaddr_ptr; | |
186 | void *base = ghes_ioremap_area->addr; | |
187 | ||
188 | BUG_ON(vaddr != (unsigned long)GHES_IOREMAP_IRQ_PAGE(base)); | |
189 | unmap_kernel_range_noflush(vaddr, PAGE_SIZE); | |
594c7255 | 190 | arch_apei_flush_tlb_one(vaddr); |
81e88fdc HY |
191 | } |
192 | ||
67eb2e99 HY |
193 | static int ghes_estatus_pool_init(void) |
194 | { | |
195 | ghes_estatus_pool = gen_pool_create(GHES_ESTATUS_POOL_MIN_ALLOC_ORDER, -1); | |
196 | if (!ghes_estatus_pool) | |
197 | return -ENOMEM; | |
198 | return 0; | |
199 | } | |
200 | ||
201 | static void ghes_estatus_pool_free_chunk_page(struct gen_pool *pool, | |
202 | struct gen_pool_chunk *chunk, | |
203 | void *data) | |
204 | { | |
205 | free_page(chunk->start_addr); | |
206 | } | |
207 | ||
208 | static void ghes_estatus_pool_exit(void) | |
209 | { | |
210 | gen_pool_for_each_chunk(ghes_estatus_pool, | |
211 | ghes_estatus_pool_free_chunk_page, NULL); | |
212 | gen_pool_destroy(ghes_estatus_pool); | |
213 | } | |
214 | ||
215 | static int ghes_estatus_pool_expand(unsigned long len) | |
216 | { | |
217 | unsigned long i, pages, size, addr; | |
218 | int ret; | |
219 | ||
220 | ghes_estatus_pool_size_request += PAGE_ALIGN(len); | |
221 | size = gen_pool_size(ghes_estatus_pool); | |
222 | if (size >= ghes_estatus_pool_size_request) | |
223 | return 0; | |
224 | pages = (ghes_estatus_pool_size_request - size) / PAGE_SIZE; | |
225 | for (i = 0; i < pages; i++) { | |
226 | addr = __get_free_page(GFP_KERNEL); | |
227 | if (!addr) | |
228 | return -ENOMEM; | |
229 | ret = gen_pool_add(ghes_estatus_pool, addr, PAGE_SIZE, -1); | |
230 | if (ret) | |
231 | return ret; | |
232 | } | |
233 | ||
234 | return 0; | |
235 | } | |
236 | ||
d334a491 HY |
237 | static struct ghes *ghes_new(struct acpi_hest_generic *generic) |
238 | { | |
239 | struct ghes *ghes; | |
240 | unsigned int error_block_length; | |
241 | int rc; | |
242 | ||
243 | ghes = kzalloc(sizeof(*ghes), GFP_KERNEL); | |
244 | if (!ghes) | |
245 | return ERR_PTR(-ENOMEM); | |
246 | ghes->generic = generic; | |
34ddeb03 | 247 | rc = apei_map_generic_address(&generic->error_status_address); |
d334a491 HY |
248 | if (rc) |
249 | goto err_free; | |
250 | error_block_length = generic->error_block_length; | |
251 | if (error_block_length > GHES_ESTATUS_MAX_SIZE) { | |
252 | pr_warning(FW_WARN GHES_PFX | |
253 | "Error status block length is too long: %u for " | |
254 | "generic hardware error source: %d.\n", | |
255 | error_block_length, generic->header.source_id); | |
256 | error_block_length = GHES_ESTATUS_MAX_SIZE; | |
257 | } | |
258 | ghes->estatus = kmalloc(error_block_length, GFP_KERNEL); | |
259 | if (!ghes->estatus) { | |
260 | rc = -ENOMEM; | |
261 | goto err_unmap; | |
262 | } | |
263 | ||
264 | return ghes; | |
265 | ||
266 | err_unmap: | |
34ddeb03 | 267 | apei_unmap_generic_address(&generic->error_status_address); |
d334a491 HY |
268 | err_free: |
269 | kfree(ghes); | |
270 | return ERR_PTR(rc); | |
271 | } | |
272 | ||
273 | static void ghes_fini(struct ghes *ghes) | |
274 | { | |
275 | kfree(ghes->estatus); | |
34ddeb03 | 276 | apei_unmap_generic_address(&ghes->generic->error_status_address); |
d334a491 HY |
277 | } |
278 | ||
d334a491 HY |
279 | static inline int ghes_severity(int severity) |
280 | { | |
281 | switch (severity) { | |
ad4ecef2 HY |
282 | case CPER_SEV_INFORMATIONAL: |
283 | return GHES_SEV_NO; | |
284 | case CPER_SEV_CORRECTED: | |
285 | return GHES_SEV_CORRECTED; | |
286 | case CPER_SEV_RECOVERABLE: | |
287 | return GHES_SEV_RECOVERABLE; | |
288 | case CPER_SEV_FATAL: | |
289 | return GHES_SEV_PANIC; | |
d334a491 | 290 | default: |
25985edc | 291 | /* Unknown, go panic */ |
ad4ecef2 | 292 | return GHES_SEV_PANIC; |
d334a491 HY |
293 | } |
294 | } | |
295 | ||
81e88fdc HY |
296 | static void ghes_copy_tofrom_phys(void *buffer, u64 paddr, u32 len, |
297 | int from_phys) | |
d334a491 | 298 | { |
81e88fdc HY |
299 | void __iomem *vaddr; |
300 | unsigned long flags = 0; | |
301 | int in_nmi = in_nmi(); | |
302 | u64 offset; | |
303 | u32 trunk; | |
304 | ||
305 | while (len > 0) { | |
306 | offset = paddr - (paddr & PAGE_MASK); | |
307 | if (in_nmi) { | |
308 | raw_spin_lock(&ghes_ioremap_lock_nmi); | |
309 | vaddr = ghes_ioremap_pfn_nmi(paddr >> PAGE_SHIFT); | |
310 | } else { | |
311 | spin_lock_irqsave(&ghes_ioremap_lock_irq, flags); | |
312 | vaddr = ghes_ioremap_pfn_irq(paddr >> PAGE_SHIFT); | |
313 | } | |
314 | trunk = PAGE_SIZE - offset; | |
315 | trunk = min(trunk, len); | |
316 | if (from_phys) | |
317 | memcpy_fromio(buffer, vaddr + offset, trunk); | |
318 | else | |
319 | memcpy_toio(vaddr + offset, buffer, trunk); | |
320 | len -= trunk; | |
321 | paddr += trunk; | |
322 | buffer += trunk; | |
323 | if (in_nmi) { | |
324 | ghes_iounmap_nmi(vaddr); | |
325 | raw_spin_unlock(&ghes_ioremap_lock_nmi); | |
326 | } else { | |
327 | ghes_iounmap_irq(vaddr); | |
328 | spin_unlock_irqrestore(&ghes_ioremap_lock_irq, flags); | |
329 | } | |
330 | } | |
d334a491 HY |
331 | } |
332 | ||
333 | static int ghes_read_estatus(struct ghes *ghes, int silent) | |
334 | { | |
335 | struct acpi_hest_generic *g = ghes->generic; | |
336 | u64 buf_paddr; | |
337 | u32 len; | |
338 | int rc; | |
339 | ||
700130b4 | 340 | rc = apei_read(&buf_paddr, &g->error_status_address); |
d334a491 HY |
341 | if (rc) { |
342 | if (!silent && printk_ratelimit()) | |
343 | pr_warning(FW_WARN GHES_PFX | |
344 | "Failed to read error status block address for hardware error source: %d.\n", | |
345 | g->header.source_id); | |
346 | return -EIO; | |
347 | } | |
348 | if (!buf_paddr) | |
349 | return -ENOENT; | |
350 | ||
81e88fdc HY |
351 | ghes_copy_tofrom_phys(ghes->estatus, buf_paddr, |
352 | sizeof(*ghes->estatus), 1); | |
d334a491 HY |
353 | if (!ghes->estatus->block_status) |
354 | return -ENOENT; | |
355 | ||
356 | ghes->buffer_paddr = buf_paddr; | |
357 | ghes->flags |= GHES_TO_CLEAR; | |
358 | ||
359 | rc = -EIO; | |
88f074f4 | 360 | len = cper_estatus_len(ghes->estatus); |
d334a491 HY |
361 | if (len < sizeof(*ghes->estatus)) |
362 | goto err_read_block; | |
363 | if (len > ghes->generic->error_block_length) | |
364 | goto err_read_block; | |
88f074f4 | 365 | if (cper_estatus_check_header(ghes->estatus)) |
d334a491 | 366 | goto err_read_block; |
81e88fdc HY |
367 | ghes_copy_tofrom_phys(ghes->estatus + 1, |
368 | buf_paddr + sizeof(*ghes->estatus), | |
369 | len - sizeof(*ghes->estatus), 1); | |
88f074f4 | 370 | if (cper_estatus_check(ghes->estatus)) |
d334a491 HY |
371 | goto err_read_block; |
372 | rc = 0; | |
373 | ||
374 | err_read_block: | |
81e88fdc | 375 | if (rc && !silent && printk_ratelimit()) |
d334a491 HY |
376 | pr_warning(FW_WARN GHES_PFX |
377 | "Failed to read error status block!\n"); | |
378 | return rc; | |
379 | } | |
380 | ||
381 | static void ghes_clear_estatus(struct ghes *ghes) | |
382 | { | |
383 | ghes->estatus->block_status = 0; | |
384 | if (!(ghes->flags & GHES_TO_CLEAR)) | |
385 | return; | |
386 | ghes_copy_tofrom_phys(ghes->estatus, ghes->buffer_paddr, | |
387 | sizeof(ghes->estatus->block_status), 0); | |
388 | ghes->flags &= ~GHES_TO_CLEAR; | |
389 | } | |
390 | ||
/*
 * Queue memory-failure handling for the memory error section @gdata.
 *
 * @sev: GHES severity of the enclosing error status block.
 *
 * Does nothing unless CONFIG_ACPI_APEI_MEMORY_FAILURE is set, the section
 * carries a valid physical address, and that address maps to a valid pfn.
 * Only two cases are queued:
 *  - corrected section with CPER_SEC_ERROR_THRESHOLD_EXCEEDED set
 *    (queued with MF_SOFT_OFFLINE);
 *  - block and section both recoverable (queued with flags 0).
 */
static void ghes_handle_memory_failure(struct acpi_hest_generic_data *gdata, int sev)
{
#ifdef CONFIG_ACPI_APEI_MEMORY_FAILURE
	struct cper_sec_mem_err *mem_err;
	unsigned long pfn;
	int mf_flags = -1;	/* -1: nothing to queue */
	int sec_sev;

	sec_sev = ghes_severity(gdata->error_severity);
	mem_err = (struct cper_sec_mem_err *)(gdata + 1);

	if (!(mem_err->validation_bits & CPER_MEM_VALID_PA))
		return;

	pfn = mem_err->physical_addr >> PAGE_SHIFT;
	if (!pfn_valid(pfn)) {
		pr_warn_ratelimited(FW_WARN GHES_PFX
		"Invalid address in generic error data: %#llx\n",
		mem_err->physical_addr);
		return;
	}

	if (sec_sev == GHES_SEV_CORRECTED &&
	    (gdata->flags & CPER_SEC_ERROR_THRESHOLD_EXCEEDED))
		mf_flags = MF_SOFT_OFFLINE;
	if (sev == GHES_SEV_RECOVERABLE && sec_sev == GHES_SEV_RECOVERABLE)
		mf_flags = 0;

	if (mf_flags == -1)
		return;

	memory_failure_queue(pfn, 0, mf_flags);
#endif
}
422 | ||
21480547 | 423 | static void ghes_do_proc(struct ghes *ghes, |
0a00fd5e | 424 | const struct acpi_hest_generic_status *estatus) |
d334a491 | 425 | { |
ba61ca4a | 426 | int sev, sec_sev; |
0a00fd5e | 427 | struct acpi_hest_generic_data *gdata; |
d334a491 | 428 | |
67eb2e99 HY |
429 | sev = ghes_severity(estatus->error_severity); |
430 | apei_estatus_for_each_section(estatus, gdata) { | |
ba61ca4a | 431 | sec_sev = ghes_severity(gdata->error_severity); |
d334a491 HY |
432 | if (!uuid_le_cmp(*(uuid_le *)gdata->section_type, |
433 | CPER_SEC_PLATFORM_MEM)) { | |
ba61ca4a HY |
434 | struct cper_sec_mem_err *mem_err; |
435 | mem_err = (struct cper_sec_mem_err *)(gdata+1); | |
21480547 MCC |
436 | ghes_edac_report_mem_error(ghes, sev, mem_err); |
437 | ||
9dae3d0d | 438 | arch_apei_report_mem_error(sev, mem_err); |
cf870c70 | 439 | ghes_handle_memory_failure(gdata, sev); |
ba61ca4a | 440 | } |
a654e5ee HY |
441 | #ifdef CONFIG_ACPI_APEI_PCIEAER |
442 | else if (!uuid_le_cmp(*(uuid_le *)gdata->section_type, | |
443 | CPER_SEC_PCIE)) { | |
444 | struct cper_sec_pcie *pcie_err; | |
445 | pcie_err = (struct cper_sec_pcie *)(gdata+1); | |
446 | if (sev == GHES_SEV_RECOVERABLE && | |
447 | sec_sev == GHES_SEV_RECOVERABLE && | |
448 | pcie_err->validation_bits & CPER_PCIE_VALID_DEVICE_ID && | |
449 | pcie_err->validation_bits & CPER_PCIE_VALID_AER_INFO) { | |
450 | unsigned int devfn; | |
451 | int aer_severity; | |
0ba98ec9 | 452 | |
a654e5ee HY |
453 | devfn = PCI_DEVFN(pcie_err->device_id.device, |
454 | pcie_err->device_id.function); | |
455 | aer_severity = cper_severity_to_aer(sev); | |
0ba98ec9 BD |
456 | |
457 | /* | |
458 | * If firmware reset the component to contain | |
459 | * the error, we must reinitialize it before | |
460 | * use, so treat it as a fatal AER error. | |
461 | */ | |
462 | if (gdata->flags & CPER_SEC_RESET) | |
463 | aer_severity = AER_FATAL; | |
464 | ||
a654e5ee HY |
465 | aer_recover_queue(pcie_err->device_id.segment, |
466 | pcie_err->device_id.bus, | |
37448adf LO |
467 | devfn, aer_severity, |
468 | (struct aer_capability_regs *) | |
469 | pcie_err->aer_info); | |
a654e5ee HY |
470 | } |
471 | ||
472 | } | |
473 | #endif | |
d334a491 | 474 | } |
32c361f5 | 475 | } |
d334a491 | 476 | |
67eb2e99 HY |
477 | static void __ghes_print_estatus(const char *pfx, |
478 | const struct acpi_hest_generic *generic, | |
0a00fd5e | 479 | const struct acpi_hest_generic_status *estatus) |
32c361f5 | 480 | { |
5ba82ab5 HY |
481 | static atomic_t seqno; |
482 | unsigned int curr_seqno; | |
483 | char pfx_seq[64]; | |
484 | ||
32c361f5 | 485 | if (pfx == NULL) { |
67eb2e99 | 486 | if (ghes_severity(estatus->error_severity) <= |
32c361f5 | 487 | GHES_SEV_CORRECTED) |
5ba82ab5 | 488 | pfx = KERN_WARNING; |
32c361f5 | 489 | else |
5ba82ab5 | 490 | pfx = KERN_ERR; |
32c361f5 | 491 | } |
5ba82ab5 HY |
492 | curr_seqno = atomic_inc_return(&seqno); |
493 | snprintf(pfx_seq, sizeof(pfx_seq), "%s{%u}" HW_ERR, pfx, curr_seqno); | |
5588340d | 494 | printk("%s""Hardware error from APEI Generic Hardware Error Source: %d\n", |
5ba82ab5 | 495 | pfx_seq, generic->header.source_id); |
88f074f4 | 496 | cper_estatus_print(pfx_seq, estatus); |
5588340d HY |
497 | } |
498 | ||
152cef40 HY |
499 | static int ghes_print_estatus(const char *pfx, |
500 | const struct acpi_hest_generic *generic, | |
0a00fd5e | 501 | const struct acpi_hest_generic_status *estatus) |
5588340d HY |
502 | { |
503 | /* Not more than 2 messages every 5 seconds */ | |
67eb2e99 HY |
504 | static DEFINE_RATELIMIT_STATE(ratelimit_corrected, 5*HZ, 2); |
505 | static DEFINE_RATELIMIT_STATE(ratelimit_uncorrected, 5*HZ, 2); | |
506 | struct ratelimit_state *ratelimit; | |
5588340d | 507 | |
67eb2e99 HY |
508 | if (ghes_severity(estatus->error_severity) <= GHES_SEV_CORRECTED) |
509 | ratelimit = &ratelimit_corrected; | |
510 | else | |
511 | ratelimit = &ratelimit_uncorrected; | |
152cef40 | 512 | if (__ratelimit(ratelimit)) { |
67eb2e99 | 513 | __ghes_print_estatus(pfx, generic, estatus); |
152cef40 HY |
514 | return 1; |
515 | } | |
516 | return 0; | |
517 | } | |
518 | ||
519 | /* | |
520 | * GHES error status reporting throttle, to report more kinds of | |
521 | * errors, instead of just most frequently occurred errors. | |
522 | */ | |
0a00fd5e | 523 | static int ghes_estatus_cached(struct acpi_hest_generic_status *estatus) |
152cef40 HY |
524 | { |
525 | u32 len; | |
526 | int i, cached = 0; | |
527 | unsigned long long now; | |
528 | struct ghes_estatus_cache *cache; | |
0a00fd5e | 529 | struct acpi_hest_generic_status *cache_estatus; |
152cef40 | 530 | |
88f074f4 | 531 | len = cper_estatus_len(estatus); |
152cef40 HY |
532 | rcu_read_lock(); |
533 | for (i = 0; i < GHES_ESTATUS_CACHES_SIZE; i++) { | |
534 | cache = rcu_dereference(ghes_estatus_caches[i]); | |
535 | if (cache == NULL) | |
536 | continue; | |
537 | if (len != cache->estatus_len) | |
538 | continue; | |
539 | cache_estatus = GHES_ESTATUS_FROM_CACHE(cache); | |
540 | if (memcmp(estatus, cache_estatus, len)) | |
541 | continue; | |
542 | atomic_inc(&cache->count); | |
543 | now = sched_clock(); | |
544 | if (now - cache->time_in < GHES_ESTATUS_IN_CACHE_MAX_NSEC) | |
545 | cached = 1; | |
546 | break; | |
547 | } | |
548 | rcu_read_unlock(); | |
549 | return cached; | |
550 | } | |
551 | ||
552 | static struct ghes_estatus_cache *ghes_estatus_cache_alloc( | |
553 | struct acpi_hest_generic *generic, | |
0a00fd5e | 554 | struct acpi_hest_generic_status *estatus) |
152cef40 HY |
555 | { |
556 | int alloced; | |
557 | u32 len, cache_len; | |
558 | struct ghes_estatus_cache *cache; | |
0a00fd5e | 559 | struct acpi_hest_generic_status *cache_estatus; |
152cef40 HY |
560 | |
561 | alloced = atomic_add_return(1, &ghes_estatus_cache_alloced); | |
562 | if (alloced > GHES_ESTATUS_CACHE_ALLOCED_MAX) { | |
563 | atomic_dec(&ghes_estatus_cache_alloced); | |
564 | return NULL; | |
565 | } | |
88f074f4 | 566 | len = cper_estatus_len(estatus); |
152cef40 HY |
567 | cache_len = GHES_ESTATUS_CACHE_LEN(len); |
568 | cache = (void *)gen_pool_alloc(ghes_estatus_pool, cache_len); | |
569 | if (!cache) { | |
570 | atomic_dec(&ghes_estatus_cache_alloced); | |
571 | return NULL; | |
572 | } | |
573 | cache_estatus = GHES_ESTATUS_FROM_CACHE(cache); | |
574 | memcpy(cache_estatus, estatus, len); | |
575 | cache->estatus_len = len; | |
576 | atomic_set(&cache->count, 0); | |
577 | cache->generic = generic; | |
578 | cache->time_in = sched_clock(); | |
579 | return cache; | |
580 | } | |
581 | ||
582 | static void ghes_estatus_cache_free(struct ghes_estatus_cache *cache) | |
583 | { | |
584 | u32 len; | |
585 | ||
88f074f4 | 586 | len = cper_estatus_len(GHES_ESTATUS_FROM_CACHE(cache)); |
152cef40 HY |
587 | len = GHES_ESTATUS_CACHE_LEN(len); |
588 | gen_pool_free(ghes_estatus_pool, (unsigned long)cache, len); | |
589 | atomic_dec(&ghes_estatus_cache_alloced); | |
590 | } | |
591 | ||
592 | static void ghes_estatus_cache_rcu_free(struct rcu_head *head) | |
593 | { | |
594 | struct ghes_estatus_cache *cache; | |
595 | ||
596 | cache = container_of(head, struct ghes_estatus_cache, rcu); | |
597 | ghes_estatus_cache_free(cache); | |
598 | } | |
599 | ||
600 | static void ghes_estatus_cache_add( | |
601 | struct acpi_hest_generic *generic, | |
0a00fd5e | 602 | struct acpi_hest_generic_status *estatus) |
152cef40 HY |
603 | { |
604 | int i, slot = -1, count; | |
605 | unsigned long long now, duration, period, max_period = 0; | |
606 | struct ghes_estatus_cache *cache, *slot_cache = NULL, *new_cache; | |
607 | ||
608 | new_cache = ghes_estatus_cache_alloc(generic, estatus); | |
609 | if (new_cache == NULL) | |
610 | return; | |
611 | rcu_read_lock(); | |
612 | now = sched_clock(); | |
613 | for (i = 0; i < GHES_ESTATUS_CACHES_SIZE; i++) { | |
614 | cache = rcu_dereference(ghes_estatus_caches[i]); | |
615 | if (cache == NULL) { | |
616 | slot = i; | |
617 | slot_cache = NULL; | |
618 | break; | |
619 | } | |
620 | duration = now - cache->time_in; | |
621 | if (duration >= GHES_ESTATUS_IN_CACHE_MAX_NSEC) { | |
622 | slot = i; | |
623 | slot_cache = cache; | |
624 | break; | |
625 | } | |
626 | count = atomic_read(&cache->count); | |
70cb6e1d LB |
627 | period = duration; |
628 | do_div(period, (count + 1)); | |
152cef40 HY |
629 | if (period > max_period) { |
630 | max_period = period; | |
631 | slot = i; | |
632 | slot_cache = cache; | |
633 | } | |
634 | } | |
635 | /* new_cache must be put into array after its contents are written */ | |
636 | smp_wmb(); | |
637 | if (slot != -1 && cmpxchg(ghes_estatus_caches + slot, | |
638 | slot_cache, new_cache) == slot_cache) { | |
639 | if (slot_cache) | |
640 | call_rcu(&slot_cache->rcu, ghes_estatus_cache_rcu_free); | |
641 | } else | |
642 | ghes_estatus_cache_free(new_cache); | |
643 | rcu_read_unlock(); | |
d334a491 HY |
644 | } |
645 | ||
646 | static int ghes_proc(struct ghes *ghes) | |
647 | { | |
648 | int rc; | |
649 | ||
650 | rc = ghes_read_estatus(ghes, 0); | |
651 | if (rc) | |
652 | goto out; | |
152cef40 HY |
653 | if (!ghes_estatus_cached(ghes->estatus)) { |
654 | if (ghes_print_estatus(NULL, ghes->generic, ghes->estatus)) | |
655 | ghes_estatus_cache_add(ghes->generic, ghes->estatus); | |
656 | } | |
21480547 | 657 | ghes_do_proc(ghes, ghes->estatus); |
d334a491 HY |
658 | out: |
659 | ghes_clear_estatus(ghes); | |
660 | return 0; | |
661 | } | |
662 | ||
81e88fdc HY |
663 | static void ghes_add_timer(struct ghes *ghes) |
664 | { | |
665 | struct acpi_hest_generic *g = ghes->generic; | |
666 | unsigned long expire; | |
667 | ||
668 | if (!g->notify.poll_interval) { | |
669 | pr_warning(FW_WARN GHES_PFX "Poll interval is 0 for generic hardware error source: %d, disabled.\n", | |
670 | g->header.source_id); | |
671 | return; | |
672 | } | |
673 | expire = jiffies + msecs_to_jiffies(g->notify.poll_interval); | |
674 | ghes->timer.expires = round_jiffies_relative(expire); | |
675 | add_timer(&ghes->timer); | |
676 | } | |
677 | ||
678 | static void ghes_poll_func(unsigned long data) | |
679 | { | |
680 | struct ghes *ghes = (void *)data; | |
681 | ||
682 | ghes_proc(ghes); | |
683 | if (!(ghes->flags & GHES_EXITING)) | |
684 | ghes_add_timer(ghes); | |
685 | } | |
686 | ||
687 | static irqreturn_t ghes_irq_func(int irq, void *data) | |
688 | { | |
689 | struct ghes *ghes = data; | |
690 | int rc; | |
691 | ||
692 | rc = ghes_proc(ghes); | |
693 | if (rc) | |
694 | return IRQ_NONE; | |
695 | ||
696 | return IRQ_HANDLED; | |
697 | } | |
698 | ||
d334a491 HY |
699 | static int ghes_notify_sci(struct notifier_block *this, |
700 | unsigned long event, void *data) | |
701 | { | |
702 | struct ghes *ghes; | |
703 | int ret = NOTIFY_DONE; | |
704 | ||
705 | rcu_read_lock(); | |
706 | list_for_each_entry_rcu(ghes, &ghes_sci, list) { | |
707 | if (!ghes_proc(ghes)) | |
708 | ret = NOTIFY_OK; | |
709 | } | |
710 | rcu_read_unlock(); | |
711 | ||
712 | return ret; | |
713 | } | |
714 | ||
44a69f61 TN |
715 | static struct notifier_block ghes_notifier_sci = { |
716 | .notifier_call = ghes_notify_sci, | |
717 | }; | |
718 | ||
719 | #ifdef CONFIG_HAVE_ACPI_APEI_NMI | |
720 | /* | |
721 | * printk is not safe in NMI context. So in NMI handler, we allocate | |
722 | * required memory from lock-less memory allocator | |
723 | * (ghes_estatus_pool), save estatus into it, put them into lock-less | |
724 | * list (ghes_estatus_llist), then delay printk into IRQ context via | |
725 | * irq_work (ghes_proc_irq_work). ghes_estatus_pool_size_request records | |
726 | * the pool size required by all NMI error sources. | |
727 | */ | |
728 | static struct llist_head ghes_estatus_llist; | |
729 | static struct irq_work ghes_proc_irq_work; | |
730 | ||
731 | /* | |
732 | * NMI may be triggered on any CPU, so ghes_nmi_lock is used for | |
733 | * mutual exclusion. | |
734 | */ | |
735 | static DEFINE_RAW_SPINLOCK(ghes_nmi_lock); | |
736 | ||
737 | static LIST_HEAD(ghes_nmi); | |
738 | ||
739 | static int ghes_panic_timeout __read_mostly = 30; | |
740 | ||
67eb2e99 HY |
741 | static void ghes_proc_in_irq(struct irq_work *irq_work) |
742 | { | |
46d12f0b | 743 | struct llist_node *llnode, *next; |
67eb2e99 | 744 | struct ghes_estatus_node *estatus_node; |
152cef40 | 745 | struct acpi_hest_generic *generic; |
0a00fd5e | 746 | struct acpi_hest_generic_status *estatus; |
67eb2e99 HY |
747 | u32 len, node_len; |
748 | ||
46d12f0b | 749 | llnode = llist_del_all(&ghes_estatus_llist); |
67eb2e99 HY |
750 | /* |
751 | * Because the time order of estatus in list is reversed, | |
752 | * revert it back to proper order. | |
753 | */ | |
8d21d4c9 | 754 | llnode = llist_reverse_order(llnode); |
67eb2e99 HY |
755 | while (llnode) { |
756 | next = llnode->next; | |
757 | estatus_node = llist_entry(llnode, struct ghes_estatus_node, | |
758 | llnode); | |
759 | estatus = GHES_ESTATUS_FROM_NODE(estatus_node); | |
88f074f4 | 760 | len = cper_estatus_len(estatus); |
67eb2e99 | 761 | node_len = GHES_ESTATUS_NODE_LEN(len); |
21480547 | 762 | ghes_do_proc(estatus_node->ghes, estatus); |
152cef40 HY |
763 | if (!ghes_estatus_cached(estatus)) { |
764 | generic = estatus_node->generic; | |
765 | if (ghes_print_estatus(NULL, generic, estatus)) | |
766 | ghes_estatus_cache_add(generic, estatus); | |
767 | } | |
67eb2e99 HY |
768 | gen_pool_free(ghes_estatus_pool, (unsigned long)estatus_node, |
769 | node_len); | |
770 | llnode = next; | |
771 | } | |
772 | } | |
773 | ||
46d12f0b HY |
774 | static void ghes_print_queued_estatus(void) |
775 | { | |
776 | struct llist_node *llnode; | |
777 | struct ghes_estatus_node *estatus_node; | |
778 | struct acpi_hest_generic *generic; | |
0a00fd5e | 779 | struct acpi_hest_generic_status *estatus; |
46d12f0b HY |
780 | u32 len, node_len; |
781 | ||
782 | llnode = llist_del_all(&ghes_estatus_llist); | |
783 | /* | |
784 | * Because the time order of estatus in list is reversed, | |
785 | * revert it back to proper order. | |
786 | */ | |
8d21d4c9 | 787 | llnode = llist_reverse_order(llnode); |
46d12f0b HY |
788 | while (llnode) { |
789 | estatus_node = llist_entry(llnode, struct ghes_estatus_node, | |
790 | llnode); | |
791 | estatus = GHES_ESTATUS_FROM_NODE(estatus_node); | |
88f074f4 | 792 | len = cper_estatus_len(estatus); |
46d12f0b HY |
793 | node_len = GHES_ESTATUS_NODE_LEN(len); |
794 | generic = estatus_node->generic; | |
795 | ghes_print_estatus(NULL, generic, estatus); | |
796 | llnode = llnode->next; | |
797 | } | |
798 | } | |
799 | ||
11568496 BP |
/*
 * Save estatus for further processing in IRQ context.
 *
 * Unless the estatus of @ghes is already cached, copy it into a node
 * allocated from the estatus pool and push the node onto
 * ghes_estatus_llist.  The estatus is silently dropped if the pool
 * allocation fails.  Compiles to nothing without
 * CONFIG_ARCH_HAVE_NMI_SAFE_CMPXCHG.
 */
static void __process_error(struct ghes *ghes)
{
#ifdef CONFIG_ARCH_HAVE_NMI_SAFE_CMPXCHG
	struct ghes_estatus_node *node;
	u32 payload_len;

	if (ghes_estatus_cached(ghes->estatus))
		return;

	payload_len = cper_estatus_len(ghes->estatus);

	node = (void *)gen_pool_alloc(ghes_estatus_pool,
				      GHES_ESTATUS_NODE_LEN(payload_len));
	if (node == NULL)
		return;

	node->ghes = ghes;
	node->generic = ghes->generic;
	memcpy(GHES_ESTATUS_FROM_NODE(node), ghes->estatus, payload_len);
	llist_add(&node->llnode, &ghes_estatus_llist);
#endif
}
825 | ||
e10be03f BP |
826 | static void __ghes_panic(struct ghes *ghes) |
827 | { | |
828 | oops_begin(); | |
829 | ghes_print_queued_estatus(); | |
830 | __ghes_print_estatus(KERN_EMERG, ghes->generic, ghes->estatus); | |
831 | ||
832 | /* reboot to log the error! */ | |
833 | if (panic_timeout == 0) | |
834 | panic_timeout = ghes_panic_timeout; | |
835 | panic("Fatal hardware error!"); | |
836 | } | |
837 | ||
9c48f1c6 | 838 | static int ghes_notify_nmi(unsigned int cmd, struct pt_regs *regs) |
81e88fdc HY |
839 | { |
840 | struct ghes *ghes, *ghes_global = NULL; | |
841 | int sev, sev_global = -1; | |
9c48f1c6 | 842 | int ret = NMI_DONE; |
81e88fdc HY |
843 | |
844 | raw_spin_lock(&ghes_nmi_lock); | |
845 | list_for_each_entry_rcu(ghes, &ghes_nmi, list) { | |
846 | if (ghes_read_estatus(ghes, 1)) { | |
847 | ghes_clear_estatus(ghes); | |
848 | continue; | |
849 | } | |
850 | sev = ghes_severity(ghes->estatus->error_severity); | |
851 | if (sev > sev_global) { | |
852 | sev_global = sev; | |
853 | ghes_global = ghes; | |
854 | } | |
9c48f1c6 | 855 | ret = NMI_HANDLED; |
81e88fdc HY |
856 | } |
857 | ||
9c48f1c6 | 858 | if (ret == NMI_DONE) |
81e88fdc HY |
859 | goto out; |
860 | ||
e10be03f BP |
861 | if (sev_global >= GHES_SEV_PANIC) |
862 | __ghes_panic(ghes_global); | |
81e88fdc HY |
863 | |
864 | list_for_each_entry_rcu(ghes, &ghes_nmi, list) { | |
865 | if (!(ghes->flags & GHES_TO_CLEAR)) | |
866 | continue; | |
11568496 BP |
867 | |
868 | __process_error(ghes); | |
81e88fdc HY |
869 | ghes_clear_estatus(ghes); |
870 | } | |
11568496 | 871 | |
67eb2e99 HY |
872 | #ifdef CONFIG_ARCH_HAVE_NMI_SAFE_CMPXCHG |
873 | irq_work_queue(&ghes_proc_irq_work); | |
874 | #endif | |
81e88fdc HY |
875 | |
876 | out: | |
877 | raw_spin_unlock(&ghes_nmi_lock); | |
878 | return ret; | |
879 | } | |
880 | ||
67eb2e99 HY |
881 | static unsigned long ghes_esource_prealloc_size( |
882 | const struct acpi_hest_generic *generic) | |
883 | { | |
884 | unsigned long block_length, prealloc_records, prealloc_size; | |
885 | ||
886 | block_length = min_t(unsigned long, generic->error_block_length, | |
887 | GHES_ESTATUS_MAX_SIZE); | |
888 | prealloc_records = max_t(unsigned long, | |
889 | generic->records_to_preallocate, 1); | |
890 | prealloc_size = min_t(unsigned long, block_length * prealloc_records, | |
891 | GHES_ESOURCE_PREALLOC_MAX_SIZE); | |
892 | ||
893 | return prealloc_size; | |
894 | } | |
895 | ||
44a69f61 TN |
896 | static void ghes_estatus_pool_shrink(unsigned long len) |
897 | { | |
898 | ghes_estatus_pool_size_request -= PAGE_ALIGN(len); | |
899 | } | |
900 | ||
901 | static void ghes_nmi_add(struct ghes *ghes) | |
902 | { | |
903 | unsigned long len; | |
904 | ||
905 | len = ghes_esource_prealloc_size(ghes->generic); | |
906 | ghes_estatus_pool_expand(len); | |
907 | mutex_lock(&ghes_list_mutex); | |
908 | if (list_empty(&ghes_nmi)) | |
909 | register_nmi_handler(NMI_LOCAL, ghes_notify_nmi, 0, "ghes"); | |
910 | list_add_rcu(&ghes->list, &ghes_nmi); | |
911 | mutex_unlock(&ghes_list_mutex); | |
912 | } | |
913 | ||
914 | static void ghes_nmi_remove(struct ghes *ghes) | |
915 | { | |
916 | unsigned long len; | |
917 | ||
918 | mutex_lock(&ghes_list_mutex); | |
919 | list_del_rcu(&ghes->list); | |
920 | if (list_empty(&ghes_nmi)) | |
921 | unregister_nmi_handler(NMI_LOCAL, "ghes"); | |
922 | mutex_unlock(&ghes_list_mutex); | |
923 | /* | |
924 | * To synchronize with NMI handler, ghes can only be | |
925 | * freed after NMI handler finishes. | |
926 | */ | |
927 | synchronize_rcu(); | |
928 | len = ghes_esource_prealloc_size(ghes->generic); | |
929 | ghes_estatus_pool_shrink(len); | |
930 | } | |
931 | ||
932 | static void ghes_nmi_init_cxt(void) | |
933 | { | |
934 | init_irq_work(&ghes_proc_irq_work, ghes_proc_in_irq); | |
935 | } | |
936 | #else /* CONFIG_HAVE_ACPI_APEI_NMI */ | |
937 | static inline void ghes_nmi_add(struct ghes *ghes) | |
938 | { | |
939 | pr_err(GHES_PFX "ID: %d, trying to add NMI notification which is not supported!\n", | |
940 | ghes->generic->header.source_id); | |
941 | BUG(); | |
942 | } | |
943 | ||
944 | static inline void ghes_nmi_remove(struct ghes *ghes) | |
945 | { | |
946 | pr_err(GHES_PFX "ID: %d, trying to remove NMI notification which is not supported!\n", | |
947 | ghes->generic->header.source_id); | |
948 | BUG(); | |
949 | } | |
950 | ||
/* Stub for builds without CONFIG_HAVE_ACPI_APEI_NMI: nothing to set up. */
static inline void ghes_nmi_init_cxt(void)
{
}
954 | #endif /* CONFIG_HAVE_ACPI_APEI_NMI */ | |
955 | ||
da095fd3 | 956 | static int ghes_probe(struct platform_device *ghes_dev) |
d334a491 HY |
957 | { |
958 | struct acpi_hest_generic *generic; | |
959 | struct ghes *ghes = NULL; | |
44a69f61 | 960 | |
7ad6e943 | 961 | int rc = -EINVAL; |
d334a491 | 962 | |
1dd6b20e | 963 | generic = *(struct acpi_hest_generic **)ghes_dev->dev.platform_data; |
d334a491 | 964 | if (!generic->enabled) |
7ad6e943 | 965 | return -ENODEV; |
d334a491 | 966 | |
81e88fdc HY |
967 | switch (generic->notify.type) { |
968 | case ACPI_HEST_NOTIFY_POLLED: | |
969 | case ACPI_HEST_NOTIFY_EXTERNAL: | |
970 | case ACPI_HEST_NOTIFY_SCI: | |
44a69f61 | 971 | break; |
81e88fdc | 972 | case ACPI_HEST_NOTIFY_NMI: |
44a69f61 TN |
973 | if (!IS_ENABLED(CONFIG_HAVE_ACPI_APEI_NMI)) { |
974 | pr_warn(GHES_PFX "Generic hardware error source: %d notified via NMI interrupt is not supported!\n", | |
975 | generic->header.source_id); | |
976 | goto err; | |
977 | } | |
81e88fdc HY |
978 | break; |
979 | case ACPI_HEST_NOTIFY_LOCAL: | |
980 | pr_warning(GHES_PFX "Generic hardware error source: %d notified via local interrupt is not supported!\n", | |
d334a491 HY |
981 | generic->header.source_id); |
982 | goto err; | |
81e88fdc HY |
983 | default: |
984 | pr_warning(FW_WARN GHES_PFX "Unknown notification type: %u for generic hardware error source: %d\n", | |
985 | generic->notify.type, generic->header.source_id); | |
986 | goto err; | |
d334a491 | 987 | } |
81e88fdc HY |
988 | |
989 | rc = -EIO; | |
990 | if (generic->error_block_length < | |
0a00fd5e | 991 | sizeof(struct acpi_hest_generic_status)) { |
81e88fdc HY |
992 | pr_warning(FW_BUG GHES_PFX "Invalid error block length: %u for generic hardware error source: %d\n", |
993 | generic->error_block_length, | |
d334a491 HY |
994 | generic->header.source_id); |
995 | goto err; | |
996 | } | |
997 | ghes = ghes_new(generic); | |
998 | if (IS_ERR(ghes)) { | |
999 | rc = PTR_ERR(ghes); | |
1000 | ghes = NULL; | |
1001 | goto err; | |
1002 | } | |
21480547 MCC |
1003 | |
1004 | rc = ghes_edac_register(ghes, &ghes_dev->dev); | |
1005 | if (rc < 0) | |
1006 | goto err; | |
1007 | ||
81e88fdc HY |
1008 | switch (generic->notify.type) { |
1009 | case ACPI_HEST_NOTIFY_POLLED: | |
1010 | ghes->timer.function = ghes_poll_func; | |
1011 | ghes->timer.data = (unsigned long)ghes; | |
1012 | init_timer_deferrable(&ghes->timer); | |
1013 | ghes_add_timer(ghes); | |
1014 | break; | |
1015 | case ACPI_HEST_NOTIFY_EXTERNAL: | |
1016 | /* External interrupt vector is GSI */ | |
a98d4f64 WY |
1017 | rc = acpi_gsi_to_irq(generic->notify.vector, &ghes->irq); |
1018 | if (rc) { | |
81e88fdc HY |
1019 | pr_err(GHES_PFX "Failed to map GSI to IRQ for generic hardware error source: %d\n", |
1020 | generic->header.source_id); | |
21480547 | 1021 | goto err_edac_unreg; |
81e88fdc | 1022 | } |
a98d4f64 WY |
1023 | rc = request_irq(ghes->irq, ghes_irq_func, 0, "GHES IRQ", ghes); |
1024 | if (rc) { | |
81e88fdc HY |
1025 | pr_err(GHES_PFX "Failed to register IRQ for generic hardware error source: %d\n", |
1026 | generic->header.source_id); | |
21480547 | 1027 | goto err_edac_unreg; |
81e88fdc HY |
1028 | } |
1029 | break; | |
1030 | case ACPI_HEST_NOTIFY_SCI: | |
7ad6e943 | 1031 | mutex_lock(&ghes_list_mutex); |
d334a491 HY |
1032 | if (list_empty(&ghes_sci)) |
1033 | register_acpi_hed_notifier(&ghes_notifier_sci); | |
1034 | list_add_rcu(&ghes->list, &ghes_sci); | |
7ad6e943 | 1035 | mutex_unlock(&ghes_list_mutex); |
81e88fdc HY |
1036 | break; |
1037 | case ACPI_HEST_NOTIFY_NMI: | |
44a69f61 | 1038 | ghes_nmi_add(ghes); |
81e88fdc HY |
1039 | break; |
1040 | default: | |
1041 | BUG(); | |
d334a491 | 1042 | } |
7ad6e943 | 1043 | platform_set_drvdata(ghes_dev, ghes); |
d334a491 HY |
1044 | |
1045 | return 0; | |
21480547 MCC |
1046 | err_edac_unreg: |
1047 | ghes_edac_unregister(ghes); | |
d334a491 | 1048 | err: |
7ad6e943 | 1049 | if (ghes) { |
d334a491 | 1050 | ghes_fini(ghes); |
7ad6e943 HY |
1051 | kfree(ghes); |
1052 | } | |
d334a491 HY |
1053 | return rc; |
1054 | } | |
1055 | ||
b59bc2fb | 1056 | static int ghes_remove(struct platform_device *ghes_dev) |
d334a491 | 1057 | { |
7ad6e943 HY |
1058 | struct ghes *ghes; |
1059 | struct acpi_hest_generic *generic; | |
d334a491 | 1060 | |
7ad6e943 HY |
1061 | ghes = platform_get_drvdata(ghes_dev); |
1062 | generic = ghes->generic; | |
1063 | ||
81e88fdc | 1064 | ghes->flags |= GHES_EXITING; |
7ad6e943 | 1065 | switch (generic->notify.type) { |
81e88fdc HY |
1066 | case ACPI_HEST_NOTIFY_POLLED: |
1067 | del_timer_sync(&ghes->timer); | |
1068 | break; | |
1069 | case ACPI_HEST_NOTIFY_EXTERNAL: | |
1070 | free_irq(ghes->irq, ghes); | |
1071 | break; | |
7ad6e943 HY |
1072 | case ACPI_HEST_NOTIFY_SCI: |
1073 | mutex_lock(&ghes_list_mutex); | |
1074 | list_del_rcu(&ghes->list); | |
1075 | if (list_empty(&ghes_sci)) | |
1076 | unregister_acpi_hed_notifier(&ghes_notifier_sci); | |
1077 | mutex_unlock(&ghes_list_mutex); | |
1078 | break; | |
81e88fdc | 1079 | case ACPI_HEST_NOTIFY_NMI: |
44a69f61 | 1080 | ghes_nmi_remove(ghes); |
81e88fdc | 1081 | break; |
7ad6e943 HY |
1082 | default: |
1083 | BUG(); | |
1084 | break; | |
1085 | } | |
d334a491 | 1086 | |
7ad6e943 | 1087 | ghes_fini(ghes); |
21480547 MCC |
1088 | |
1089 | ghes_edac_unregister(ghes); | |
1090 | ||
7ad6e943 | 1091 | kfree(ghes); |
d334a491 | 1092 | |
7ad6e943 HY |
1093 | platform_set_drvdata(ghes_dev, NULL); |
1094 | ||
1095 | return 0; | |
d334a491 HY |
1096 | } |
1097 | ||
7ad6e943 HY |
1098 | static struct platform_driver ghes_platform_driver = { |
1099 | .driver = { | |
1100 | .name = "GHES", | |
7ad6e943 HY |
1101 | }, |
1102 | .probe = ghes_probe, | |
1103 | .remove = ghes_remove, | |
1104 | }; | |
1105 | ||
d334a491 HY |
1106 | static int __init ghes_init(void) |
1107 | { | |
81e88fdc HY |
1108 | int rc; |
1109 | ||
d334a491 HY |
1110 | if (acpi_disabled) |
1111 | return -ENODEV; | |
1112 | ||
1113 | if (hest_disable) { | |
1114 | pr_info(GHES_PFX "HEST is not enabled!\n"); | |
1115 | return -EINVAL; | |
1116 | } | |
1117 | ||
b6a95016 HY |
1118 | if (ghes_disable) { |
1119 | pr_info(GHES_PFX "GHES is not enabled!\n"); | |
1120 | return -EINVAL; | |
1121 | } | |
1122 | ||
44a69f61 | 1123 | ghes_nmi_init_cxt(); |
67eb2e99 | 1124 | |
81e88fdc HY |
1125 | rc = ghes_ioremap_init(); |
1126 | if (rc) | |
1127 | goto err; | |
1128 | ||
67eb2e99 | 1129 | rc = ghes_estatus_pool_init(); |
81e88fdc HY |
1130 | if (rc) |
1131 | goto err_ioremap_exit; | |
1132 | ||
152cef40 HY |
1133 | rc = ghes_estatus_pool_expand(GHES_ESTATUS_CACHE_AVG_SIZE * |
1134 | GHES_ESTATUS_CACHE_ALLOCED_MAX); | |
1135 | if (rc) | |
1136 | goto err_pool_exit; | |
1137 | ||
67eb2e99 HY |
1138 | rc = platform_driver_register(&ghes_platform_driver); |
1139 | if (rc) | |
1140 | goto err_pool_exit; | |
1141 | ||
9fb0bfe1 HY |
1142 | rc = apei_osc_setup(); |
1143 | if (rc == 0 && osc_sb_apei_support_acked) | |
1144 | pr_info(GHES_PFX "APEI firmware first mode is enabled by APEI bit and WHEA _OSC.\n"); | |
1145 | else if (rc == 0 && !osc_sb_apei_support_acked) | |
1146 | pr_info(GHES_PFX "APEI firmware first mode is enabled by WHEA _OSC.\n"); | |
1147 | else if (rc && osc_sb_apei_support_acked) | |
1148 | pr_info(GHES_PFX "APEI firmware first mode is enabled by APEI bit.\n"); | |
1149 | else | |
1150 | pr_info(GHES_PFX "Failed to enable APEI firmware first mode.\n"); | |
1151 | ||
81e88fdc | 1152 | return 0; |
67eb2e99 HY |
1153 | err_pool_exit: |
1154 | ghes_estatus_pool_exit(); | |
81e88fdc HY |
1155 | err_ioremap_exit: |
1156 | ghes_ioremap_exit(); | |
1157 | err: | |
1158 | return rc; | |
d334a491 HY |
1159 | } |
1160 | ||
1161 | static void __exit ghes_exit(void) | |
1162 | { | |
7ad6e943 | 1163 | platform_driver_unregister(&ghes_platform_driver); |
67eb2e99 | 1164 | ghes_estatus_pool_exit(); |
81e88fdc | 1165 | ghes_ioremap_exit(); |
d334a491 HY |
1166 | } |
1167 | ||
1168 | module_init(ghes_init); | |
1169 | module_exit(ghes_exit); | |
1170 | ||
1171 | MODULE_AUTHOR("Huang Ying"); | |
1172 | MODULE_DESCRIPTION("APEI Generic Hardware Error Source support"); | |
1173 | MODULE_LICENSE("GPL"); | |
7ad6e943 | 1174 | MODULE_ALIAS("platform:GHES"); |