]> git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blame - drivers/acpi/nfit/mce.c
Merge branch 'timers-urgent-for-linus' of git://git.kernel.org/pub/scm/linux/kernel...
[mirror_ubuntu-jammy-kernel.git] / drivers / acpi / nfit / mce.c
CommitLineData
5b497af4 1// SPDX-License-Identifier: GPL-2.0-only
6839a6d9
VV
2/*
3 * NFIT - Machine Check Handler
4 *
5 * Copyright(c) 2013-2016 Intel Corporation. All rights reserved.
6839a6d9
VV
6 */
7#include <linux/notifier.h>
8#include <linux/acpi.h>
9ffd6350 9#include <linux/nd.h>
6839a6d9
VV
10#include <asm/mce.h>
11#include "nfit.h"
12
13static int nfit_handle_mce(struct notifier_block *nb, unsigned long val,
14 void *data)
15{
16 struct mce *mce = (struct mce *)data;
17 struct acpi_nfit_desc *acpi_desc;
18 struct nfit_spa *nfit_spa;
19
5d96c934
VV
20 /* We only care about uncorrectable memory errors */
21 if (!mce_is_memory_error(mce) || mce_is_correctable(mce))
6839a6d9
VV
22 return NOTIFY_DONE;
23
e8a308e5
VV
24 /* Verify the address reported in the MCE is valid. */
25 if (!mce_usable_address(mce))
26 return NOTIFY_DONE;
27
6839a6d9
VV
28 /*
29 * mce->addr contains the physical addr accessed that caused the
30 * machine check. We need to walk through the list of NFITs, and see
31 * if any of them matches that address, and only then start a scrub.
32 */
33 mutex_lock(&acpi_desc_lock);
34 list_for_each_entry(acpi_desc, &acpi_descs, list) {
35 struct device *dev = acpi_desc->dev;
36 int found_match = 0;
37
38 mutex_lock(&acpi_desc->init_mutex);
39 list_for_each_entry(nfit_spa, &acpi_desc->spas, list) {
40 struct acpi_nfit_system_address *spa = nfit_spa->spa;
41
2e21807d 42 if (nfit_spa_type(spa) != NFIT_SPA_PM)
6839a6d9
VV
43 continue;
44 /* find the spa that covers the mce addr */
45 if (spa->address > mce->addr)
46 continue;
47 if ((spa->address + spa->length - 1) < mce->addr)
48 continue;
49 found_match = 1;
b814735f
JT
50 dev_dbg(dev, "addr in SPA %d (0x%llx, 0x%llx)\n",
51 spa->range_index, spa->address, spa->length);
6839a6d9
VV
52 /*
53 * We can break at the first match because we're going
54 * to rescan all the SPA ranges. There shouldn't be any
55 * aliasing anyway.
56 */
57 break;
58 }
59 mutex_unlock(&acpi_desc->init_mutex);
60
9ffd6350
VV
61 if (!found_match)
62 continue;
63
64 /* If this fails due to an -ENOMEM, there is little we can do */
aa9ad44a 65 nvdimm_bus_add_badrange(acpi_desc->nvdimm_bus,
9ffd6350
VV
66 ALIGN(mce->addr, L1_CACHE_BYTES),
67 L1_CACHE_BYTES);
68 nvdimm_region_notify(nfit_spa->nd_region,
69 NVDIMM_REVALIDATE_POISON);
70
71 if (acpi_desc->scrub_mode == HW_ERROR_SCRUB_ON) {
72 /*
73 * We can ignore an -EBUSY here because if an ARS is
74 * already in progress, just let that be the last
75 * authoritative one
76 */
80790039 77 acpi_nfit_ars_rescan(acpi_desc, 0);
9ffd6350
VV
78 }
79 break;
6839a6d9
VV
80 }
81
82 mutex_unlock(&acpi_desc_lock);
83 return NOTIFY_DONE;
84}
85
86static struct notifier_block nfit_mce_dec = {
87 .notifier_call = nfit_handle_mce,
9026cc82 88 .priority = MCE_PRIO_NFIT,
6839a6d9
VV
89};
90
91void nfit_mce_register(void)
92{
93 mce_register_decode_chain(&nfit_mce_dec);
94}
95
96void nfit_mce_unregister(void)
97{
98 mce_unregister_decode_chain(&nfit_mce_dec);
99}