xref: /kernel/linux/linux-6.6/drivers/acpi/apei/hest.c (revision 62306a36)
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * APEI Hardware Error Source Table support
4 *
5 * HEST describes error sources in detail; communicates operational
6 * parameters (i.e. severity levels, masking bits, and threshold
7 * values) to Linux as necessary. It also allows the BIOS to report
8 * non-standard error sources to Linux (for example, chipset-specific
9 * error registers).
10 *
11 * For more information about HEST, please refer to ACPI Specification
12 * version 4.0, section 17.3.2.
13 *
14 * Copyright 2009 Intel Corp.
15 *   Author: Huang Ying <ying.huang@intel.com>
16 */
17
18#include <linux/kernel.h>
19#include <linux/module.h>
20#include <linux/init.h>
21#include <linux/acpi.h>
22#include <linux/kdebug.h>
23#include <linux/highmem.h>
24#include <linux/io.h>
25#include <linux/platform_device.h>
26#include <acpi/apei.h>
27#include <acpi/ghes.h>
28
29#include "apei-internal.h"
30
31#define HEST_PFX "HEST: "
32
33int hest_disable;
34EXPORT_SYMBOL_GPL(hest_disable);
35
36/* HEST table parsing */
37
38static struct acpi_table_hest *__read_mostly hest_tab;
39
40static const int hest_esrc_len_tab[ACPI_HEST_TYPE_RESERVED] = {
41	[ACPI_HEST_TYPE_IA32_CHECK] = -1,	/* need further calculation */
42	[ACPI_HEST_TYPE_IA32_CORRECTED_CHECK] = -1,
43	[ACPI_HEST_TYPE_IA32_NMI] = sizeof(struct acpi_hest_ia_nmi),
44	[ACPI_HEST_TYPE_AER_ROOT_PORT] = sizeof(struct acpi_hest_aer_root),
45	[ACPI_HEST_TYPE_AER_ENDPOINT] = sizeof(struct acpi_hest_aer),
46	[ACPI_HEST_TYPE_AER_BRIDGE] = sizeof(struct acpi_hest_aer_bridge),
47	[ACPI_HEST_TYPE_GENERIC_ERROR] = sizeof(struct acpi_hest_generic),
48	[ACPI_HEST_TYPE_GENERIC_ERROR_V2] = sizeof(struct acpi_hest_generic_v2),
49	[ACPI_HEST_TYPE_IA32_DEFERRED_CHECK] = -1,
50};
51
52static inline bool is_generic_error(struct acpi_hest_header *hest_hdr)
53{
54	return hest_hdr->type == ACPI_HEST_TYPE_GENERIC_ERROR ||
55	       hest_hdr->type == ACPI_HEST_TYPE_GENERIC_ERROR_V2;
56}
57
58static int hest_esrc_len(struct acpi_hest_header *hest_hdr)
59{
60	u16 hest_type = hest_hdr->type;
61	int len;
62
63	if (hest_type >= ACPI_HEST_TYPE_RESERVED)
64		return 0;
65
66	len = hest_esrc_len_tab[hest_type];
67
68	if (hest_type == ACPI_HEST_TYPE_IA32_CORRECTED_CHECK) {
69		struct acpi_hest_ia_corrected *cmc;
70		cmc = (struct acpi_hest_ia_corrected *)hest_hdr;
71		len = sizeof(*cmc) + cmc->num_hardware_banks *
72			sizeof(struct acpi_hest_ia_error_bank);
73	} else if (hest_type == ACPI_HEST_TYPE_IA32_CHECK) {
74		struct acpi_hest_ia_machine_check *mc;
75		mc = (struct acpi_hest_ia_machine_check *)hest_hdr;
76		len = sizeof(*mc) + mc->num_hardware_banks *
77			sizeof(struct acpi_hest_ia_error_bank);
78	} else if (hest_type == ACPI_HEST_TYPE_IA32_DEFERRED_CHECK) {
79		struct acpi_hest_ia_deferred_check *mc;
80		mc = (struct acpi_hest_ia_deferred_check *)hest_hdr;
81		len = sizeof(*mc) + mc->num_hardware_banks *
82			sizeof(struct acpi_hest_ia_error_bank);
83	}
84	BUG_ON(len == -1);
85
86	return len;
87};
88
89typedef int (*apei_hest_func_t)(struct acpi_hest_header *hest_hdr, void *data);
90
91static int apei_hest_parse(apei_hest_func_t func, void *data)
92{
93	struct acpi_hest_header *hest_hdr;
94	int i, rc, len;
95
96	if (hest_disable || !hest_tab)
97		return -EINVAL;
98
99	hest_hdr = (struct acpi_hest_header *)(hest_tab + 1);
100	for (i = 0; i < hest_tab->error_source_count; i++) {
101		len = hest_esrc_len(hest_hdr);
102		if (!len) {
103			pr_warn(FW_WARN HEST_PFX
104				"Unknown or unused hardware error source "
105				"type: %d for hardware error source: %d.\n",
106				hest_hdr->type, hest_hdr->source_id);
107			return -EINVAL;
108		}
109		if ((void *)hest_hdr + len >
110		    (void *)hest_tab + hest_tab->header.length) {
111			pr_warn(FW_BUG HEST_PFX
112		"Table contents overflow for hardware error source: %d.\n",
113				hest_hdr->source_id);
114			return -EINVAL;
115		}
116
117		rc = func(hest_hdr, data);
118		if (rc)
119			return rc;
120
121		hest_hdr = (void *)hest_hdr + len;
122	}
123
124	return 0;
125}
126
127/*
128 * Check if firmware advertises firmware first mode. We need FF bit to be set
129 * along with a set of MC banks which work in FF mode.
130 */
131static int __init hest_parse_cmc(struct acpi_hest_header *hest_hdr, void *data)
132{
133	if (hest_hdr->type != ACPI_HEST_TYPE_IA32_CORRECTED_CHECK)
134		return 0;
135
136	if (!acpi_disable_cmcff)
137		return !arch_apei_enable_cmcff(hest_hdr, data);
138
139	return 0;
140}
141
/**
 * struct ghes_arr - GHES platform devices registered so far
 * @ghes_devs: array of device pointers, filled from index 0 upwards
 * @count: number of valid entries in @ghes_devs
 */
struct ghes_arr {
	struct platform_device **ghes_devs;
	unsigned int count;
};
146
147static int __init hest_parse_ghes_count(struct acpi_hest_header *hest_hdr, void *data)
148{
149	int *count = data;
150
151	if (is_generic_error(hest_hdr))
152		(*count)++;
153	return 0;
154}
155
156static int __init hest_parse_ghes(struct acpi_hest_header *hest_hdr, void *data)
157{
158	struct platform_device *ghes_dev;
159	struct ghes_arr *ghes_arr = data;
160	int rc, i;
161
162	if (!is_generic_error(hest_hdr))
163		return 0;
164
165	if (!((struct acpi_hest_generic *)hest_hdr)->enabled)
166		return 0;
167	for (i = 0; i < ghes_arr->count; i++) {
168		struct acpi_hest_header *hdr;
169		ghes_dev = ghes_arr->ghes_devs[i];
170		hdr = *(struct acpi_hest_header **)ghes_dev->dev.platform_data;
171		if (hdr->source_id == hest_hdr->source_id) {
172			pr_warn(FW_WARN HEST_PFX "Duplicated hardware error source ID: %d.\n",
173				hdr->source_id);
174			return -EIO;
175		}
176	}
177	ghes_dev = platform_device_alloc("GHES", hest_hdr->source_id);
178	if (!ghes_dev)
179		return -ENOMEM;
180
181	rc = platform_device_add_data(ghes_dev, &hest_hdr, sizeof(void *));
182	if (rc)
183		goto err;
184
185	rc = platform_device_add(ghes_dev);
186	if (rc)
187		goto err;
188	ghes_arr->ghes_devs[ghes_arr->count++] = ghes_dev;
189
190	return 0;
191err:
192	platform_device_put(ghes_dev);
193	return rc;
194}
195
196static int __init hest_ghes_dev_register(unsigned int ghes_count)
197{
198	int rc, i;
199	struct ghes_arr ghes_arr;
200
201	ghes_arr.count = 0;
202	ghes_arr.ghes_devs = kmalloc_array(ghes_count, sizeof(void *),
203					   GFP_KERNEL);
204	if (!ghes_arr.ghes_devs)
205		return -ENOMEM;
206
207	rc = apei_hest_parse(hest_parse_ghes, &ghes_arr);
208	if (rc)
209		goto err;
210
211	rc = ghes_estatus_pool_init(ghes_count);
212	if (rc)
213		goto err;
214
215out:
216	kfree(ghes_arr.ghes_devs);
217	return rc;
218err:
219	for (i = 0; i < ghes_arr.count; i++)
220		platform_device_unregister(ghes_arr.ghes_devs[i]);
221	goto out;
222}
223
224static int __init setup_hest_disable(char *str)
225{
226	hest_disable = HEST_DISABLED;
227	return 1;
228}
229
230__setup("hest_disable", setup_hest_disable);
231
232void __init acpi_hest_init(void)
233{
234	acpi_status status;
235	int rc;
236	unsigned int ghes_count = 0;
237
238	if (hest_disable) {
239		pr_info(HEST_PFX "Table parsing disabled.\n");
240		return;
241	}
242
243	status = acpi_get_table(ACPI_SIG_HEST, 0,
244				(struct acpi_table_header **)&hest_tab);
245	if (status == AE_NOT_FOUND) {
246		hest_disable = HEST_NOT_FOUND;
247		return;
248	} else if (ACPI_FAILURE(status)) {
249		const char *msg = acpi_format_exception(status);
250		pr_err(HEST_PFX "Failed to get table, %s\n", msg);
251		hest_disable = HEST_DISABLED;
252		return;
253	}
254
255	rc = apei_hest_parse(hest_parse_cmc, NULL);
256	if (rc)
257		goto err;
258
259	if (!ghes_disable) {
260		rc = apei_hest_parse(hest_parse_ghes_count, &ghes_count);
261		if (rc)
262			goto err;
263
264		if (ghes_count)
265			rc = hest_ghes_dev_register(ghes_count);
266		if (rc)
267			goto err;
268	}
269
270	pr_info(HEST_PFX "Table parsing has been initialized.\n");
271	return;
272err:
273	hest_disable = HEST_DISABLED;
274	acpi_put_table((struct acpi_table_header *)hest_tab);
275}
276