1 // SPDX-License-Identifier: GPL-2.0-only
3 * APEI Hardware Error Source Table support
5 * HEST describes error sources in detail; communicates operational
6 * parameters (i.e. severity levels, masking bits, and threshold
7 * values) to Linux as necessary. It also allows the BIOS to report
8 * non-standard error sources to Linux (for example, chipset-specific
11 * For more information about HEST, please refer to ACPI Specification
12 * version 4.0, section 17.3.2.
14 * Copyright 2009 Intel Corp.
15 * Author: Huang Ying <ying.huang@intel.com>
18 #include <linux/kernel.h>
19 #include <linux/module.h>
20 #include <linux/init.h>
21 #include <linux/acpi.h>
22 #include <linux/kdebug.h>
23 #include <linux/highmem.h>
25 #include <linux/platform_device.h>
26 #include <acpi/apei.h>
27 #include <acpi/ghes.h>
29 #include "apei-internal.h"
/* Prefix used by the log messages in this file. */
31 #define HEST_PFX "HEST: "
/*
 * Export hest_disable to GPL modules. Within this file it is assigned
 * HEST_DISABLED or HEST_NOT_FOUND and is tested by apei_hest_parse()
 * before the table is walked.
 */
34 EXPORT_SYMBOL_GPL(hest_disable);
36 /* HEST table parsing */
/*
 * The HEST table itself: obtained with acpi_get_table() in acpi_hest_init()
 * and walked by apei_hest_parse().
 */
38 static struct acpi_table_hest *__read_mostly hest_tab;
41 * Since GHES_ASSIST is not supported, skip initialization of GHES_ASSIST
43 * During HEST parsing, detected MCA error sources are cached from early
44 * table entries so that the Flags and Source Id fields from these cached
45 * values are then referred to in later table entries to determine if the
46 * encountered GHES_ASSIST structure should be initialized.
/*
 * One pointer per machine-check error source structure type: corrected
 * machine check, machine check, and deferred machine check.
 * NOTE(review): presumably these are the members of the `mces` object that
 * is_ghes_assist_struct() reads as mces.cmc / mces.mc / mces.dmc; the
 * enclosing declaration is not visible here - confirm.
 */
49 struct acpi_hest_ia_corrected *cmc;
50 struct acpi_hest_ia_machine_check *mc;
51 struct acpi_hest_ia_deferred_check *dmc;
/*
 * Size of each hardware error source structure, indexed by HEST type.
 * The array has ACPI_HEST_TYPE_RESERVED slots. A value of -1 marks a type
 * whose size depends on its hardware bank count; hest_esrc_len() computes
 * the real length for those three IA-32 machine-check types.
 */
54 static const int hest_esrc_len_tab[ACPI_HEST_TYPE_RESERVED] = {
55 [ACPI_HEST_TYPE_IA32_CHECK] = -1, /* need further calculation */
56 [ACPI_HEST_TYPE_IA32_CORRECTED_CHECK] = -1,
57 [ACPI_HEST_TYPE_IA32_NMI] = sizeof(struct acpi_hest_ia_nmi),
58 [ACPI_HEST_TYPE_AER_ROOT_PORT] = sizeof(struct acpi_hest_aer_root),
59 [ACPI_HEST_TYPE_AER_ENDPOINT] = sizeof(struct acpi_hest_aer),
60 [ACPI_HEST_TYPE_AER_BRIDGE] = sizeof(struct acpi_hest_aer_bridge),
61 [ACPI_HEST_TYPE_GENERIC_ERROR] = sizeof(struct acpi_hest_generic),
62 [ACPI_HEST_TYPE_GENERIC_ERROR_V2] = sizeof(struct acpi_hest_generic_v2),
63 [ACPI_HEST_TYPE_IA32_DEFERRED_CHECK] = -1,
/*
 * Report whether an error source entry is a generic hardware error source,
 * i.e. its type is ACPI_HEST_TYPE_GENERIC_ERROR or
 * ACPI_HEST_TYPE_GENERIC_ERROR_V2.
 */
66 static inline bool is_generic_error(struct acpi_hest_header *hest_hdr)
68 return hest_hdr->type == ACPI_HEST_TYPE_GENERIC_ERROR ||
69 hest_hdr->type == ACPI_HEST_TYPE_GENERIC_ERROR_V2;
/*
 * Determine the size of one hardware error source structure.
 *
 * hest_hdr: header of the error source entry to measure.
 *
 * The entry type is first checked against ACPI_HEST_TYPE_RESERVED, then the
 * base length is looked up in hest_esrc_len_tab. For the three IA-32
 * machine-check types (corrected, machine check, deferred) the length is
 * recomputed as the fixed structure size plus one
 * struct acpi_hest_ia_error_bank per hardware bank reported by the entry.
 *
 * NOTE(review): what is returned for an out-of-range type, and the final
 * return statement, are not visible in this copy - confirm against the
 * complete source.
 */
72 static int hest_esrc_len(struct acpi_hest_header *hest_hdr)
74 u16 hest_type = hest_hdr->type;
/* Types at or beyond the reserved marker would index past hest_esrc_len_tab. */
77 if (hest_type >= ACPI_HEST_TYPE_RESERVED)
80 len = hest_esrc_len_tab[hest_type];
/* Variable-length entries: fixed part plus num_hardware_banks bank records. */
82 if (hest_type == ACPI_HEST_TYPE_IA32_CORRECTED_CHECK) {
83 struct acpi_hest_ia_corrected *cmc;
84 cmc = (struct acpi_hest_ia_corrected *)hest_hdr;
85 len = sizeof(*cmc) + cmc->num_hardware_banks *
86 sizeof(struct acpi_hest_ia_error_bank);
88 } else if (hest_type == ACPI_HEST_TYPE_IA32_CHECK) {
89 struct acpi_hest_ia_machine_check *mc;
90 mc = (struct acpi_hest_ia_machine_check *)hest_hdr;
91 len = sizeof(*mc) + mc->num_hardware_banks *
92 sizeof(struct acpi_hest_ia_error_bank);
94 } else if (hest_type == ACPI_HEST_TYPE_IA32_DEFERRED_CHECK) {
95 struct acpi_hest_ia_deferred_check *mc;
96 mc = (struct acpi_hest_ia_deferred_check *)hest_hdr;
97 len = sizeof(*mc) + mc->num_hardware_banks *
98 sizeof(struct acpi_hest_ia_error_bank);
107 * GHES and GHESv2 structures share the same format, starting from
108 * Source Id and ending in Error Status Block Length (inclusive).
/*
 * Test whether a generic error source entry points back at a machine-check
 * source that carries the ACPI_HEST_GHES_ASSIST flag.
 *
 * hest_hdr: header of the entry under inspection.
 *
 * Entries that are neither GHES nor GHESv2 are filtered by the type check.
 * For the rest, related_source_id is compared with header.source_id of each
 * machine-check structure recorded in mces (cmc, mc, dmc) that is non-NULL
 * and has ACPI_HEST_GHES_ASSIST set in its flags.
 *
 * NOTE(review): the value returned from each branch is not visible in this
 * copy - confirm against the complete source.
 */
110 static bool is_ghes_assist_struct(struct acpi_hest_header *hest_hdr)
112 struct acpi_hest_generic *ghes;
113 u16 related_source_id;
/* Only generic (GHES / GHESv2) entries are examined further. */
115 if (hest_hdr->type != ACPI_HEST_TYPE_GENERIC_ERROR &&
116 hest_hdr->type != ACPI_HEST_TYPE_GENERIC_ERROR_V2)
/* The entry is read through the GHES layout to fetch related_source_id. */
119 ghes = (struct acpi_hest_generic *)hest_hdr;
120 related_source_id = ghes->related_source_id;
/*
 * '&' binds tighter than '&&', so each test below reads as:
 * pointer set && (flags & ACPI_HEST_GHES_ASSIST) && source ids equal.
 */
122 if (mces.cmc && mces.cmc->flags & ACPI_HEST_GHES_ASSIST &&
123 related_source_id == mces.cmc->header.source_id)
125 if (mces.mc && mces.mc->flags & ACPI_HEST_GHES_ASSIST &&
126 related_source_id == mces.mc->header.source_id)
128 if (mces.dmc && mces.dmc->flags & ACPI_HEST_GHES_ASSIST &&
129 related_source_id == mces.dmc->header.source_id)
/*
 * Callback type taken by apei_hest_parse(): receives one error source entry
 * header plus the caller's opaque data pointer and returns an int status.
 */
135 typedef int (*apei_hest_func_t)(struct acpi_hest_header *hest_hdr, void *data);
/*
 * Walk the error source entries of the HEST table, passing each to func.
 *
 * func: callback invoked as func(entry header, data).
 * data: opaque pointer handed through to func unchanged.
 *
 * The walk starts immediately after the fixed table header (hest_tab + 1)
 * and iterates hest_tab->error_source_count times, advancing the cursor by
 * the length hest_esrc_len() reports for the current entry. An entry whose
 * end would lie beyond hest_tab->header.length triggers a firmware-bug
 * warning.
 *
 * NOTE(review): the early-exit value, the condition guarding the
 * "unknown or unused" warning, the handling of func's return code and the
 * final return are not visible in this copy - confirm against the complete
 * source.
 */
137 static int apei_hest_parse(apei_hest_func_t func, void *data)
139 struct acpi_hest_header *hest_hdr;
/* Nothing to walk when HEST is disabled or no table has been fetched. */
142 if (hest_disable || !hest_tab)
/* First entry sits directly behind the struct acpi_table_hest header. */
145 hest_hdr = (struct acpi_hest_header *)(hest_tab + 1);
146 for (i = 0; i < hest_tab->error_source_count; i++) {
147 len = hest_esrc_len(hest_hdr);
149 pr_warn(FW_WARN HEST_PFX
150 "Unknown or unused hardware error source "
151 "type: %d for hardware error source: %d.\n",
152 hest_hdr->type, hest_hdr->source_id);
/* Bounds check: the whole entry must fit inside the table's stated length. */
155 if ((void *)hest_hdr + len >
156 (void *)hest_tab + hest_tab->header.length) {
157 pr_warn(FW_BUG HEST_PFX
158 "Table contents overflow for hardware error source: %d.\n",
159 hest_hdr->source_id);
/*
 * For a GHES_ASSIST entry the cursor is advanced inside this branch.
 * NOTE(review): presumably the entry is then skipped without calling func;
 * the remainder of the branch is not shown - confirm.
 */
163 if (is_ghes_assist_struct(hest_hdr)) {
164 hest_hdr = (void *)hest_hdr + len;
168 rc = func(hest_hdr, data);
/* Step to the next entry. */
172 hest_hdr = (void *)hest_hdr + len;
179 * Check if firmware advertises firmware first mode. We need FF bit to be set
180 * along with a set of MC banks which work in FF mode.
/*
 * apei_hest_parse() callback (used by acpi_hest_init() with NULL data) that
 * handles corrected machine check entries.
 *
 * The entry type is compared against ACPI_HEST_TYPE_IA32_CORRECTED_CHECK.
 * Unless acpi_disable_cmcff is set, the result is the logical negation of
 * arch_apei_enable_cmcff(hest_hdr, data).
 *
 * NOTE(review): the values returned for other entry types and when
 * acpi_disable_cmcff is set are not visible in this copy - confirm.
 */
182 static int __init hest_parse_cmc(struct acpi_hest_header *hest_hdr, void *data)
184 if (hest_hdr->type != ACPI_HEST_TYPE_IA32_CORRECTED_CHECK)
187 if (!acpi_disable_cmcff)
188 return !arch_apei_enable_cmcff(hest_hdr, data);
/*
 * Array of platform device pointers, one per registered GHES device.
 * NOTE(review): presumably a member of struct ghes_arr (it is accessed as
 * ghes_arr->ghes_devs, alongside a count field, further down); the enclosing
 * struct declaration is not visible here - confirm.
 */
194 struct platform_device **ghes_devs;
/*
 * apei_hest_parse() callback that acpi_hest_init() runs with a pointer to
 * its ghes_count variable; each entry is tested with is_generic_error().
 *
 * NOTE(review): presumably the counter behind data is incremented for every
 * generic error source; the statement guarded by the test and the return
 * value are not visible in this copy - confirm.
 */
198 static int __init hest_parse_ghes_count(struct acpi_hest_header *hest_hdr, void *data)
202 if (is_generic_error(hest_hdr))
/*
 * apei_hest_parse() callback that creates a "GHES" platform device for a
 * generic hardware error source entry.
 *
 * hest_hdr: entry being visited.
 * data:     struct ghes_arr collecting the devices created so far.
 *
 * Entries that are not generic error sources, or whose enabled field is
 * zero, are filtered first. The entry's source_id is then compared with the
 * source_id of every device already stored in the array, and a duplicate is
 * reported with a firmware warning. Otherwise a platform device named
 * "GHES" with the source_id as its id is allocated, a copy of the entry
 * pointer is attached as platform data, the device is added and finally
 * appended to ghes_arr->ghes_devs.
 *
 * NOTE(review): return values, the checks on rc and the label leading to
 * platform_device_put() are not visible in this copy - confirm.
 */
207 static int __init hest_parse_ghes(struct acpi_hest_header *hest_hdr, void *data)
209 struct platform_device *ghes_dev;
210 struct ghes_arr *ghes_arr = data;
213 if (!is_generic_error(hest_hdr))
216 if (!((struct acpi_hest_generic *)hest_hdr)->enabled)
/* Look for an already registered device carrying the same source id. */
218 for (i = 0; i < ghes_arr->count; i++) {
219 struct acpi_hest_header *hdr;
220 ghes_dev = ghes_arr->ghes_devs[i];
/* platform_data holds a pointer to the entry header, hence the double deref. */
221 hdr = *(struct acpi_hest_header **)ghes_dev->dev.platform_data;
222 if (hdr->source_id == hest_hdr->source_id) {
223 pr_warn(FW_WARN HEST_PFX "Duplicated hardware error source ID: %d.\n",
228 ghes_dev = platform_device_alloc("GHES", hest_hdr->source_id);
/* The pointer value itself (sizeof(void *) bytes) is what gets copied. */
232 rc = platform_device_add_data(ghes_dev, &hest_hdr, sizeof(void *));
236 rc = platform_device_add(ghes_dev);
239 ghes_arr->ghes_devs[ghes_arr->count++] = ghes_dev;
/* NOTE(review): presumably the error path for a device that was not added. */
243 platform_device_put(ghes_dev);
/*
 * Register platform devices for the generic error sources in HEST.
 *
 * ghes_count: number of generic error sources; sizes the device array and
 *             is passed to ghes_estatus_pool_init().
 *
 * A temporary array of ghes_count pointers is allocated, filled by running
 * hest_parse_ghes over the table, and freed again with kfree(). The error
 * status pool is initialised with ghes_estatus_pool_init(ghes_count). The
 * closing loop unregisters every device recorded in the array.
 *
 * NOTE(review): presumably that loop is an error path reached through a
 * label; the labels, rc checks and return statements are not visible in
 * this copy - confirm.
 */
247 static int __init hest_ghes_dev_register(unsigned int ghes_count)
250 struct ghes_arr ghes_arr;
253 ghes_arr.ghes_devs = kmalloc_array(ghes_count, sizeof(void *),
255 if (!ghes_arr.ghes_devs)
258 rc = apei_hest_parse(hest_parse_ghes, &ghes_arr);
262 rc = ghes_estatus_pool_init(ghes_count);
/* Only the pointer array is freed here; the devices are separate objects. */
267 kfree(ghes_arr.ghes_devs);
270 for (i = 0; i < ghes_arr.count; i++)
271 platform_device_unregister(ghes_arr.ghes_devs[i]);
/*
 * Handler for the "hest_disable" kernel command-line option: sets
 * hest_disable to HEST_DISABLED. The option's string argument is not used
 * by the visible code.
 *
 * NOTE(review): the return value is not visible in this copy - confirm.
 */
275 static int __init setup_hest_disable(char *str)
277 hest_disable = HEST_DISABLED;
/* Bind the handler to the "hest_disable" boot parameter. */
281 __setup("hest_disable", setup_hest_disable);
/*
 * Boot-time entry point for HEST support.
 *
 * Fetches the HEST table with acpi_get_table() and records the outcome in
 * hest_disable: HEST_NOT_FOUND when the table is absent, HEST_DISABLED when
 * the lookup fails for any other reason (the formatted ACPI exception is
 * logged). The table is then walked with apei_hest_parse() using
 * hest_parse_cmc and hest_parse_ghes_count (accumulating into ghes_count),
 * and hest_ghes_dev_register(ghes_count) creates the GHES devices.
 *
 * NOTE(review): the conditions guarding the individual steps, the checks on
 * rc and the jumps to the failure tail are not visible in this copy -
 * confirm against the complete source.
 */
283 void __init acpi_hest_init(void)
287 unsigned int ghes_count = 0;
/* NOTE(review): presumably logged when hest_disable is already set - confirm. */
290 pr_info(HEST_PFX "Table parsing disabled.\n");
/* hest_tab receives the table pointer; instance 0 of signature ACPI_SIG_HEST. */
294 status = acpi_get_table(ACPI_SIG_HEST, 0,
295 (struct acpi_table_header **)&hest_tab);
296 if (status == AE_NOT_FOUND) {
297 hest_disable = HEST_NOT_FOUND;
299 } else if (ACPI_FAILURE(status)) {
300 const char *msg = acpi_format_exception(status);
301 pr_err(HEST_PFX "Failed to get table, %s\n", msg);
302 hest_disable = HEST_DISABLED;
306 rc = apei_hest_parse(hest_parse_cmc, NULL);
311 rc = apei_hest_parse(hest_parse_ghes_count, &ghes_count);
316 rc = hest_ghes_dev_register(ghes_count);
321 pr_info(HEST_PFX "Table parsing has been initialized.\n");
/*
 * NOTE(review): presumably the failure tail - mark HEST as disabled and hand
 * the table back with acpi_put_table(); the label is not shown - confirm.
 */
324 hest_disable = HEST_DISABLED;
325 acpi_put_table((struct acpi_table_header *)hest_tab);