mirror of
https://github.com/AuxXxilium/linux_dsm_epyc7002.git
synced 2024-12-27 04:45:23 +07:00
a3e2acc5e3
ACPI/APEI is designed to verify/report H/W errors, like Corrected Error(CE) and Uncorrected Error(UC). It contains four tables: HEST, ERST, EINJ and BERT. The first three tables have been merged for a long time, but because of the lack of BIOS support for BERT, the support for BERT has been pending until now. Recently it has been supported on the ARM 64 platform. So here we come. Under normal circumstances, when a hardware error occurs, the kernel will be notified via NMI, MCE or some other method, then the kernel will process the error condition, report it, and recover from it if possible. But sometimes the situation is so bad that firmware may choose to reset directly without notifying the Linux kernel. The Linux kernel can use the Boot Error Record Table (BERT) to get the un-notified hardware errors that occurred in a previous boot. In this patch, the error information is reported via printk. For more information about BERT, please refer to ACPI Specification version 6.0, section 18.3.1: http://www.uefi.org/sites/default/files/resources/ACPI_6.0.pdf The following log is a BERT record after system reboot because of hitting a fatal memory error: BERT: Error records from previous boot: [Hardware Error]: It has been corrected by h/w and requires no further action [Hardware Error]: event severity: corrected [Hardware Error]: Error 0, type: recoverable [Hardware Error]: section_type: memory error [Hardware Error]: error_status: 0x0000000000000400 [Hardware Error]: physical_address: 0xffffffffffffffff [Hardware Error]: card: 1 module: 2 bank: 3 row: 1 column: 2 bit_position: 5 [Hardware Error]: error_type: 2, single-bit ECC [Tomasz Nowicki: Clear error status at the end of error handling] [Tony: Applied some cleanups suggested by Fu Wei] [Fu Wei: delete EXPORT_SYMBOL_GPL(bert_disable), improve the code] Signed-off-by: Huang Ying <ying.huang@intel.com> Signed-off-by: Tomasz Nowicki <tomasz.nowicki@linaro.org> Signed-off-by: Chen, Gong <gong.chen@linux.intel.com> Tested-by: Jonathan (Zhixiong) 
Zhang <zjzhang@codeaurora.org> Signed-off-by: Fu Wei <fu.wei@linaro.org> Tested-by: Tyler Baicar <tbaicar@codeaurora.org> Reviewed-by: Borislav Petkov <bp@suse.de> Signed-off-by: Tony Luck <tony.luck@intel.com> Signed-off-by: Rafael J. Wysocki <rafael.j.wysocki@intel.com>
144 lines
4.1 KiB
C
144 lines
4.1 KiB
C
/*
|
|
* apei-internal.h - ACPI Platform Error Interface internal
|
|
* definitions.
|
|
*/
|
|
|
|
#ifndef APEI_INTERNAL_H
|
|
#define APEI_INTERNAL_H
|
|
|
|
#include <linux/cper.h>
|
|
#include <linux/acpi.h>
|
|
|
|
/* Forward declaration: the handler type below only needs a pointer to it. */
struct apei_exec_context;

/*
 * Signature of an instruction handler: it is given the execution context
 * and the action-table entry to operate on, and returns an int.
 */
typedef int (*apei_exec_ins_func_t)(struct apei_exec_context *ctx,
				    struct acpi_whea_header *entry);
|
|
|
|
/*
 * Flag bit 0x0001. NOTE(review): presumably stored in
 * apei_exec_ins_type.flags to mark instructions that access a register;
 * confirm against the users of this header.
 */
#define APEI_EXEC_INS_ACCESS_REGISTER 0x0001
|
|
|
|
struct apei_exec_ins_type {
|
|
u32 flags;
|
|
apei_exec_ins_func_t run;
|
|
};
|
|
|
|
struct apei_exec_context {
|
|
u32 ip;
|
|
u64 value;
|
|
u64 var1;
|
|
u64 var2;
|
|
u64 src_base;
|
|
u64 dst_base;
|
|
struct apei_exec_ins_type *ins_table;
|
|
u32 instructions;
|
|
struct acpi_whea_header *action_table;
|
|
u32 entries;
|
|
};
|
|
|
|
void apei_exec_ctx_init(struct apei_exec_context *ctx,
|
|
struct apei_exec_ins_type *ins_table,
|
|
u32 instructions,
|
|
struct acpi_whea_header *action_table,
|
|
u32 entries);
|
|
|
|
static inline void apei_exec_ctx_set_input(struct apei_exec_context *ctx,
|
|
u64 input)
|
|
{
|
|
ctx->value = input;
|
|
}
|
|
|
|
static inline u64 apei_exec_ctx_get_output(struct apei_exec_context *ctx)
|
|
{
|
|
return ctx->value;
|
|
}
|
|
|
|
/*
 * Run @action in @ctx. The wrappers in this header, apei_exec_run() and
 * apei_exec_run_optional(), differ only in the @optional value they pass;
 * per the comment on the latter, it is optional whether the firmware
 * provides the action. Implementation is not visible in this header.
 */
int __apei_exec_run(struct apei_exec_context *ctx, u8 action, bool optional);
|
|
|
|
/*
 * Run @action in @ctx, treating the action as not optional.
 *
 * Returns whatever __apei_exec_run() returns.
 */
static inline int apei_exec_run(struct apei_exec_context *ctx, u8 action)
{
	/* The third parameter is a bool; spell it as one. */
	return __apei_exec_run(ctx, action, false);
}
|
|
|
|
/* It is optional whether the firmware provides the action */
|
|
static inline int apei_exec_run_optional(struct apei_exec_context *ctx, u8 action)
|
|
{
|
|
return __apei_exec_run(ctx, action, 1);
|
|
}
|
|
|
|
/* Common instruction implementation */
|
|
|
|
/*
 * Indicates that the instruction function has already set the IP itself.
 * NOTE(review): presumably a handler return value checked by the
 * interpreter loop - confirm against the implementation.
 */
#define APEI_EXEC_SET_IP	1
|
|
|
|
/*
 * Map the generic address @reg; returns an int. The matching unmap helper
 * in this header is apei_unmap_generic_address(). Implementation is not
 * visible in this header.
 */
int apei_map_generic_address(struct acpi_generic_address *reg);
|
|
|
|
/* Thin wrapper: hands @reg straight to acpi_os_unmap_generic_address(). */
static inline void
apei_unmap_generic_address(struct acpi_generic_address *reg)
{
	acpi_os_unmap_generic_address(reg);
}
|
|
|
|
/*
 * Read from / write to the generic address @reg. apei_read() delivers the
 * result through @val; apei_write() takes the value to write in @val.
 * Both return an int; the implementations are not visible in this header.
 */
int apei_read(u64 *val, struct acpi_generic_address *reg);
int apei_write(u64 val, struct acpi_generic_address *reg);
|
|
|
|
/*
 * Register access for an action-table @entry without an execution context:
 * the read variant delivers its result through @val, the write variant
 * takes the value in @val. Implementations are not visible in this header.
 */
int __apei_exec_read_register(struct acpi_whea_header *entry, u64 *val);
int __apei_exec_write_register(struct acpi_whea_header *entry, u64 val);
|
|
/*
 * Common instruction functions. Each one has the apei_exec_ins_func_t
 * signature (context, action-table entry) -> int, so it can be placed in
 * an instruction table. Implementations are not visible in this header.
 */
int apei_exec_read_register(struct apei_exec_context *ctx,
			    struct acpi_whea_header *entry);
int apei_exec_read_register_value(struct apei_exec_context *ctx,
				  struct acpi_whea_header *entry);
int apei_exec_write_register(struct apei_exec_context *ctx,
			     struct acpi_whea_header *entry);
int apei_exec_write_register_value(struct apei_exec_context *ctx,
				   struct acpi_whea_header *entry);
int apei_exec_noop(struct apei_exec_context *ctx,
		   struct acpi_whea_header *entry);
|
|
/*
 * Context-wide map / unmap helpers; both return an int.
 * NOTE(review): going by the names, these presumably map and unmap the
 * generic address registers referenced by the context's action table -
 * confirm against the implementation.
 */
int apei_exec_pre_map_gars(struct apei_exec_context *ctx);
int apei_exec_post_unmap_gars(struct apei_exec_context *ctx);
|
|
|
|
struct apei_resources {
|
|
struct list_head iomem;
|
|
struct list_head ioport;
|
|
};
|
|
|
|
static inline void apei_resources_init(struct apei_resources *resources)
|
|
{
|
|
INIT_LIST_HEAD(&resources->iomem);
|
|
INIT_LIST_HEAD(&resources->ioport);
|
|
}
|
|
|
|
void apei_resources_fini(struct apei_resources *resources);
|
|
int apei_resources_add(struct apei_resources *resources,
|
|
unsigned long start, unsigned long size,
|
|
bool iomem);
|
|
int apei_resources_sub(struct apei_resources *resources1,
|
|
struct apei_resources *resources2);
|
|
int apei_resources_request(struct apei_resources *resources,
|
|
const char *desc);
|
|
void apei_resources_release(struct apei_resources *resources);
|
|
int apei_exec_collect_resources(struct apei_exec_context *ctx,
|
|
struct apei_resources *resources);
|
|
|
|
/* Only a pointer is needed here, so a forward declaration is enough. */
struct dentry;

/* Returns a dentry pointer for the APEI debugfs directory. */
struct dentry *apei_get_debugfs_dir(void);
|
|
|
|
/*
 * Iterate over the generic data sections that follow a generic error
 * status block.
 *
 * @estatus: pointer to the struct acpi_hest_generic_status header
 * @section: struct acpi_hest_generic_data * used as the loop cursor
 *
 * The first section starts right after the status header. data_length
 * counts only the bytes that follow the header (cper_estatus_len() adds
 * sizeof(*estatus) to it to get the block size), so the cursor's offset is
 * measured from (estatus + 1), not from estatus itself. Each step skips
 * the section header plus its error_data_length bytes of payload.
 *
 * Both arguments are evaluated more than once; pass plain variables.
 */
#define apei_estatus_for_each_section(estatus, section)			\
	for ((section) = (struct acpi_hest_generic_data *)((estatus) + 1); \
	     (void *)(section) - (void *)((estatus) + 1) <		\
		     (estatus)->data_length;				\
	     (section) = (void *)((section) + 1) +			\
			 (section)->error_data_length)
|
|
|
|
static inline u32 cper_estatus_len(struct acpi_hest_generic_status *estatus)
|
|
{
|
|
if (estatus->raw_data_length)
|
|
return estatus->raw_data_offset + \
|
|
estatus->raw_data_length;
|
|
else
|
|
return sizeof(*estatus) + estatus->data_length;
|
|
}
|
|
|
|
/*
 * Helpers for a generic error status block; none of them modifies @estatus
 * (it is const-qualified). Implementations are not visible in this header.
 *
 * cper_estatus_print()        - print the block, using the prefix @pfx.
 * cper_estatus_check_header() - check the block header; returns an int.
 * cper_estatus_check()        - check the block; returns an int.
 */
void cper_estatus_print(const char *pfx,
			const struct acpi_hest_generic_status *estatus);
int cper_estatus_check_header(const struct acpi_hest_generic_status *estatus);
int cper_estatus_check(const struct acpi_hest_generic_status *estatus);
|
|
|
|
/*
 * Takes no arguments and returns an int; the implementation is not visible
 * in this header. NOTE(review): presumably performs the ACPI _OSC
 * negotiation for APEI - confirm against the definition.
 */
int apei_osc_setup(void);
|
|
#endif
|