3f3174996b
AMD Zen-based systems report memory errors through Machine Check banks representing Unified Memory Controllers (UMCs). The address value reported for DRAM ECC errors is a "normalized address" that is relative to the UMC. This normalized address must be converted to a system physical address to be usable by the OS. Support for this address translation was introduced to the MCA subsystem with Zen1 systems. The code was later moved to the AMD64 EDAC module, since this was the only user of the code at the time. However, there are uses for this translation outside of EDAC. The system physical address can be used in MCA for preemptive page offlining as done in some MCA notifier functions. Also, this translation is needed as the basis of similar functionality needed for some CXL configurations on AMD systems. Introduce a common address translation library that can be used for multiple subsystems including MCA, EDAC, and CXL. Include support for UMC normalized address to system physical address translation for current CPU systems. The Data Fabric Indirect register access offsets and one of the register fields were changed. Default to the current offsets and register field definition. And fall back to the older values if running on a "legacy" system. Provide built-in code to facilitate the loading and unloading of the library module without affecting other modules or built-in code. Signed-off-by: Yazen Ghannam <yazen.ghannam@amd.com> Signed-off-by: Borislav Petkov (AMD) <bp@alien8.de> Link: https://lore.kernel.org/r/20240123041401.79812-2-yazen.ghannam@amd.com
87 lines
2.0 KiB
C
87 lines
2.0 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
/*
|
|
* Copyright (C) 2014 Intel Corporation
|
|
*
|
|
* Authors:
|
|
* Chen, Gong <gong.chen@linux.intel.com>
|
|
*/
|
|
|
|
#include <linux/init.h>
|
|
#include <linux/ras.h>
|
|
#include <linux/uuid.h>
|
|
|
|
#if IS_ENABLED(CONFIG_AMD_ATL)
|
|
/*
 * Decoder hook installed by the address translation library module.
 *
 * The pointer starts out NULL and is filled in through
 * amd_atl_register_decoder() when the library module loads successfully.
 * Once it has been set it should never be cleared again: the module should
 * not be unloaded except for testing and debug purposes.
 */
static unsigned long (*amd_atl_umc_na_to_spa)(struct atl_err *);
|
|
|
|
void amd_atl_register_decoder(unsigned long (*f)(struct atl_err *))
|
|
{
|
|
amd_atl_umc_na_to_spa = f;
|
|
}
|
|
EXPORT_SYMBOL_GPL(amd_atl_register_decoder);
|
|
|
|
void amd_atl_unregister_decoder(void)
|
|
{
|
|
amd_atl_umc_na_to_spa = NULL;
|
|
}
|
|
EXPORT_SYMBOL_GPL(amd_atl_unregister_decoder);
|
|
|
|
unsigned long amd_convert_umc_mca_addr_to_sys_addr(struct atl_err *err)
|
|
{
|
|
if (!amd_atl_umc_na_to_spa)
|
|
return -EINVAL;
|
|
|
|
return amd_atl_umc_na_to_spa(err);
|
|
}
|
|
EXPORT_SYMBOL_GPL(amd_convert_umc_mca_addr_to_sys_addr);
|
|
#endif /* CONFIG_AMD_ATL */
|
|
|
|
#define CREATE_TRACE_POINTS
|
|
#define TRACE_INCLUDE_PATH ../../include/ras
|
|
#include <ras/ras_event.h>
|
|
|
|
void log_non_standard_event(const guid_t *sec_type, const guid_t *fru_id,
|
|
const char *fru_text, const u8 sev, const u8 *err,
|
|
const u32 len)
|
|
{
|
|
trace_non_standard_event(sec_type, fru_id, fru_text, sev, err, len);
|
|
}
|
|
|
|
/*
 * Emit the arm_event tracepoint for @err.
 *
 * @err is forwarded unchanged to trace_arm_event().
 */
void log_arm_hw_error(struct cper_sec_proc_arm *err)
{
	trace_arm_event(err);
}
|
|
|
|
/*
 * RAS initialization, registered below as a subsys_initcall.
 *
 * Calls ras_debugfs_init() first, then ras_add_daemon_trace(). The return
 * value of ras_add_daemon_trace() is the return value of this function.
 */
static int __init ras_init(void)
{
	ras_debugfs_init();

	return ras_add_daemon_trace();
}
subsys_initcall(ras_init);
|
|
|
|
/*
 * Tracepoint symbols exported (GPL-only) from this file.
 *
 * extlog_mem_event is exported only when CONFIG_ACPI_EXTLOG is enabled,
 * either built-in or as a module; the remaining three are always exported.
 */
#if defined(CONFIG_ACPI_EXTLOG) || defined(CONFIG_ACPI_EXTLOG_MODULE)
EXPORT_TRACEPOINT_SYMBOL_GPL(extlog_mem_event);
#endif
EXPORT_TRACEPOINT_SYMBOL_GPL(mc_event);
EXPORT_TRACEPOINT_SYMBOL_GPL(non_standard_event);
EXPORT_TRACEPOINT_SYMBOL_GPL(arm_event);
|
|
|
|
static int __init parse_ras_param(char *str)
|
|
{
|
|
#ifdef CONFIG_RAS_CEC
|
|
parse_cec_param(str);
|
|
#endif
|
|
|
|
return 1;
|
|
}
|
|
__setup("ras", parse_ras_param);
|