[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <20250506213814.2365788-9-zaidal@os.amperecomputing.com>
Date: Tue, 6 May 2025 14:38:12 -0700
From: Zaid Alali <zaidal@...amperecomputing.com>
To: rafael@...nel.org,
lenb@...nel.org,
james.morse@....com,
tony.luck@...el.com,
bp@...en8.de,
robert.moore@...el.com,
Jonathan.Cameron@...wei.com,
ira.weiny@...el.com,
Benjamin.Cheatham@....com,
dan.j.williams@...el.com,
arnd@...db.de,
Avadhut.Naik@....com,
u.kleine-koenig@...gutronix.de,
john.allen@....com,
linux-acpi@...r.kernel.org,
linux-kernel@...r.kernel.org,
acpica-devel@...ts.linux.dev
Subject: [PATCH v7 8/9] ACPI: APEI: EINJ: Enable EINJv2 error injections
Enable the driver to inject EINJv2 error types. The component array
is parsed from user_input, which is expected to contain one component
per line. Each line holds the component ID and its syndrome as hex
values separated by a space, as follows:
component_id1 component_syndrome1
component_id2 component_syndrome2
:
component_id(n) component_syndrome(n)
for example:
$comp_arr="0x1 0x2
>0x1 0x4
>0x2 0x4"
$cd /sys/kernel/debug/apei/einj/
$echo "$comp_arr" > einjv2_component_array
Signed-off-by: Zaid Alali <zaidal@...amperecomputing.com>
---
drivers/acpi/apei/einj-core.c | 177 +++++++++++++++++++++++++++++++---
1 file changed, 166 insertions(+), 11 deletions(-)
diff --git a/drivers/acpi/apei/einj-core.c b/drivers/acpi/apei/einj-core.c
index 44f9166c3881..491d33529a3d 100644
--- a/drivers/acpi/apei/einj-core.c
+++ b/drivers/acpi/apei/einj-core.c
@@ -34,6 +34,7 @@
/* Firmware should respond within 1 seconds */
#define FIRMWARE_TIMEOUT (1 * USEC_PER_SEC)
#define COMP_ARR_SIZE 1024
+#define COMPONENT_LEN 16
#define ACPI65_EINJV2_SUPP BIT(30)
#define ACPI5_VENDOR_BIT BIT(31)
#define MEM_ERROR_MASK (ACPI_EINJ_MEMORY_CORRECTABLE | \
@@ -87,6 +88,14 @@ enum {
SETWA_FLAGS_APICID = 1,
SETWA_FLAGS_MEM = 2,
SETWA_FLAGS_PCIE_SBDF = 4,
+ SETWA_FLAGS_EINJV2 = 8,
+};
+
+enum {
+ EINJV2_PROCESSOR_ERROR = 0x1,
+ EINJV2_MEMORY_ERROR = 0x2,
+ EINJV2_PCIE_ERROR = 0x4,
+ EINJV2_VENDOR_ERROR = 0x80000000,
};
/*
@@ -110,6 +119,7 @@ static char vendor_dev[64];
static struct debugfs_blob_wrapper einjv2_component_arr;
static void *user_input;
+static int nr_components;
static u32 available_error_type;
static u32 available_error_type_v2;
@@ -180,6 +190,8 @@ static DEFINE_MUTEX(einj_mutex);
bool einj_initialized __ro_after_init;
static void __iomem *einj_param;
+static u32 v5param_size;
+static bool is_V2;
static void einj_exec_ctx_init(struct apei_exec_context *ctx)
{
@@ -304,11 +316,31 @@ static void __iomem *einj_get_parameter_address(void)
struct set_error_type_with_address v5param;
struct set_error_type_with_address __iomem *p;
+ v5param_size = sizeof(v5param);
p = acpi_os_map_iomem(pa_v5, sizeof(*p));
if (p) {
- memcpy_fromio(&v5param, p, sizeof(v5param));
+ int offset, len;
+
+ memcpy_fromio(&v5param, p, v5param_size);
acpi5 = 1;
check_vendor_extension(pa_v5, &v5param);
+ if (available_error_type & ACPI65_EINJV2_SUPP) {
+ len = v5param.einjv2_struct.length;
+ offset = offsetof(struct einjv2_extension_struct, component_arr);
+ nr_components = (len - offset) /
+ sizeof(v5param.einjv2_struct.component_arr[0]);
+ /*
+ * The first call to acpi_os_map_iomem above does not include the
+ * component array, instead it is used to read and calculate maximum
+ * number of components supported by the system. Below, the mapping
+ * is expanded to include the component array.
+ */
+ acpi_os_unmap_iomem(p, v5param_size);
+ offset = offsetof(struct set_error_type_with_address, einjv2_struct);
+ v5param_size = offset + struct_size(&v5param.einjv2_struct,
+ component_arr, nr_components);
+ p = acpi_os_map_iomem(pa_v5, v5param_size);
+ }
return p;
}
}
@@ -486,6 +518,104 @@ static int __einj_error_trigger(u64 trigger_paddr, u32 type,
return rc;
}
+/*
+ * parse_hex_to_u8() - convert a hex string into a COMPONENT_LEN-byte array
+ * @str: NUL-terminated hex string, optionally prefixed with "0x" or "0X"
+ * @arr: output buffer of at least COMPONENT_LEN bytes
+ *
+ * The digits are left-padded with '0' up to 2 * COMPONENT_LEN characters and
+ * then stored in @arr least-significant byte first.
+ *
+ * Return: 0 on success, -EINVAL if @str holds no digits, holds more than
+ * 2 * COMPONENT_LEN digits, or contains a non-hexadecimal character.
+ */
+static int parse_hex_to_u8(char *str, u8 *arr)
+{
+	char val[2 * COMPONENT_LEN];
+	int pad, str_len;
+
+	if (str[0] == '0' && (str[1] == 'x' || str[1] == 'X'))
+		str += 2;
+
+	str_len = strlen(str);
+	if (str_len == 0 || str_len > (int)sizeof(val))
+		return -EINVAL;
+
+	/*
+	 * Validate the source string by length. val is never NUL-terminated,
+	 * so it must not be scanned for a terminator.
+	 */
+	for (int i = 0; i < str_len; ++i) {
+		if (!isxdigit((unsigned char)str[i]))
+			return -EINVAL;
+	}
+
+	/* Right-align the digits and fill the leading positions with '0' */
+	pad = sizeof(val) - str_len;
+	memset(val, '0', pad);
+	memcpy(val + pad, str, str_len);
+
+	for (int i = 0; i < COMPONENT_LEN; ++i) {
+		char byte_str[3] = {val[i * 2], val[i * 2 + 1], '\0'};
+		/* write bytes in little endian format to follow ACPI specs */
+		arr[COMPONENT_LEN - i - 1] = (u8)strtoul(byte_str, NULL, 16);
+	}
+
+	return 0;
+}
+
+/*
+ * read_component_array() - fill the EINJv2 component array from user_input
+ * @v5param: parameter buffer whose einjv2_struct component array and
+ *           component_arr_count are written
+ *
+ * user_input is parsed in place (strsep() modifies it). Each line must hold
+ * a component ID and a syndrome as hex values separated by a space or tab.
+ * Which ID/syndrome fields are written is selected by @v5param->type.
+ *
+ * On success user_input is cleared for the next injection.
+ *
+ * Return: 0 on success, -EINVAL if the input is empty or malformed, holds
+ * more than nr_components entries, or @v5param->type is not a known EINJv2
+ * error type.
+ */
+static int read_component_array(struct set_error_type_with_address *v5param)
+{
+	int count = 0, str_len;
+	u8 comp_arr[COMPONENT_LEN], synd_arr[COMPONENT_LEN];
+	struct syndrome_array *component_arr;
+	char *tok, *comp_str, *synd_str, *user;
+
+	component_arr = v5param->einjv2_struct.component_arr;
+	user = user_input;
+	str_len = strlen(user);
+
+	/* Nothing to parse; also avoids indexing user[-1] below */
+	if (!str_len)
+		return -EINVAL;
+
+	/* Strip the trailing newline only if there is one */
+	if (user[str_len - 1] == '\n')
+		user[str_len - 1] = '\0';
+
+	while ((tok = strsep(&user, "\n")) != NULL) {
+		if (count >= nr_components)
+			return -EINVAL;
+
+		comp_str = strsep(&tok, " \t");
+		synd_str = strsep(&tok, " \t");
+
+		if (!comp_str || !synd_str)
+			return -EINVAL;
+
+		if (parse_hex_to_u8(comp_str, comp_arr))
+			return -EINVAL;
+		if (parse_hex_to_u8(synd_str, synd_arr))
+			return -EINVAL;
+
+		switch (v5param->type) {
+		case EINJV2_PROCESSOR_ERROR:
+			for (int i = 0; i < COMPONENT_LEN; ++i) {
+				component_arr[count].comp_id.acpi_id[i] = comp_arr[i];
+				component_arr[count].comp_synd.proc_synd[i] = synd_arr[i];
+			}
+			break;
+		case EINJV2_MEMORY_ERROR:
+			for (int i = 0; i < COMPONENT_LEN; ++i) {
+				component_arr[count].comp_id.device_id[i] = comp_arr[i];
+				component_arr[count].comp_synd.mem_synd[i] = synd_arr[i];
+			}
+			break;
+		case EINJV2_PCIE_ERROR:
+			for (int i = 0; i < COMPONENT_LEN; ++i) {
+				component_arr[count].comp_id.pcie_sbdf[i] = comp_arr[i];
+				component_arr[count].comp_synd.pcie_synd[i] = synd_arr[i];
+			}
+			break;
+		case EINJV2_VENDOR_ERROR:
+			for (int i = 0; i < COMPONENT_LEN; ++i) {
+				component_arr[count].comp_id.vendor_id[i] = comp_arr[i];
+				component_arr[count].comp_synd.vendor_synd[i] = synd_arr[i];
+			}
+			break;
+		default:
+			/* Do not count a component that was never written */
+			return -EINVAL;
+		}
+		count++;
+	}
+	v5param->einjv2_struct.component_arr_count = count;
+
+	/* clear buffer after user input for next injection */
+	memset(user_input, 0, COMP_ARR_SIZE);
+	return 0;
+}
+
static int __einj_error_inject(u32 type, u32 flags, u64 param1, u64 param2,
u64 param3, u64 param4)
{
@@ -500,10 +630,10 @@ static int __einj_error_inject(u32 type, u32 flags, u64 param1, u64 param2,
return rc;
apei_exec_ctx_set_input(&ctx, type);
if (acpi5) {
- struct set_error_type_with_address *v5param, v5_struct;
+ struct set_error_type_with_address *v5param;
- v5param = &v5_struct;
- memcpy_fromio(v5param, einj_param, sizeof(*v5param));
+ v5param = kmalloc(v5param_size, GFP_KERNEL);
+ memcpy_fromio(v5param, einj_param, v5param_size);
v5param->type = type;
if (type & ACPI5_VENDOR_BIT) {
switch (vendor_flags) {
@@ -523,8 +653,19 @@ static int __einj_error_inject(u32 type, u32 flags, u64 param1, u64 param2,
v5param->flags = flags;
v5param->memory_address = param1;
v5param->memory_address_range = param2;
- v5param->apicid = param3;
- v5param->pcie_sbdf = param4;
+
+ if (is_V2) {
+ rc = read_component_array(v5param);
+ if (rc) {
+ kfree(v5param);
+ goto err_out;
+ }
+ /* clear buffer after user input for next injection */
+ memset(user_input, 0, COMP_ARR_SIZE);
+ } else {
+ v5param->apicid = param3;
+ v5param->pcie_sbdf = param4;
+ }
} else {
switch (type) {
case ACPI_EINJ_PROCESSOR_CORRECTABLE:
@@ -548,7 +689,8 @@ static int __einj_error_inject(u32 type, u32 flags, u64 param1, u64 param2,
break;
}
}
- memcpy_toio(einj_param, v5param, sizeof(*v5param));
+ memcpy_toio(einj_param, v5param, v5param_size);
+ kfree(v5param);
} else {
rc = apei_exec_run(&ctx, ACPI_EINJ_SET_ERROR_TYPE);
if (rc)
@@ -600,6 +742,9 @@ static int __einj_error_inject(u32 type, u32 flags, u64 param1, u64 param2,
rc = apei_exec_run_optional(&ctx, ACPI_EINJ_END_OPERATION);
return rc;
+err_out:
+ memset(user_input, 0, COMP_ARR_SIZE);
+ return -EINVAL;
}
/* Inject the specified hardware error */
@@ -610,10 +755,15 @@ int einj_error_inject(u32 type, u32 flags, u64 param1, u64 param2, u64 param3,
u64 base_addr, size;
/* If user manually set "flags", make sure it is legal */
- if (flags && (flags &
- ~(SETWA_FLAGS_APICID|SETWA_FLAGS_MEM|SETWA_FLAGS_PCIE_SBDF)))
+ if (flags && (flags & ~(SETWA_FLAGS_APICID | SETWA_FLAGS_MEM |
+ SETWA_FLAGS_PCIE_SBDF | SETWA_FLAGS_EINJV2)))
return -EINVAL;
+ /* check if type is a valid EINJv2 error type */
+ if (is_V2) {
+ if (!(type & available_error_type_v2))
+ return -EINVAL;
+ }
/*
* We need extra sanity checks for memory errors.
* Other types leap directly to injection.
@@ -764,7 +914,7 @@ int einj_validate_error_type(u64 type)
if (tval & (tval - 1))
return -EINVAL;
if (!vendor)
- if (!(type & available_error_type))
+ if (!(type & (available_error_type | available_error_type_v2)))
return -EINVAL;
return 0;
@@ -783,9 +933,11 @@ static ssize_t error_type_set(struct file *file, const char __user *buf,
if (strncmp(einj_buf, "V2_", 3) == 0) {
if (!sscanf(einj_buf, "V2_%llx", &val))
return -EINVAL;
+ is_V2 = true;
} else {
if (!sscanf(einj_buf, "%llx", &val))
return -EINVAL;
+ is_V2 = false;
}
rc = einj_validate_error_type(val);
@@ -807,6 +959,9 @@ static int error_inject_set(void *data, u64 val)
if (!error_type)
return -EINVAL;
+ if (is_V2)
+ error_flags |= SETWA_FLAGS_EINJV2;
+
return einj_error_inject(error_type, error_flags, error_param1, error_param2,
error_param3, error_param4);
}
@@ -955,7 +1110,7 @@ static void __exit einj_remove(struct platform_device *pdev)
if (einj_param) {
acpi_size size = (acpi5) ?
- sizeof(struct set_error_type_with_address) :
+ v5param_size :
sizeof(struct einj_parameter);
acpi_os_unmap_iomem(einj_param, size);
--
2.43.0
Powered by blists - more mailing lists