[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-Id: <20220420030223.689259-2-tarumizu.kohei@fujitsu.com>
Date: Wed, 20 Apr 2022 12:02:15 +0900
From: Kohei Tarumizu <tarumizu.kohei@...itsu.com>
To: catalin.marinas@....com, will@...nel.org, tglx@...utronix.de,
mingo@...hat.com, bp@...en8.de, dave.hansen@...ux.intel.com,
x86@...nel.org, hpa@...or.com,
linux-arm-kernel@...ts.infradead.org, linux-kernel@...r.kernel.org,
fenghua.yu@...el.com, reinette.chatre@...el.com
Cc: tarumizu.kohei@...itsu.com
Subject: [PATCH v3 1/9] drivers: base: Add hardware prefetch control core driver
This driver adds the register/unregister function to create the
"prefetch_control" directory and some attribute files. Attributes are
only present if the particular cache implements the relevant
prefetcher controls
If the architecture has control of the CPU's hardware prefetcher
behavior, use this function to create sysfs. When registering, it is
necessary to provide what type of hardware prefetcher is supported
and how to read/write to the register.
Following patches add support for A64FX and x86.
Signed-off-by: Kohei Tarumizu <tarumizu.kohei@...itsu.com>
---
drivers/base/pfctl.c | 458 ++++++++++++++++++++++++++++++++++++++++++
include/linux/pfctl.h | 49 +++++
2 files changed, 507 insertions(+)
create mode 100644 drivers/base/pfctl.c
create mode 100644 include/linux/pfctl.h
diff --git a/drivers/base/pfctl.c b/drivers/base/pfctl.c
new file mode 100644
index 000000000000..035d51c64e33
--- /dev/null
+++ b/drivers/base/pfctl.c
@@ -0,0 +1,458 @@
+// SPDX-License-Identifier: GPL-2.0
+/*
+ * Copyright 2022 FUJITSU LIMITED
+ *
+ * This driver provides tunable sysfs interface for Hardware Prefetch Control.
+ * See Documentation/ABI/testing/sysfs-devices-system-cpu for more information.
+ *
+ * This code provides architecture-independent functions such as create and
+ * remove attribute file.
+ * The implementation of reads and writes to the Hardware Prefetch Control
+ * register is architecture-dependent. Therefore, each architecture register
+ * a callback to read and write the register via pfctl_register_driver().
+ */
+
+#include <linux/cacheinfo.h>
+#include <linux/cpu.h>
+#include <linux/device.h>
+#include <linux/pfctl.h>
+#include <linux/parser.h>
+#include <linux/slab.h>
+
+#ifdef pr_fmt
+#undef pr_fmt
+#endif
+#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
+
+static DEFINE_PER_CPU(struct device *, cache_device_pcpu);
+#define per_cpu_cache_device(cpu) (per_cpu(cache_device_pcpu, cpu))
+
+struct pfctl_driver *pdriver;
+enum cpuhp_state hp_online;
+
+static const char dist_auto_string[] = "auto";
+static const char strength_strong_string[] = "strong";
+static const char strength_weak_string[] = "weak";
+
+static bool prefetcher_is_available(unsigned int level, enum cache_type type,
+ int prefetcher)
+{
+ if ((level == 1) && (type == CACHE_TYPE_DATA)) {
+ if (pdriver->supported_l1d_prefetcher & prefetcher)
+ return true;
+ } else if ((level == 2) && (type == CACHE_TYPE_UNIFIED)) {
+ if (pdriver->supported_l2_prefetcher & prefetcher)
+ return true;
+ }
+
+ return false;
+}
+
+/*
+ * Returns the cpu number of the cpu_device(/sys/devices/system/cpu/cpuX)
+ * in the ancestor directory of prefetch_control.
+ *
+ * When initializing this driver, it is verified that the cache directory exists
+ * under cpu_device. Therefore, the third level up from prefetch_control is
+ * cpu_device as shown below.
+ *
+ * /sys/devices/system/cpu/cpuX/cache/indexX/prefetch_control
+ */
+static inline unsigned int get_pfctl_device_cpunum(struct device *pfctl_dev)
+{
+ return pfctl_dev->parent->parent->parent->id;
+}
+
+#define pfctl_enable_show(prefetcher, pattr) \
+static ssize_t \
+prefetcher##_enable_show(struct device *dev, \
+ struct device_attribute *attr, char *buf) \
+{ \
+ int ret; \
+ u64 val; \
+ unsigned int cpu; \
+ struct cacheinfo *this_leaf = dev_get_drvdata(dev->parent); \
+ \
+ cpu = get_pfctl_device_cpunum(dev); \
+ \
+ ret = pdriver->read_pfreg(pattr, cpu, this_leaf->level, &val); \
+ if (ret < 0) \
+ return ret; \
+ \
+ if ((val == PFCTL_ENABLE_VAL) || (val == PFCTL_DISABLE_VAL)) \
+ return sysfs_emit(buf, "%llu\n", val); \
+ else \
+ return -EINVAL; \
+}
+
+pfctl_enable_show(hardware_prefetcher, HWPF_ENABLE);
+pfctl_enable_show(ip_prefetcher, IPPF_ENABLE);
+pfctl_enable_show(adjacent_cache_line_prefetcher, ACLPF_ENABLE);
+pfctl_enable_show(stream_detect_prefetcher, SDPF_ENABLE);
+
+static ssize_t
+stream_detect_prefetcher_strength_show(struct device *dev,
+ struct device_attribute *attr, char *buf)
+{
+ int ret;
+ u64 val;
+ unsigned int cpu;
+ struct cacheinfo *this_leaf = dev_get_drvdata(dev->parent);
+
+ cpu = get_pfctl_device_cpunum(dev);
+
+ ret = pdriver->read_pfreg(SDPF_STRENGTH, cpu, this_leaf->level, &val);
+ if (ret < 0)
+ return ret;
+
+ if (val == PFCTL_STRONG_VAL)
+ return sysfs_emit(buf, "%s\n", strength_strong_string);
+ if (val == PFCTL_WEAK_VAL)
+ return sysfs_emit(buf, "%s\n", strength_weak_string);
+ else
+ return -EINVAL;
+}
+
+static ssize_t
+stream_detect_prefetcher_strength_available_show(struct device *dev,
+ struct device_attribute *attr,
+ char *buf)
+{
+ ssize_t len = 0;
+
+ if (pdriver->supported_sdpf_strength & STRENGTH_STRONG)
+ len += sysfs_emit_at(buf, len, "%s ", strength_strong_string);
+
+ if (pdriver->supported_sdpf_strength & STRENGTH_WEAK)
+ len += sysfs_emit_at(buf, len, "%s ", strength_weak_string);
+
+ len += sysfs_emit_at(buf, len, "\n");
+
+ return len;
+}
+
+static ssize_t
+stream_detect_prefetcher_dist_show(struct device *dev,
+ struct device_attribute *attr, char *buf)
+{
+ int ret;
+ u64 val;
+ unsigned int cpu;
+ struct cacheinfo *this_leaf = dev_get_drvdata(dev->parent);
+
+ cpu = get_pfctl_device_cpunum(dev);
+
+ ret = pdriver->read_pfreg(SDPF_DIST, cpu, this_leaf->level, &val);
+ if (ret < 0)
+ return ret;
+
+ if (val == PFCTL_DIST_AUTO_VAL)
+ return sysfs_emit(buf, "%s\n", dist_auto_string);
+ else
+ return sysfs_emit(buf, "%llu\n", val);
+}
+
+#define pfctl_enable_store(prefetcher, pattr) \
+static ssize_t \
+prefetcher##_enable_store(struct device *dev, \
+ struct device_attribute *attr, \
+ const char *buf, size_t count) \
+{ \
+ int ret; \
+ u64 val; \
+ unsigned int cpu; \
+ struct cacheinfo *this_leaf = dev_get_drvdata(dev->parent); \
+ \
+ ret = kstrtoull(buf, 10, &val); \
+ if (ret < 0) \
+ return -EINVAL; \
+ \
+ if ((val != PFCTL_ENABLE_VAL) && (val != PFCTL_DISABLE_VAL)) \
+ return -EINVAL; \
+ \
+ cpu = get_pfctl_device_cpunum(dev); \
+ \
+ ret = pdriver->write_pfreg(pattr, cpu, this_leaf->level, val); \
+ if (ret < 0) \
+ return ret; \
+ \
+ return count; \
+}
+
+pfctl_enable_store(hardware_prefetcher, HWPF_ENABLE);
+pfctl_enable_store(ip_prefetcher, IPPF_ENABLE);
+pfctl_enable_store(adjacent_cache_line_prefetcher, ACLPF_ENABLE);
+pfctl_enable_store(stream_detect_prefetcher, SDPF_ENABLE);
+
+static ssize_t
+stream_detect_prefetcher_strength_store(struct device *dev,
+ struct device_attribute *attr,
+ const char *buf, size_t count)
+{
+ int ret;
+ u64 val;
+ unsigned int cpu;
+ struct cacheinfo *this_leaf = dev_get_drvdata(dev->parent);
+
+ if (sysfs_streq(buf, strength_strong_string))
+ val = PFCTL_STRONG_VAL;
+ else if (sysfs_streq(buf, strength_weak_string))
+ val = PFCTL_WEAK_VAL;
+ else
+ return -EINVAL;
+
+ cpu = get_pfctl_device_cpunum(dev);
+
+ ret = pdriver->write_pfreg(SDPF_STRENGTH, cpu, this_leaf->level, val);
+ if (ret < 0)
+ return ret;
+
+ return count;
+}
+
+static ssize_t
+stream_detect_prefetcher_dist_store(struct device *dev,
+ struct device_attribute *attr,
+ const char *buf, size_t count)
+{
+ int ret;
+ u64 val;
+ unsigned int cpu;
+ struct cacheinfo *this_leaf = dev_get_drvdata(dev->parent);
+
+ if (sysfs_streq(buf, dist_auto_string)) {
+ val = PFCTL_DIST_AUTO_VAL;
+ } else {
+ ret = kstrtoull(buf, 10, &val);
+ if (ret < 0 || val < 1)
+ return -EINVAL;
+ }
+
+ cpu = get_pfctl_device_cpunum(dev);
+
+ ret = pdriver->write_pfreg(SDPF_DIST, cpu, this_leaf->level, val);
+ if (ret < 0)
+ return ret;
+
+ return count;
+}
+
+static DEVICE_ATTR_ADMIN_RW(hardware_prefetcher_enable);
+static DEVICE_ATTR_ADMIN_RW(ip_prefetcher_enable);
+static DEVICE_ATTR_ADMIN_RW(adjacent_cache_line_prefetcher_enable);
+static DEVICE_ATTR_ADMIN_RW(stream_detect_prefetcher_enable);
+static DEVICE_ATTR_ADMIN_RW(stream_detect_prefetcher_strength);
+static DEVICE_ATTR_ADMIN_RO(stream_detect_prefetcher_strength_available);
+static DEVICE_ATTR_ADMIN_RW(stream_detect_prefetcher_dist);
+
+static umode_t
+pfctl_attrs_is_visible(struct kobject *kobj, struct attribute *attr, int unused)
+{
+ struct device *dev = kobj_to_dev(kobj);
+ struct cacheinfo *this_leaf = dev_get_drvdata(dev->parent);
+ umode_t mode = attr->mode;
+
+ if ((attr == &dev_attr_hardware_prefetcher_enable.attr) &&
+ (prefetcher_is_available(this_leaf->level, this_leaf->type, HWPF)))
+ return mode;
+
+ if ((attr == &dev_attr_ip_prefetcher_enable.attr) &&
+ (prefetcher_is_available(this_leaf->level, this_leaf->type, IPPF)))
+ return mode;
+
+ if ((attr == &dev_attr_adjacent_cache_line_prefetcher_enable.attr) &&
+ (prefetcher_is_available(this_leaf->level, this_leaf->type, ACLPF)))
+ return mode;
+
+ if (((attr == &dev_attr_stream_detect_prefetcher_enable.attr) ||
+ (attr == &dev_attr_stream_detect_prefetcher_strength.attr) ||
+ (attr == &dev_attr_stream_detect_prefetcher_strength_available.attr)
+ || (attr == &dev_attr_stream_detect_prefetcher_dist.attr)) &&
+ (prefetcher_is_available(this_leaf->level, this_leaf->type, SDPF)))
+ return mode;
+
+ return 0;
+}
+
+static struct attribute *pfctl_attrs[] = {
+ &dev_attr_hardware_prefetcher_enable.attr,
+ &dev_attr_ip_prefetcher_enable.attr,
+ &dev_attr_adjacent_cache_line_prefetcher_enable.attr,
+ &dev_attr_stream_detect_prefetcher_enable.attr,
+ &dev_attr_stream_detect_prefetcher_strength.attr,
+ &dev_attr_stream_detect_prefetcher_strength_available.attr,
+ &dev_attr_stream_detect_prefetcher_dist.attr,
+ NULL,
+};
+
+static const struct attribute_group pfctl_group = {
+ .attrs = pfctl_attrs,
+ .is_visible = pfctl_attrs_is_visible,
+};
+
+static const struct attribute_group *pfctl_groups[] = {
+ &pfctl_group,
+ NULL,
+};
+
+static int find_cache_device(unsigned int cpu)
+{
+ struct device *cpu_dev = get_cpu_device(cpu);
+ struct device *cache_dev;
+
+ cache_dev = device_find_child_by_name(cpu_dev, "cache");
+ if (!cache_dev)
+ return -ENODEV;
+
+ per_cpu_cache_device(cpu) = cache_dev;
+ return 0;
+}
+
+static int _remove_pfctl_attr(struct device *dev, void *data)
+{
+ struct cacheinfo *leaf = dev_get_drvdata(dev);
+ struct device *pfctl_dev;
+
+ if (!prefetcher_is_available(leaf->level, leaf->type, ANYPF))
+ return 0;
+
+ pfctl_dev = device_find_child_by_name(dev, "prefetch_control");
+ if (!pfctl_dev)
+ return 0;
+
+ device_unregister(pfctl_dev);
+ put_device(pfctl_dev);
+ return 0;
+}
+
+static void remove_pfctl_attr(unsigned int cpu)
+{
+ struct device *cache_dev = per_cpu_cache_device(cpu);
+
+ if (!cache_dev)
+ return;
+
+ device_for_each_child(cache_dev, NULL, _remove_pfctl_attr);
+ put_device(cache_dev);
+}
+
+static int _create_pfctl_attr(struct device *dev, void *data)
+{
+ struct cacheinfo *leaf = dev_get_drvdata(dev);
+ struct device *pfctl_dev;
+
+ if (!prefetcher_is_available(leaf->level, leaf->type, ANYPF))
+ return 0;
+
+ pfctl_dev = cpu_device_create(dev, NULL, pfctl_groups,
+ "prefetch_control");
+ if (IS_ERR(pfctl_dev))
+ return PTR_ERR(pfctl_dev);
+
+ return 0;
+}
+
+static int create_pfctl_attr(unsigned int cpu)
+{
+ int ret;
+ struct device *cache_dev = per_cpu_cache_device(cpu);
+
+ if (!cache_dev)
+ return -ENODEV;
+
+ ret = device_for_each_child(cache_dev, NULL, _create_pfctl_attr);
+ if (ret < 0)
+ return ret;
+
+ return 0;
+}
+
+static int pfctl_online(unsigned int cpu)
+{
+ int ret;
+
+ ret = find_cache_device(cpu);
+ if (ret < 0)
+ return ret;
+
+ ret = create_pfctl_attr(cpu);
+ if (ret < 0)
+ return ret;
+
+ return 0;
+}
+
+static int pfctl_prepare_down(unsigned int cpu)
+{
+ remove_pfctl_attr(cpu);
+
+ return 0;
+}
+
+/**
+ * pfctl_register_driver - register a Hardware Prefetch Control driver
+ * @driver_data: struct pfctl_driver must contain the supported prefetcher type
+ * and function pointer for reading and writing hardware prefetch
+ * register. If these are not defined this function return error.
+ *
+ * Note: This function must be called after the cache device is initialized
+ * because it requires access to the cache device.
+ * (e.g. Call at the late_initcall)
+ *
+ * Context: Any context.
+ * Return: 0 on success, negative error code on failure.
+ */
+int pfctl_register_driver(struct pfctl_driver *driver_data)
+{
+ int ret;
+
+ if (pdriver)
+ return -EEXIST;
+
+ if (!(driver_data->supported_l1d_prefetcher & ANYPF) &&
+ !(driver_data->supported_l2_prefetcher & ANYPF))
+ return -EINVAL;
+
+ if ((driver_data->supported_l1d_prefetcher & SDPF) ||
+ (driver_data->supported_l2_prefetcher & SDPF))
+ if (!(driver_data->supported_sdpf_strength & ANY_STRENGTH))
+ return -EINVAL;
+
+ if (!driver_data->read_pfreg || !driver_data->write_pfreg)
+ return -EINVAL;
+
+ pdriver = driver_data;
+
+ ret = cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, "base/pfctl:online",
+ pfctl_online, pfctl_prepare_down);
+ if (ret < 0) {
+ pr_err("failed to register hotplug callbacks\n");
+ pdriver = NULL;
+ return ret;
+ }
+
+ hp_online = ret;
+
+ return 0;
+}
+EXPORT_SYMBOL_GPL(pfctl_register_driver);
+
+/**
+ * pfctl_unregister_driver - unregister the Hardware Prefetch Control driver
+ * @driver_data: Used to verify that this function is called by the driver that
+ * called pfctl_register_driver by determining if driver_data is
+ * the same.
+ *
+ * Context: Any context.
+ * Return: nothing.
+ */
+void pfctl_unregister_driver(struct pfctl_driver *driver_data)
+{
+ if (!pdriver || (driver_data != pdriver))
+ return;
+
+ cpuhp_remove_state(hp_online);
+
+ pdriver = NULL;
+}
+EXPORT_SYMBOL_GPL(pfctl_unregister_driver);
diff --git a/include/linux/pfctl.h b/include/linux/pfctl.h
new file mode 100644
index 000000000000..9340b23f3d03
--- /dev/null
+++ b/include/linux/pfctl.h
@@ -0,0 +1,49 @@
+/* SPDX-License-Identifier: GPL-2.0 */
+#ifndef _LINUX_PFCTL_H
+#define _LINUX_PFCTL_H
+
+#define PFCTL_ENABLE_VAL 1
+#define PFCTL_DISABLE_VAL 0
+#define PFCTL_STRONG_VAL 0
+#define PFCTL_WEAK_VAL 1
+#define PFCTL_DIST_AUTO_VAL 0
+
+enum pfctl_attr {
+ HWPF_ENABLE,
+ IPPF_ENABLE,
+ ACLPF_ENABLE,
+ SDPF_ENABLE,
+ SDPF_STRENGTH,
+ SDPF_DIST,
+};
+
+enum prefetcher {
+ HWPF = BIT(0), /* Hardware Prefetcher */
+ IPPF = BIT(1), /* IP Prefetcher */
+ ACLPF = BIT(2), /* Adjacent Cache Line Prefetcher */
+ SDPF = BIT(3), /* Stream Detect Prefetcher */
+ ANYPF = HWPF|IPPF|ACLPF|SDPF,
+};
+
+enum strength {
+ STRENGTH_STRONG = BIT(0),
+ STRENGTH_WEAK = BIT(1),
+ ANY_STRENGTH = STRENGTH_STRONG|STRENGTH_WEAK,
+};
+
+struct pfctl_driver {
+ unsigned int supported_l1d_prefetcher;
+ unsigned int supported_l2_prefetcher;
+
+ unsigned int supported_sdpf_strength; /* Set this if support SDPF */
+
+ int (*read_pfreg)(enum pfctl_attr pattr, unsigned int cpu,
+ unsigned int level, u64 *val);
+ int (*write_pfreg)(enum pfctl_attr pattr, unsigned int cpu,
+ unsigned int level, u64 val);
+};
+
+int pfctl_register_driver(struct pfctl_driver *driver_data);
+void pfctl_unregister_driver(struct pfctl_driver *driver_data);
+
+#endif
--
2.27.0
Powered by blists - more mailing lists