[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <20250912144514.526441-9-rrichter@amd.com>
Date: Fri, 12 Sep 2025 16:45:10 +0200
From: Robert Richter <rrichter@....com>
To: Alison Schofield <alison.schofield@...el.com>, Vishal Verma
<vishal.l.verma@...el.com>, Ira Weiny <ira.weiny@...el.com>, Dan Williams
<dan.j.williams@...el.com>, Jonathan Cameron <Jonathan.Cameron@...wei.com>,
Dave Jiang <dave.jiang@...el.com>, Davidlohr Bueso <dave@...olabs.net>
CC: <linux-cxl@...r.kernel.org>, <linux-kernel@...r.kernel.org>, Gregory Price
<gourry@...rry.net>, "Fabio M. De Francesco"
<fabio.m.de.francesco@...ux.intel.com>, Terry Bowman <terry.bowman@....com>,
Joshua Hahn <joshua.hahnjy@...il.com>, Robert Richter <rrichter@....com>
Subject: [PATCH v3 08/11] cxl/region: Implement endpoint decoder address translation
Systems that need address translation have the endpoint decoders
programmed for a different address space. Host physical addresses
(HPA) are different from their system physical addresses (SPA). The
decoder's address range and interleaving configuration of such
endpoints cannot be used to determine the region parameters. The
region's address range must be an SPA range, which the decoder does not
provide. In addition, an endpoint's incoming HPA is already converted
to the device's physical address (DPA). Thus it has interleaving
disabled.
Address translation may provide different ways to determine an
endpoint's SPA, e.g. it may support a firmware call. This allows the
determination of the region's parameters without inspecting the
endpoint decoders.
Implement the setup of address translation given there is a function
to convert an endpoint's HPA (which is identical to its DPA) to an
SPA. Use the previously introduced cxl_to_hpa_fn callback for this.
Convert the decoder's address range and ensure it is 256MB aligned.
Identify the region's interleaving ways by inspecting the address
ranges. Also determine the interleaving granularity using the address
translation callback. Note that the position of the chunk from one
interleaving block to the next may vary and thus cannot be considered
constant. Address offsets larger than the interleaving block size
cannot be used to calculate the granularity. Thus, probe the
granularity using address translation for various HPAs in the same
interleaving block.
Note that this patch does not yet enable address translation as
callbacks have not been initialized.
Signed-off-by: Robert Richter <rrichter@....com>
---
drivers/cxl/core/region.c | 95 ++++++++++++++++++++++++++++++++++++++-
1 file changed, 94 insertions(+), 1 deletion(-)
diff --git a/drivers/cxl/core/region.c b/drivers/cxl/core/region.c
index 57697504410b..9fb1e9508213 100644
--- a/drivers/cxl/core/region.c
+++ b/drivers/cxl/core/region.c
@@ -3422,16 +3422,109 @@ struct cxl_region_context {
int interleave_granularity;
};
+/*
+ * Translate the HPA range in @ctx to SPA and derive interleave ways and
+ * granularity. Returns 0 on success or if nothing to translate, else -ENXIO.
+ */
+static int setup_address_translation(struct cxl_endpoint_decoder *cxled,
+				     struct cxl_region_context *ctx)
+{
+	struct cxl_port *port = to_cxl_port(cxled->cxld.dev.parent->parent);
+	struct cxl_decoder *cxld = &cxled->cxld;
+	struct range range = ctx->hpa_range;
+	u64 spa_len, len = range_len(&range);
+	u64 base_spa, base = range.start;
+	int ways, gran = SZ_256;
+
+	if (!len || !port->to_hpa)
+		return 0;
+
+	if (!IS_ALIGNED(range.start, SZ_256M) ||
+	    !IS_ALIGNED(range.end + 1, SZ_256M)) {
+		dev_warn(&port->dev,
+			 "CXL address translation: Unaligned decoder HPA range: %#llx-%#llx(%s)\n",
+			 range.start, range.end, dev_name(&cxld->dev));
+		return -ENXIO;
+	}
+
+	/* Translate HPA range to SPA. */
+	range.start = port->to_hpa(cxld, range.start);
+	range.end = port->to_hpa(cxld, range.end);
+
+	if (range.start == ULLONG_MAX || range.end == ULLONG_MAX) {
+		dev_warn(&port->dev,
+			 "CXL address translation: Failed to translate HPA range: %#llx-%#llx:%#llx-%#llx(%s)\n",
+			 range.start, range.end, ctx->hpa_range.start,
+			 ctx->hpa_range.end, dev_name(&cxld->dev));
+		return -ENXIO;
+	}
+
+	/*
+	 * Translated addresses include the interleaving offset. Keep the
+	 * unaligned SPA of @base for probing, then align the range to 256 MB.
+	 */
+	base_spa = range.start;
+	range.start = ALIGN_DOWN(range.start, SZ_256M);
+	range.end = ALIGN(range.end, SZ_256M) - 1;
+
+	spa_len = range_len(&range);
+	if (!spa_len || spa_len % len) {
+		dev_warn(&port->dev,
+			 "CXL address translation: HPA range not contiguous: %#llx-%#llx:%#llx-%#llx(%s)\n",
+			 range.start, range.end, ctx->hpa_range.start,
+			 ctx->hpa_range.end, dev_name(&cxld->dev));
+		return -ENXIO;
+	}
+
+	ways = spa_len / len;
+
+	/*
+	 * Probe the granularity: while base + gran is still in the same
+	 * chunk, its SPA is base_spa + gran. Chunk positions may vary
+	 * between interleaving blocks, so larger offsets cannot be used.
+	 */
+	while (ways > 1 && gran <= SZ_16M) {
+		if (port->to_hpa(cxld, base + gran) != base_spa + gran)
+			break;
+		gran <<= 1;
+	}
+
+	if (gran > SZ_16M) {
+		dev_warn(&port->dev,
+			 "CXL address translation: Cannot determine granularity: %#llx-%#llx:%#llx-%#llx(%s)\n",
+			 range.start, range.end, ctx->hpa_range.start,
+			 ctx->hpa_range.end, dev_name(&cxld->dev));
+		return -ENXIO;
+	}
+
+	ctx->hpa_range = range;
+	ctx->interleave_ways = ways;
+	ctx->interleave_granularity = gran;
+
+	dev_dbg(&cxld->dev,
+		"address mapping found for %s (hpa -> spa): %#llx+%#llx -> %#llx+%#llx ways:%d granularity:%d\n",
+		dev_name(ctx->cxlmd->dev.parent), base, len, range.start,
+		spa_len, ways, gran);
+
+	return 0;
+}
+
static int setup_region_params(struct cxl_endpoint_decoder *cxled,
struct cxl_region_context *ctx)
{
+ int rc;
+
ctx->cxled = cxled;
ctx->cxlmd = cxled_to_memdev(cxled);
ctx->hpa_range = cxled->cxld.hpa_range;
ctx->interleave_ways = cxled->cxld.interleave_ways;
ctx->interleave_granularity = cxled->cxld.interleave_granularity;
- return 0;
+ rc = setup_address_translation(cxled, ctx);
+ if (rc)
+ return rc;
+
+ return rc;
}
static int cxl_extended_linear_cache_resize(struct cxl_region *cxlr,
--
2.39.5
Powered by blists - more mailing lists