[<prev] [next>] [<thread-prev] [day] [month] [year] [list]
Message-ID: <g4txrmmww3werfhho6t625ciqknvyhvqhndceyf6z2pqiygnlr@2pktdkpwrcas>
Date: Thu, 15 Jan 2026 17:48:27 +0900
From: Koichiro Den <den@...inux.co.jp>
To: Frank Li <Frank.li@....com>
Cc: jingoohan1@...il.com, mani@...nel.org, lpieralisi@...nel.org,
kwilczynski@...nel.org, robh@...nel.org, bhelgaas@...gle.com, cassel@...nel.org,
vigneshr@...com, s-vadapalli@...com, hongxing.zhu@....com, l.stach@...gutronix.de,
shawnguo@...nel.org, s.hauer@...gutronix.de, kernel@...gutronix.de,
festevam@...il.com, minghuan.Lian@....com, mingkai.hu@....com, roy.zang@....com,
jesper.nilsson@...s.com, heiko@...ech.de, srikanth.thokala@...el.com,
marek.vasut+renesas@...il.com, yoshihiro.shimoda.uh@...esas.com, geert+renesas@...der.be,
magnus.damm@...il.com, christian.bruel@...s.st.com, mcoquelin.stm32@...il.com,
alexandre.torgue@...s.st.com, thierry.reding@...il.com, jonathanh@...dia.com,
hayashi.kunihiko@...ionext.com, mhiramat@...nel.org, kishon@...nel.org, jirislaby@...nel.org,
rongqianfeng@...o.com, 18255117159@....com, shawn.lin@...k-chips.com,
nicolas.frattaroli@...labora.com, linux.amoon@...il.com, vidyas@...dia.com,
linux-omap@...r.kernel.org, linux-pci@...r.kernel.org, linux-arm-kernel@...ts.infradead.org,
linux-kernel@...r.kernel.org, imx@...ts.linux.dev, linuxppc-dev@...ts.ozlabs.org,
linux-arm-kernel@...s.com, linux-rockchip@...ts.infradead.org,
linux-arm-msm@...r.kernel.org, linux-renesas-soc@...r.kernel.org,
linux-stm32@...md-mailman.stormreply.com, linux-tegra@...r.kernel.org
Subject: Re: [PATCH v7 5/6] PCI: dwc: ep: Support BAR subrange inbound
mapping via Address Match Mode iATU
On Tue, Jan 13, 2026 at 03:53:52PM -0500, Frank Li wrote:
> On Wed, Jan 14, 2026 at 01:27:18AM +0900, Koichiro Den wrote:
> > Extend dw_pcie_ep_set_bar() to support inbound mappings for BAR
> > subranges using Address Match Mode IB iATU.
> >
> > Rename the existing BAR-match helper into dw_pcie_ep_ib_atu_bar() and
> > introduce dw_pcie_ep_ib_atu_addr() for Address Match Mode. When
> > use_submap is set, read the assigned BAR base address and program one
> > inbound iATU window per subrange. Validate the submap array before
> > programming:
> > - each subrange is aligned to pci->region_align
> > - subranges cover the whole BAR (no gaps and no overlaps)
> > - subranges are sorted in ascending order by offset
> >
> > Track Address Match Mode mappings and tear them down on clear_bar() and
> > on set_bar() error paths to avoid leaving half-programmed state or
> > untranslated BAR holes.
> >
> > Advertise this capability by setting subrange_mapping in the EPC
> > features returned from dw_pcie_ep_get_features().
> >
> > Reviewed-by: Niklas Cassel <cassel@...nel.org>
> > Signed-off-by: Koichiro Den <den@...inux.co.jp>
> > ---
> > .../pci/controller/dwc/pcie-designware-ep.c | 230 +++++++++++++++++-
> > drivers/pci/controller/dwc/pcie-designware.h | 2 +
> > 2 files changed, 222 insertions(+), 10 deletions(-)
> >
> > diff --git a/drivers/pci/controller/dwc/pcie-designware-ep.c b/drivers/pci/controller/dwc/pcie-designware-ep.c
> > index 0e5a8d200b00..b2ea2c2c986f 100644
> > --- a/drivers/pci/controller/dwc/pcie-designware-ep.c
> > +++ b/drivers/pci/controller/dwc/pcie-designware-ep.c
> > @@ -139,9 +139,10 @@ static int dw_pcie_ep_write_header(struct pci_epc *epc, u8 func_no, u8 vfunc_no,
> > return 0;
> > }
> >
> > -static int dw_pcie_ep_inbound_atu(struct dw_pcie_ep *ep, u8 func_no, int type,
> > - dma_addr_t parent_bus_addr, enum pci_barno bar,
> > - size_t size)
> > +/* BAR Match Mode inbound iATU mapping */
> > +static int dw_pcie_ep_ib_atu_bar(struct dw_pcie_ep *ep, u8 func_no, int type,
> > + dma_addr_t parent_bus_addr, enum pci_barno bar,
> > + size_t size)
> > {
> > int ret;
> > u32 free_win;
> > @@ -174,6 +175,208 @@ static int dw_pcie_ep_inbound_atu(struct dw_pcie_ep *ep, u8 func_no, int type,
> > return 0;
> > }
> >
> ...
> > +static int dw_pcie_ep_validate_submap(struct dw_pcie_ep *ep,
> > + const struct pci_epf_bar_submap *submap,
> > + unsigned int num_submap, size_t bar_size)
> > +{
> > + struct dw_pcie *pci = to_dw_pcie_from_ep(ep);
> > + u32 align = pci->region_align;
> > + size_t expected = 0;
> > + size_t size, off;
> > + unsigned int i;
> > +
> > + if (!align || !IS_ALIGNED(bar_size, align))
> > + return -EINVAL;
> > +
> > + /*
> > + * The array is expected to be sorted by offset before calling this
> > + * helper. With sorted entries, we can enforce a strict, gapless
> > + * decomposition of the BAR:
> > + * - each entry has a non-zero size
> > + * - offset/size/phys_addr are aligned to pci->region_align
> > + * - each entry lies within the BAR range
> > + * - entries are contiguous (no overlaps, no holes)
> > + * - the entries exactly cover the whole BAR
> > + *
> > + * Note: dw_pcie_prog_inbound_atu() also checks alignment for
> > + * offset/phys_addr, but validating up-front avoids partially
> > + * programming iATU windows in vain.
> > + */
> > + for (i = 0; i < num_submap; i++) {
> > + off = submap[i].offset;
> > + size = submap[i].size;
> > +
> > + if (!size)
> > + return -EINVAL;
> > +
> > + if (!IS_ALIGNED(size, align) || !IS_ALIGNED(off, align))
> > + return -EINVAL;
> > +
> > + if (!IS_ALIGNED(submap[i].phys_addr, align))
> > + return -EINVAL;
> > +
> > + if (off > bar_size || size > bar_size - off)
> > + return -EINVAL;
> > +
> > + /* Enforce contiguity (no overlaps, no holes). */
> > + if (off != expected)
> > + return -EINVAL;
>
> submap[i].offset is unnecessary, you can use expected += size as off.
> code logic will be simple.
Will fix this. as per my earlier response:
https://lore.kernel.org/all/ngvqrju3bi6sugynhksxsci6rmgqevzpoijjflp2373c6uxlum@vyepxqghbzvn/
>
> Frank
> > +
> > + expected += size;
> > + }
> > + if (expected != bar_size)
> > + return -EINVAL;
> > +
> > + return 0;
> > +}
> > +
> > +/* Address Match Mode inbound iATU mapping */
> > +static int dw_pcie_ep_ib_atu_addr(struct dw_pcie_ep *ep, u8 func_no, int type,
> > + const struct pci_epf_bar *epf_bar)
> > +{
> > + const struct pci_epf_bar_submap *submap = epf_bar->submap;
> > + struct dw_pcie *pci = to_dw_pcie_from_ep(ep);
> > + enum pci_barno bar = epf_bar->barno;
> > + struct device *dev = pci->dev;
> > + u64 pci_addr, parent_bus_addr;
> > + struct dw_pcie_ib_map *new;
> > + u64 size, off, base;
> > + unsigned long flags;
> > + int free_win, ret;
> > + unsigned int i;
> > +
> > + if (!epf_bar->num_submap || !submap || !epf_bar->size)
> > + return -EINVAL;
> > +
> > + ret = dw_pcie_ep_validate_submap(ep, submap, epf_bar->num_submap,
> > + epf_bar->size);
> > + if (ret)
> > + return ret;
> > +
> > + base = dw_pcie_ep_read_bar_assigned(ep, func_no, bar, epf_bar->flags);
> > + if (!base) {
> > + dev_err(dev,
> > + "BAR%u not assigned, cannot set up sub-range mappings\n",
> > + bar);
> > + return -EINVAL;
> > + }
> > +
> > + /* Tear down any existing mappings before (re)programming. */
> > + dw_pcie_ep_clear_ib_maps(ep, bar);
> > +
> > + for (i = 0; i < epf_bar->num_submap; i++) {
> > + off = submap[i].offset;
> > + size = submap[i].size;
> > + parent_bus_addr = submap[i].phys_addr;
> > +
> > + if (off > (~0ULL) - base) {
> > + ret = -EINVAL;
> > + goto err;
> > + }
> > +
> > + pci_addr = base + off;
> > +
> > + new = devm_kzalloc(dev, sizeof(*new), GFP_KERNEL);
> > + if (!new) {
> > + ret = -ENOMEM;
> > + goto err;
> > + }
>
> Simple alloc an array struct dw_pcie_ib_map[num_submap] should be simpler
> than link list and alloc some small news.
I'll do so in v8. Thank you for the review!
Koichiro
>
> Frank
> > +
> > + spin_lock_irqsave(&ep->ib_map_lock, flags);
> > +
> > + free_win = find_first_zero_bit(ep->ib_window_map,
> > + pci->num_ib_windows);
> > + if (free_win >= pci->num_ib_windows) {
> > + spin_unlock_irqrestore(&ep->ib_map_lock, flags);
> > + devm_kfree(dev, new);
> > + ret = -ENOSPC;
> > + goto err;
> > + }
> > + set_bit(free_win, ep->ib_window_map);
> > +
> > + new->bar = bar;
> > + new->index = free_win;
> > + new->pci_addr = pci_addr;
> > + new->parent_bus_addr = parent_bus_addr;
> > + new->size = size;
> > + list_add_tail(&new->list, &ep->ib_map_list);
> > +
> > + spin_unlock_irqrestore(&ep->ib_map_lock, flags);
> > +
> > + ret = dw_pcie_prog_inbound_atu(pci, free_win, type,
> > + parent_bus_addr, pci_addr, size);
> > + if (ret) {
> > + spin_lock_irqsave(&ep->ib_map_lock, flags);
> > + list_del(&new->list);
> > + clear_bit(free_win, ep->ib_window_map);
> > + spin_unlock_irqrestore(&ep->ib_map_lock, flags);
> > + devm_kfree(dev, new);
> > + goto err;
> > + }
> > + }
> > + return 0;
> > +err:
> > + dw_pcie_ep_clear_ib_maps(ep, bar);
> > + return ret;
> > +}
> > +
> > static int dw_pcie_ep_outbound_atu(struct dw_pcie_ep *ep,
> > struct dw_pcie_ob_atu_cfg *atu)
> > {
> > @@ -204,17 +407,15 @@ static void dw_pcie_ep_clear_bar(struct pci_epc *epc, u8 func_no, u8 vfunc_no,
> > struct dw_pcie_ep *ep = epc_get_drvdata(epc);
> > struct dw_pcie *pci = to_dw_pcie_from_ep(ep);
> > enum pci_barno bar = epf_bar->barno;
> > - u32 atu_index = ep->bar_to_atu[bar] - 1;
> >
> > - if (!ep->bar_to_atu[bar])
> > + if (!ep->epf_bar[bar])
> > return;
> >
> > __dw_pcie_ep_reset_bar(pci, func_no, bar, epf_bar->flags);
> >
> > - dw_pcie_disable_atu(pci, PCIE_ATU_REGION_DIR_IB, atu_index);
> > - clear_bit(atu_index, ep->ib_window_map);
> > + dw_pcie_ep_clear_ib_maps(ep, bar);
> > +
> > ep->epf_bar[bar] = NULL;
> > - ep->bar_to_atu[bar] = 0;
> > }
> >
> > static unsigned int dw_pcie_ep_get_rebar_offset(struct dw_pcie *pci,
> > @@ -408,8 +609,12 @@ static int dw_pcie_ep_set_bar(struct pci_epc *epc, u8 func_no, u8 vfunc_no,
> > else
> > type = PCIE_ATU_TYPE_IO;
> >
> > - ret = dw_pcie_ep_inbound_atu(ep, func_no, type, epf_bar->phys_addr, bar,
> > - size);
> > + if (epf_bar->use_submap)
> > + ret = dw_pcie_ep_ib_atu_addr(ep, func_no, type, epf_bar);
> > + else
> > + ret = dw_pcie_ep_ib_atu_bar(ep, func_no, type,
> > + epf_bar->phys_addr, bar, size);
> > +
> > if (ret)
> > return ret;
> >
> > @@ -638,6 +843,9 @@ dw_pcie_ep_get_features(struct pci_epc *epc, u8 func_no, u8 vfunc_no)
> > /* All DWC-based glue drivers support dynamic inbound mapping */
> > features->dynamic_inbound_mapping = true;
> >
> > + /* All DWC-based glue drivers support inbound subrange mapping */
> > + features->subrange_mapping = true;
> > +
> > return features;
> > }
> >
> > @@ -1128,6 +1336,8 @@ int dw_pcie_ep_init(struct dw_pcie_ep *ep)
> > struct device *dev = pci->dev;
> >
> > INIT_LIST_HEAD(&ep->func_list);
> > + INIT_LIST_HEAD(&ep->ib_map_list);
> > + spin_lock_init(&ep->ib_map_lock);
> > ep->msi_iatu_mapped = false;
> > ep->msi_msg_addr = 0;
> > ep->msi_map_size = 0;
> > diff --git a/drivers/pci/controller/dwc/pcie-designware.h b/drivers/pci/controller/dwc/pcie-designware.h
> > index 4dda9a38d46b..969b1f32dddf 100644
> > --- a/drivers/pci/controller/dwc/pcie-designware.h
> > +++ b/drivers/pci/controller/dwc/pcie-designware.h
> > @@ -479,6 +479,8 @@ struct dw_pcie_ep {
> > phys_addr_t *outbound_addr;
> > unsigned long *ib_window_map;
> > unsigned long *ob_window_map;
> > + struct list_head ib_map_list;
> > + spinlock_t ib_map_lock;
> > void __iomem *msi_mem;
> > phys_addr_t msi_mem_phys;
> > struct pci_epf_bar *epf_bar[PCI_STD_NUM_BARS];
> > --
> > 2.51.0
> >
Powered by blists - more mailing lists