Message-ID: <20240603062741.GA3255068@maili.marvell.com>
Date: Mon, 3 Jun 2024 11:57:41 +0530
From: Ratheesh Kannoth <rkannoth@...vell.com>
To: Lorenzo Bianconi <lorenzo@...nel.org>
CC: <netdev@...r.kernel.org>, <nbd@....name>, <lorenzo.bianconi83@...il.com>,
<davem@...emloft.net>, <edumazet@...gle.com>, <kuba@...nel.org>,
<pabeni@...hat.com>, <conor@...nel.org>,
<linux-arm-kernel@...ts.infradead.org>, <robh+dt@...nel.org>,
<krzysztof.kozlowski+dt@...aro.org>, <conor+dt@...nel.org>,
<devicetree@...r.kernel.org>, <catalin.marinas@....com>,
<will@...nel.org>, <upstream@...oha.com>,
<angelogioacchino.delregno@...labora.com>,
<benjamin.larsson@...exis.eu>
Subject: Re: [PATCH net-next 3/3] net: airoha: Introduce ethernet support for
EN7581 SoC
On 2024-05-31 at 15:52:20, Lorenzo Bianconi (lorenzo@...nel.org) wrote:
> +
> +static int airoha_qdma_fill_rx_queue(struct airoha_queue *q)
> +{
> + struct airoha_eth *eth = q->eth;
> + struct device *dev = eth->net_dev->dev.parent;
> + int qid = q - &eth->q_rx[0], nframes = 0;
> +
> + spin_lock_bh(&q->lock);
> + while (q->queued < q->ndesc - 1) {
> + struct airoha_queue_entry *e = &q->entry[q->head];
> + struct airoha_qdma_desc *desc = &q->desc[q->head];
> + enum dma_data_direction dir;
> + struct page *page;
> + int offset;
> + u32 val;
> +
> + page = page_pool_dev_alloc_frag(q->page_pool, &offset,
> + q->buf_size);
> + if (!page)
> + break;
> +
> + q->head = (q->head + 1) % q->ndesc;
Is q->ndesc always a power of 2? If so, (q->head + 1) & (q->ndesc - 1) would yield
fewer instructions and would suffice, right?
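Something like the below, as an untested sketch (assumes q->ndesc is
always a power of two; that could be enforced once at init time with
e.g. WARN_ON(!is_power_of_2(q->ndesc))):

	/* cheap wrap-around, valid only for power-of-2 ring sizes */
	q->head = (q->head + 1) & (q->ndesc - 1);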
> + q->queued++;
> + nframes++;
> +
> + e->buf = page_address(page) + offset;
> + e->dma_addr = page_pool_get_dma_addr(page) + offset;
> + e->dma_len = SKB_WITH_OVERHEAD(q->buf_size);
> + dir = page_pool_get_dma_dir(q->page_pool);
Can we move this out of the while loop? It will be the same for the whole queue.
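Roughly like this (sketch only) - the DMA direction is fixed per page
pool, so one lookup before taking the lock should do:

	enum dma_data_direction dir = page_pool_get_dma_dir(q->page_pool);

	spin_lock_bh(&q->lock);
	while (q->queued < q->ndesc - 1) {
		...
		dma_sync_single_for_device(dev, e->dma_addr, e->dma_len, dir);
		...
	}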
> + dma_sync_single_for_device(dev, e->dma_addr, e->dma_len, dir);
> +
> + val = FIELD_PREP(QDMA_DESC_LEN_MASK, e->dma_len);
> + WRITE_ONCE(desc->ctrl, cpu_to_le32(val));
> + WRITE_ONCE(desc->addr, cpu_to_le32(e->dma_addr));
> + val = FIELD_PREP(QDMA_DESC_NEXT_ID_MASK, q->head);
> + WRITE_ONCE(desc->data, cpu_to_le32(val));
> + WRITE_ONCE(desc->msg0, 0);
> + WRITE_ONCE(desc->msg1, 0);
> + WRITE_ONCE(desc->msg2, 0);
> + WRITE_ONCE(desc->msg3, 0);
> +
> + wmb();
> + airoha_qdma_rmw(eth, REG_RX_CPU_IDX(qid), RX_RING_CPU_IDX_MASK,
> + FIELD_PREP(RX_RING_CPU_IDX_MASK, q->head));
> + }
> + spin_unlock_bh(&q->lock);
> +
> + return nframes;
> +}
> +
> +static int airoha_qdma_rx_process(struct airoha_queue *q, int budget)
> +{
> + struct airoha_eth *eth = q->eth;
> + struct device *dev = eth->net_dev->dev.parent;
> + int done = 0, qid = q - &eth->q_rx[0];
Reverse xmas tree.
> +
> + spin_lock_bh(&q->lock);
> + while (done < budget) {
> + struct airoha_queue_entry *e = &q->entry[q->tail];
> + struct airoha_qdma_desc *desc = &q->desc[q->tail];
> + dma_addr_t dma_addr = le32_to_cpu(desc->addr);
> + u32 desc_ctrl = le32_to_cpu(desc->ctrl);
> + struct sk_buff *skb;
> + int len;
> +
> + if (!(desc_ctrl & QDMA_DESC_DONE_MASK))
> + break;
> +
> + len = FIELD_GET(QDMA_DESC_LEN_MASK, desc_ctrl);
> + if (!dma_addr || !len)
> + break;
> +
> + q->tail = (q->tail + 1) % q->ndesc;
> + q->queued--;
> +
> + dma_sync_single_for_cpu(dev, dma_addr,
> + SKB_WITH_OVERHEAD(q->buf_size),
> + page_pool_get_dma_dir(q->page_pool));
> +
> + skb = napi_build_skb(e->buf, q->buf_size);
> + if (!skb) {
> + page_pool_put_full_page(q->page_pool,
> + virt_to_head_page(e->buf),
> + true);
> + continue;
How does the while loop exit if napi_build_skb() keeps failing? done is not
getting incremented in that case.
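One way to bound the loop would be to count the dropped frame against
the budget (or simply break out), e.g. as a sketch:

		if (!skb) {
			page_pool_put_full_page(q->page_pool,
						virt_to_head_page(e->buf),
						true);
			done++; /* count dropped frame against the budget */
			continue;
		}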
> + }
> +
> + skb_reserve(skb, 2);
> + __skb_put(skb, len);
> +
> + skb_mark_for_recycle(skb);
> + skb->dev = eth->net_dev;
> + skb->protocol = eth_type_trans(skb, eth->net_dev);
> + skb->ip_summed = CHECKSUM_UNNECESSARY;
> + skb_record_rx_queue(skb, qid);
> + napi_gro_receive(&q->napi, skb);
> +
> + done++;
> + }
> + spin_unlock_bh(&q->lock);
> +
> + airoha_qdma_fill_rx_queue(q);
> +
> + return done;
> +}
> +
> +static int airoha_qdma_rx_napi_poll(struct napi_struct *napi, int budget)
> +{
> + struct airoha_queue *q = container_of(napi, struct airoha_queue, napi);
> + struct airoha_eth *eth = q->eth;
> + int cur, done = 0;
> +
> + do {
> + cur = airoha_qdma_rx_process(q, budget - done);
> + done += cur;
> + } while (cur && done < budget);
> +
> + if (done < budget && napi_complete(napi))
> + airoha_qdma_irq_enable(eth, QDMA_INT_REG_IDX1,
> + RX_DONE_INT_MASK);
> +
> + return done;
> +}
> +
> +static int airoha_qdma_init_rx_queue(struct airoha_eth *eth,
> + struct airoha_queue *q, int ndesc)
> +{
> + struct device *dev = eth->net_dev->dev.parent;
> + struct page_pool_params pp_params = {
> + .order = 0,
> + .pool_size = 256,
> + .flags = PP_FLAG_DMA_MAP | PP_FLAG_DMA_SYNC_DEV,
> + .dma_dir = DMA_FROM_DEVICE,
> + .max_len = PAGE_SIZE,
> + .nid = NUMA_NO_NODE,
> + .dev = dev,
> + .napi = &q->napi,
> + };
> + int qid = q - &eth->q_rx[0], thr;
> + dma_addr_t dma_addr;
> +
> + spin_lock_init(&q->lock);
> + q->buf_size = PAGE_SIZE / 2;
> + q->ndesc = ndesc;
> + q->eth = eth;
> +
> + q->entry = devm_kzalloc(dev, q->ndesc * sizeof(*q->entry),
> + GFP_KERNEL);
> + if (!q->entry)
> + return -ENOMEM;
> +
> + q->page_pool = page_pool_create(&pp_params);
> + if (IS_ERR(q->page_pool)) {
> + int err = PTR_ERR(q->page_pool);
> +
> + q->page_pool = NULL;
> + return err;
> + }
> +
> + q->desc = dmam_alloc_coherent(dev, q->ndesc * sizeof(*q->desc),
> + &dma_addr, GFP_KERNEL);
> + if (!q->desc)
Don't we need to destroy the page pool on this error path?
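i.e. something along these lines (sketch):

	if (!q->desc) {
		page_pool_destroy(q->page_pool);
		q->page_pool = NULL;
		return -ENOMEM;
	}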
> + return -ENOMEM;
> +
> + netif_napi_add(eth->net_dev, &q->napi, airoha_qdma_rx_napi_poll);
> +
> + airoha_qdma_wr(eth, REG_RX_RING_BASE(qid), dma_addr);
> + airoha_qdma_rmw(eth, REG_RX_RING_SIZE(qid), RX_RING_SIZE_MASK,
> + FIELD_PREP(RX_RING_SIZE_MASK, ndesc));
> +
> + thr = clamp(ndesc >> 3, 1, 32);
> + airoha_qdma_rmw(eth, REG_RX_RING_SIZE(qid), RX_RING_THR_MASK,
> + FIELD_PREP(RX_RING_THR_MASK, thr));
> + airoha_qdma_rmw(eth, REG_RX_DMA_IDX(qid), RX_RING_DMA_IDX_MASK,
> + FIELD_PREP(RX_RING_DMA_IDX_MASK, q->head));
> +
> + airoha_qdma_fill_rx_queue(q);
> +
> + return 0;
> +}
> +
> +static void airoha_qdma_clenaup_rx_queue(struct airoha_queue *q)
> +{
> + struct airoha_eth *eth = q->eth;
> + struct device *dev = eth->net_dev->dev.parent;
Reverse xmas tree.
> +
> + spin_lock_bh(&q->lock);
> +
> + while (q->queued) {
> + struct airoha_queue_entry *e = &q->entry[q->tail];
> + struct page *page = virt_to_head_page(e->buf);
> + enum dma_data_direction dir;
> +
> + dir = page_pool_get_dma_dir(q->page_pool);
Can we move this out of the while loop, same as in airoha_qdma_fill_rx_queue() above?
> + dma_sync_single_for_cpu(dev, e->dma_addr, e->dma_len, dir);
> + page_pool_put_full_page(q->page_pool, page, false);
> + q->tail = (q->tail + 1) % q->ndesc;
> + q->queued--;
> + }
> +
> + spin_unlock_bh(&q->lock);
> +}
> +
> +static int airoha_qdma_init_rx(struct airoha_eth *eth)
> +{
> + int i;
> +
> + for (i = 0; i < ARRAY_SIZE(eth->q_rx); i++) {
> + int err;
> +
> + if (!(RX_DONE_INT_MASK & BIT(i))) {
> + /* rx-queue not binded to irq */
> + continue;
> + }
> +
> + err = airoha_qdma_init_rx_queue(eth, &eth->q_rx[i],
> + RX_DSCP_NUM(i));
> + if (err)
> + return err;
> + }
> +
> + return 0;
> +}
> +
> +static int airoha_qdma_tx_napi_poll(struct napi_struct *napi, int budget)
> +{
> + struct airoha_tx_irq_queue *irq_q;
> + struct airoha_eth *eth;
> + struct device *dev;
> + int id, done = 0;
> +
> + irq_q = container_of(napi, struct airoha_tx_irq_queue, napi);
> + eth = irq_q->eth;
> + id = irq_q - &eth->q_tx_irq[0];
> + dev = eth->net_dev->dev.parent;
> +
> + while (irq_q->queued > 0 && done < budget) {
> + u32 qid, last, val = irq_q->q[irq_q->head];
> + struct airoha_queue *q;
> +
> + if (val == 0xff)
> + break;
> +
> + irq_q->q[irq_q->head] = 0xff; /* mark as done */
> + irq_q->head = (irq_q->head + 1) % irq_q->size;
> + irq_q->queued--;
> + done++;
> +
> + last = FIELD_GET(IRQ_DESC_IDX_MASK, val);
> + qid = FIELD_GET(IRQ_RING_IDX_MASK, val);
> +
> + if (qid >= ARRAY_SIZE(eth->q_tx))
> + continue;
> +
> + q = &eth->q_tx[qid];
> + spin_lock_bh(&q->lock);
> +
> + while (q->queued > 0) {
> + struct airoha_qdma_desc *desc = &q->desc[q->tail];
> + struct airoha_queue_entry *e = &q->entry[q->tail];
> + u32 desc_ctrl = le32_to_cpu(desc->ctrl);
> + u16 index = q->tail;
> +
> + if (!(desc_ctrl & QDMA_DESC_DONE_MASK) &&
> + !(desc_ctrl & QDMA_DESC_DROP_MASK))
> + break;
> +
> + q->tail = (q->tail + 1) % q->ndesc;
> + q->queued--;
> +
> + dma_unmap_single(dev, e->dma_addr, e->dma_len,
> + DMA_TO_DEVICE);
> + dev_kfree_skb_any(e->skb);
> + e->skb = NULL;
> +
> + WRITE_ONCE(desc->msg0, 0);
> + WRITE_ONCE(desc->msg1, 0);
> +
> + if (index == last)
> + break;
> + }
> +
> + if (__netif_subqueue_stopped(eth->net_dev, qid) &&
> + q->queued + q->free_thr < q->ndesc)
> + netif_wake_subqueue(eth->net_dev, qid);
> +
> + spin_unlock_bh(&q->lock);
> + }
> +
> + if (done) {
> + int i, len = done >> 7;
> +
> + for (i = 0; i < len; i++)
> + airoha_qdma_rmw(eth, REG_IRQ_CLEAR_LEN(id),
> + IRQ_CLEAR_LEN_MASK, 0x80);
> + airoha_qdma_rmw(eth, REG_IRQ_CLEAR_LEN(id),
> + IRQ_CLEAR_LEN_MASK, (done & 0x7f));
> + }
> +
> + if (done < budget && napi_complete(napi))
> + airoha_qdma_irq_enable(eth, QDMA_INT_REG_IDX0,
> + TX_DONE_INT_MASK(id));
> +
> + return done;
> +}
> +
> +static int airoha_qdma_init_tx_queue(struct airoha_eth *eth,
> + struct airoha_queue *q, int size)
> +{
> + struct device *dev = eth->net_dev->dev.parent;
> + int i, qid = q - &eth->q_tx[0];
> + dma_addr_t dma_addr;
> +
> + spin_lock_init(&q->lock);
> + q->ndesc = size;
> + q->eth = eth;
> + q->free_thr = MAX_SKB_FRAGS;
> +
> + q->entry = devm_kzalloc(dev, q->ndesc * sizeof(*q->entry),
> + GFP_KERNEL);
> + if (!q->entry)
> + return -ENOMEM;
> +
> + q->desc = dmam_alloc_coherent(dev, q->ndesc * sizeof(*q->desc),
> + &dma_addr, GFP_KERNEL);
> + if (!q->desc)
> + return -ENOMEM;
> +
> + for (i = 0; i < q->ndesc; i++) {
> + u32 val;
> +
> + val = FIELD_PREP(QDMA_DESC_DONE_MASK, 1);
> + WRITE_ONCE(q->desc[i].ctrl, cpu_to_le32(val));
> + }
> +
> + airoha_qdma_wr(eth, REG_TX_RING_BASE(qid), dma_addr);
> + airoha_qdma_rmw(eth, REG_TX_CPU_IDX(qid), TX_RING_CPU_IDX_MASK,
> + FIELD_PREP(TX_RING_CPU_IDX_MASK, q->head));
> + airoha_qdma_rmw(eth, REG_TX_DMA_IDX(qid), TX_RING_DMA_IDX_MASK,
> + FIELD_PREP(TX_RING_DMA_IDX_MASK, q->head));
> +
> + return 0;
> +}
> +
> +static int airoha_qdma_tx_irq_init(struct airoha_eth *eth,
> + struct airoha_tx_irq_queue *irq_q,
> + int size)
> +{
> + struct device *dev = eth->net_dev->dev.parent;
> + int id = irq_q - &eth->q_tx_irq[0];
> + dma_addr_t dma_addr;
> +
> + netif_napi_add(eth->net_dev, &irq_q->napi, airoha_qdma_tx_napi_poll);
> + irq_q->q = dmam_alloc_coherent(dev, size * sizeof(u32), &dma_addr,
> + GFP_KERNEL);
> + if (!irq_q->q)
> + return -ENOMEM;
> +
> + memset(irq_q->q, 0xff, size * sizeof(u32));
> + irq_q->size = size;
> + irq_q->eth = eth;
> +
> + airoha_qdma_wr(eth, REG_TX_IRQ_BASE(id), dma_addr);
> + airoha_qdma_rmw(eth, REG_TX_IRQ_CFG(id), TX_IRQ_DEPTH_MASK,
> + FIELD_PREP(TX_IRQ_DEPTH_MASK, size));
> + airoha_qdma_rmw(eth, REG_TX_IRQ_CFG(id), TX_IRQ_THR_MASK,
> + FIELD_PREP(TX_IRQ_THR_MASK, 32));
> +
> + return 0;
> +}
> +
> +static int airoha_qdma_init_tx(struct airoha_eth *eth)
> +{
> + int i, err;
> +
> + for (i = 0; i < ARRAY_SIZE(eth->q_tx_irq); i++) {
> + err = airoha_qdma_tx_irq_init(eth, &eth->q_tx_irq[i],
> + IRQ_QUEUE_LEN(i));
> + if (err)
> + return err;
> + }
> +
> + for (i = 0; i < ARRAY_SIZE(eth->q_tx); i++) {
> + err = airoha_qdma_init_tx_queue(eth, &eth->q_tx[i],
> + TX_DSCP_NUM);
> + if (err)
> + return err;
> + }
> +
> + return 0;
> +}
> +
> +static void airoha_qdma_clenaup_tx_queue(struct airoha_queue *q)
> +{
> + struct airoha_eth *eth = q->eth;
> + struct device *dev = eth->net_dev->dev.parent;
> +
> + spin_lock_bh(&q->lock);
> +
> + while (q->queued) {
> + struct airoha_queue_entry *e = &q->entry[q->tail];
> +
> + dma_unmap_single(dev, e->dma_addr, e->dma_len, DMA_TO_DEVICE);
> + dev_kfree_skb_any(e->skb);
> + e->skb = NULL;
> +
> + q->tail = (q->tail + 1) % q->ndesc;
> + q->queued--;
> + }
> +
> + spin_unlock_bh(&q->lock);
> +}
> +
> +static int airoha_qdma_init_hfwd_queues(struct airoha_eth *eth)
> +{
> + struct device *dev = eth->net_dev->dev.parent;
> + dma_addr_t dma_addr;
> + u32 status;
> + int size;
> +
> + size = HW_DSCP_NUM * sizeof(struct airoha_qdma_fwd_desc);
> + eth->hfwd.desc = dmam_alloc_coherent(dev, size, &dma_addr,
> + GFP_KERNEL);
> + if (!eth->hfwd.desc)
> + return -ENOMEM;
> +
> + airoha_qdma_wr(eth, REG_FWD_DSCP_BASE, dma_addr);
> +
> + size = AIROHA_MAX_PACKET_SIZE * HW_DSCP_NUM;
> + eth->hfwd.q = dmam_alloc_coherent(dev, size, &dma_addr, GFP_KERNEL);
> + if (!eth->hfwd.q)
> + return -ENOMEM;
> +
> + airoha_qdma_wr(eth, REG_FWD_BUF_BASE, dma_addr);
> +
> + airoha_qdma_rmw(eth, REG_HW_FWD_DSCP_CFG,
> + HW_FWD_DSCP_PAYLOAD_SIZE_MASK,
> + FIELD_PREP(HW_FWD_DSCP_PAYLOAD_SIZE_MASK, 0));
> + airoha_qdma_rmw(eth, REG_FWD_DSCP_LOW_THR, FWD_DSCP_LOW_THR_MASK,
> + FIELD_PREP(FWD_DSCP_LOW_THR_MASK, 128));
> + airoha_qdma_rmw(eth, REG_LMGR_INIT_CFG,
> + LMGR_INIT_START | LMGR_SRAM_MODE_MASK |
> + HW_FWD_DESC_NUM_MASK,
> + FIELD_PREP(HW_FWD_DESC_NUM_MASK, HW_DSCP_NUM) |
> + LMGR_INIT_START);
> +
> + return read_poll_timeout(airoha_qdma_rr, status,
> + !(status & LMGR_INIT_START), USEC_PER_MSEC,
> + 30 * USEC_PER_MSEC, true, eth,
> + REG_LMGR_INIT_CFG);
> +}
> +
> +static void airoha_qdma_init_qos(struct airoha_eth *eth)
> +{
> + airoha_qdma_clear(eth, REG_TXWRR_MODE_CFG, TWRR_WEIGHT_SCALE_MASK);
> + airoha_qdma_set(eth, REG_TXWRR_MODE_CFG, TWRR_WEIGHT_BASE_MASK);
> +
> + airoha_qdma_clear(eth, REG_PSE_BUF_USAGE_CFG,
> + PSE_BUF_ESTIMATE_EN_MASK);
> +
> + airoha_qdma_set(eth, REG_EGRESS_RATE_METER_CFG,
> + EGRESS_RATE_METER_EN_MASK |
> + EGRESS_RATE_METER_EQ_RATE_EN_MASK);
> + /* 2047us x 31 = 63.457ms */
> + airoha_qdma_rmw(eth, REG_EGRESS_RATE_METER_CFG,
> + EGRESS_RATE_METER_WINDOW_SZ_MASK,
> + FIELD_PREP(EGRESS_RATE_METER_WINDOW_SZ_MASK, 0x1f));
> + airoha_qdma_rmw(eth, REG_EGRESS_RATE_METER_CFG,
> + EGRESS_RATE_METER_TIMESLICE_MASK,
> + FIELD_PREP(EGRESS_RATE_METER_TIMESLICE_MASK, 0x7ff));
> +
> + /* ratelimit init */
> + airoha_qdma_set(eth, REG_GLB_TRTCM_CFG, GLB_TRTCM_EN_MASK);
> + airoha_qdma_rmw(eth, REG_GLB_TRTCM_CFG, GLB_FAST_TICK_MASK,
> + FIELD_PREP(GLB_FAST_TICK_MASK, 25)); /* fast-tick 25us */
> + airoha_qdma_rmw(eth, REG_GLB_TRTCM_CFG, GLB_SLOW_TICK_RATIO_MASK,
> + FIELD_PREP(GLB_SLOW_TICK_RATIO_MASK, 40));
> +
> + airoha_qdma_set(eth, REG_EGRESS_TRTCM_CFG, EGRESS_TRTCM_EN_MASK);
> + airoha_qdma_rmw(eth, REG_EGRESS_TRTCM_CFG, EGRESS_FAST_TICK_MASK,
> + FIELD_PREP(EGRESS_FAST_TICK_MASK, 25));
> + airoha_qdma_rmw(eth, REG_EGRESS_TRTCM_CFG,
> + EGRESS_SLOW_TICK_RATIO_MASK,
> + FIELD_PREP(EGRESS_SLOW_TICK_RATIO_MASK, 40));
> +
> + airoha_qdma_set(eth, REG_INGRESS_TRTCM_CFG, INGRESS_TRTCM_EN_MASK);
> + airoha_qdma_clear(eth, REG_INGRESS_TRTCM_CFG,
> + INGRESS_TRTCM_MODE_MASK);
> + airoha_qdma_rmw(eth, REG_INGRESS_TRTCM_CFG, INGRESS_FAST_TICK_MASK,
> + FIELD_PREP(INGRESS_FAST_TICK_MASK, 125));
> + airoha_qdma_rmw(eth, REG_INGRESS_TRTCM_CFG,
> + INGRESS_SLOW_TICK_RATIO_MASK,
> + FIELD_PREP(INGRESS_SLOW_TICK_RATIO_MASK, 8));
> +
> + airoha_qdma_set(eth, REG_SLA_TRTCM_CFG, SLA_TRTCM_EN_MASK);
> + airoha_qdma_rmw(eth, REG_SLA_TRTCM_CFG, SLA_FAST_TICK_MASK,
> + FIELD_PREP(SLA_FAST_TICK_MASK, 25));
> + airoha_qdma_rmw(eth, REG_SLA_TRTCM_CFG, SLA_SLOW_TICK_RATIO_MASK,
> + FIELD_PREP(SLA_SLOW_TICK_RATIO_MASK, 40));
> +}
> +
> +static int airoha_qdma_hw_init(struct airoha_eth *eth)
> +{
> + int i;
> +
> + /* clear pending irqs */
> + for (i = 0; i < ARRAY_SIZE(eth->irqmask); i++)
> + airoha_qdma_wr(eth, REG_INT_STATUS(i), 0xffffffff);
> +
> + /* setup irqs */
> + airoha_qdma_irq_enable(eth, QDMA_INT_REG_IDX0, INT_IDX0_MASK);
> + airoha_qdma_irq_enable(eth, QDMA_INT_REG_IDX1, INT_IDX1_MASK);
> + airoha_qdma_irq_enable(eth, QDMA_INT_REG_IDX4, INT_IDX4_MASK);
> +
> + /* setup irq binding */
> + for (i = 0; i < ARRAY_SIZE(eth->q_tx); i++) {
> + if (TX_RING_IRQ_BLOCKING_MAP_MASK & BIT(i))
> + airoha_qdma_set(eth, REG_TX_RING_BLOCKING(i),
> + TX_RING_IRQ_BLOCKING_CFG_MASK);
> + else
> + airoha_qdma_clear(eth, REG_TX_RING_BLOCKING(i),
> + TX_RING_IRQ_BLOCKING_CFG_MASK);
> + }
> +
> + airoha_qdma_wr(eth, REG_QDMA_GLOBAL_CFG,
> + GLOBAL_CFG_RX_2B_OFFSET |
> + FIELD_PREP(GLOBAL_CFG_DMA_PREFERENCE_MASK, 3) |
> + GLOBAL_CFG_CPU_TXR_ROUND_ROBIN |
> + GLOBAL_CFG_PAYLOAD_BYTE_SWAP |
> + GLOBAL_CFG_MULTICAST_MODIFY_FP |
> + GLOBAL_CFG_MULTICAST_EN_MASK |
> + GLOBAL_CFG_IRQ0_EN | GLOBAL_CFG_IRQ1_EN |
> + GLOBAL_CFG_TX_WB_DONE |
> + FIELD_PREP(GLOBAL_CFG_MAX_ISSUE_NUM_MASK, 2));
> +
> + airoha_qdma_init_qos(eth);
> +
> + /* disable qdma rx delay interrupt */
> + airoha_qdma_for_each_q_rx(eth, i)
> + airoha_qdma_clear(eth, REG_RX_DELAY_INT_IDX(i),
> + RX_DELAY_INT_MASK);
> +
> + airoha_qdma_set(eth, REG_TXQ_CNGST_CFG,
> + TXQ_CNGST_DROP_EN | TXQ_CNGST_DEI_DROP_EN);
> +
> + return 0;
> +}
> +
> +static irqreturn_t airoha_irq_handler(int irq, void *dev_instance)
> +{
> + struct airoha_eth *eth = dev_instance;
> + u32 intr[ARRAY_SIZE(eth->irqmask)];
> + int i;
> +
> + for (i = 0; i < ARRAY_SIZE(eth->irqmask); i++) {
> + intr[i] = airoha_qdma_rr(eth, REG_INT_STATUS(i));
> + intr[i] &= eth->irqmask[i];
> + airoha_qdma_wr(eth, REG_INT_STATUS(i), intr[i]);
> + }
> +
> + if (!test_bit(DEV_STATE_INITIALIZED, &eth->state))
> + return IRQ_NONE;
> +
> + if (intr[1] & RX_DONE_INT_MASK) {
> + airoha_qdma_irq_disable(eth, QDMA_INT_REG_IDX1,
> + RX_DONE_INT_MASK);
> + airoha_qdma_for_each_q_rx(eth, i) {
> + if (intr[1] & BIT(i))
> + napi_schedule(&eth->q_rx[i].napi);
> + }
> + }
> +
> + if (intr[0] & INT_TX_MASK) {
> + for (i = 0; i < ARRAY_SIZE(eth->q_tx_irq); i++) {
> + struct airoha_tx_irq_queue *irq_q = &eth->q_tx_irq[i];
> + u32 status, head;
> +
> + if (!(intr[0] & TX_DONE_INT_MASK(i)))
> + continue;
> +
> + airoha_qdma_irq_disable(eth, QDMA_INT_REG_IDX0,
> + TX_DONE_INT_MASK(i));
> +
> + status = airoha_qdma_rr(eth, REG_IRQ_STATUS(i));
> + head = FIELD_GET(IRQ_HEAD_IDX_MASK, status);
> + irq_q->head = head % irq_q->size;
> + irq_q->queued = FIELD_GET(IRQ_ENTRY_LEN_MASK, status);
> +
> + napi_schedule(&eth->q_tx_irq[i].napi);
> + }
> + }
> +
> + return IRQ_HANDLED;
> +}
> +
> +static int airoha_qdma_init(struct airoha_eth *eth)
> +{
> + struct device *dev = eth->net_dev->dev.parent;
> + int err;
> +
> + err = devm_request_irq(dev, eth->irq, airoha_irq_handler,
> + IRQF_SHARED, KBUILD_MODNAME, eth);
> + if (err)
> + return err;
> +
> + err = airoha_qdma_init_rx(eth);
> + if (err)
> + return err;
> +
> + err = airoha_qdma_init_tx(eth);
> + if (err)
> + return err;
> +
> + err = airoha_qdma_init_hfwd_queues(eth);
> + if (err)
> + return err;
> +
> + err = airoha_qdma_hw_init(eth);
> + if (err)
> + return err;
> +
> + set_bit(DEV_STATE_INITIALIZED, &eth->state);
> +
> + return 0;
> +}
> +
> +static int airoha_hw_init(struct airoha_eth *eth)
> +{
> + int err;
> +
> + /* disable xsi */
> + reset_control_bulk_assert(ARRAY_SIZE(eth->xsi_rsts), eth->xsi_rsts);
> +
> + reset_control_bulk_assert(ARRAY_SIZE(eth->rsts), eth->rsts);
> + msleep(20);
> + reset_control_bulk_deassert(ARRAY_SIZE(eth->rsts), eth->rsts);
> + msleep(20);
> +
> + err = airoha_fe_init(eth);
> + if (err)
> + return err;
> +
> + return airoha_qdma_init(eth);
> +}
> +
> +static int airoha_dev_open(struct net_device *dev)
> +{
> + struct airoha_eth *eth = netdev_priv(dev);
> + int err;
> +
> + if (netdev_uses_dsa(dev))
> + airoha_fe_set(eth, REG_GDM1_INGRESS_CFG, GDM1_STAG_EN_MASK);
> + else
> + airoha_fe_clear(eth, REG_GDM1_INGRESS_CFG, GDM1_STAG_EN_MASK);
> +
> + netif_tx_start_all_queues(dev);
> + err = airoha_set_gdma_ports(eth, true);
> + if (err)
> + return err;
> +
> + airoha_qdma_set(eth, REG_QDMA_GLOBAL_CFG, GLOBAL_CFG_TX_DMA_EN);
> + airoha_qdma_set(eth, REG_QDMA_GLOBAL_CFG, GLOBAL_CFG_RX_DMA_EN);
> +
> + return 0;
> +}
> +
> +static int airoha_dev_stop(struct net_device *dev)
> +{
> + struct airoha_eth *eth = netdev_priv(dev);
> + int err;
> +
> + netif_tx_disable(dev);
> + err = airoha_set_gdma_ports(eth, false);
> + if (err)
> + return err;
> +
> + airoha_qdma_clear(eth, REG_QDMA_GLOBAL_CFG, GLOBAL_CFG_TX_DMA_EN);
> + airoha_qdma_clear(eth, REG_QDMA_GLOBAL_CFG, GLOBAL_CFG_RX_DMA_EN);
> +
> + return 0;
> +}
> +
> +static int airoha_dev_set_macaddr(struct net_device *dev, void *p)
> +{
> + struct airoha_eth *eth = netdev_priv(dev);
> + int err;
> +
> + err = eth_mac_addr(dev, p);
> + if (err)
> + return err;
> +
> + airoha_set_macaddr(eth, dev->dev_addr);
> +
> + return 0;
> +}
> +
> +static int airoha_dev_init(struct net_device *dev)
> +{
> + struct airoha_eth *eth = netdev_priv(dev);
> +
> + airoha_set_macaddr(eth, dev->dev_addr);
> +
> + return 0;
> +}
> +
> +static netdev_tx_t airoha_dev_xmit(struct sk_buff *skb,
> + struct net_device *dev)
> +{
> + struct skb_shared_info *sinfo = skb_shinfo(skb);
> + u32 nr_frags = 1 + sinfo->nr_frags, msg0 = 0, msg1;
> + struct airoha_eth *eth = netdev_priv(dev);
> + int i, qid = skb_get_queue_mapping(skb);
> + u32 len = skb_headlen(skb);
> + struct airoha_queue *q;
> + void *data = skb->data;
> + u16 index;
> +
> + if (skb->ip_summed == CHECKSUM_PARTIAL)
> + msg0 |= FIELD_PREP(QDMA_ETH_TXMSG_TCO_MASK, 1) |
> + FIELD_PREP(QDMA_ETH_TXMSG_UCO_MASK, 1) |
> + FIELD_PREP(QDMA_ETH_TXMSG_ICO_MASK, 1);
> +
> + /* TSO: fill MSS info in tcp checksum field */
> + if (skb_is_gso(skb)) {
> + if (skb_cow_head(skb, 0))
> + goto error;
> +
> + if (sinfo->gso_type & (SKB_GSO_TCPV4 | SKB_GSO_TCPV6)) {
> + tcp_hdr(skb)->check = cpu_to_be16(sinfo->gso_size);
> + msg0 |= FIELD_PREP(QDMA_ETH_TXMSG_TSO_MASK, 1);
> + }
> + }
> +
> + msg1 = FIELD_PREP(QDMA_ETH_TXMSG_FPORT_MASK, DPORT_GDM1) |
> + FIELD_PREP(QDMA_ETH_TXMSG_METER_MASK, 0x7f);
> +
> + if (WARN_ON_ONCE(qid >= ARRAY_SIZE(eth->q_tx)))
> + qid = 0;
> +
> + q = &eth->q_tx[qid];
> + spin_lock_bh(&q->lock);
> +
> + if (q->queued + nr_frags > q->ndesc) {
> + /* not enough space in the queue */
> + spin_unlock_bh(&q->lock);
> + return NETDEV_TX_BUSY;
> + }
> +
> + index = q->head;
> + for (i = 0; i < nr_frags; i++) {
> + struct airoha_qdma_desc *desc = &q->desc[index];
> + struct airoha_queue_entry *e = &q->entry[index];
> + skb_frag_t *frag = &sinfo->frags[i];
> + dma_addr_t addr;
> + u32 val;
> +
> + addr = dma_map_single(dev->dev.parent, data, len,
> + DMA_TO_DEVICE);
> + if (unlikely(dma_mapping_error(dev->dev.parent, addr)))
> + goto error_unmap;
> +
> + index = (index + 1) % q->ndesc;
> +
> + val = FIELD_PREP(QDMA_DESC_LEN_MASK, len);
> + if (i < nr_frags - 1)
> + val |= FIELD_PREP(QDMA_DESC_MORE_MASK, 1);
> + WRITE_ONCE(desc->ctrl, cpu_to_le32(val));
> + WRITE_ONCE(desc->addr, cpu_to_le32(addr));
> + val = FIELD_PREP(QDMA_DESC_NEXT_ID_MASK, index);
> + WRITE_ONCE(desc->data, cpu_to_le32(val));
> + WRITE_ONCE(desc->msg0, cpu_to_le32(msg0));
> + WRITE_ONCE(desc->msg1, cpu_to_le32(msg1));
> + WRITE_ONCE(desc->msg2, cpu_to_le32(0xffff));
> +
> + e->skb = i ? NULL : skb;
> + e->dma_addr = addr;
> + e->dma_len = len;
> +
> + wmb();
> + airoha_qdma_rmw(eth, REG_TX_CPU_IDX(qid), TX_RING_CPU_IDX_MASK,
> + FIELD_PREP(TX_RING_CPU_IDX_MASK, index));
> +
> + data = skb_frag_address(frag);
> + len = skb_frag_size(frag);
> + }
> +
> + q->head = index;
> + q->queued += i;
> +
> + if (q->queued + q->free_thr >= q->ndesc)
> + netif_stop_subqueue(dev, qid);
> +
> + spin_unlock_bh(&q->lock);
> +
> + return NETDEV_TX_OK;
> +
> +error_unmap:
> + for (; i >= 0; i++)
> + dma_unmap_single(dev->dev.parent, q->entry[i].dma_addr,
> + q->entry[i].dma_len, DMA_TO_DEVICE);
> +
> + spin_unlock_bh(&q->lock);
> +error:
> + dev_kfree_skb_any(skb);
> + dev->stats.tx_dropped++;
> +
> + return NETDEV_TX_OK;
> +}
> +
> +static int airoha_dev_change_mtu(struct net_device *dev, int new_mtu)
> +{
> + dev->mtu = new_mtu;
> +
> + return 0;
> +}
> +
> +static const struct net_device_ops airoha_netdev_ops = {
> + .ndo_init = airoha_dev_init,
> + .ndo_open = airoha_dev_open,
> + .ndo_stop = airoha_dev_stop,
> + .ndo_start_xmit = airoha_dev_xmit,
> + .ndo_change_mtu = airoha_dev_change_mtu,
> + .ndo_set_mac_address = airoha_dev_set_macaddr,
> +};
> +
> +static int airoha_rx_queues_show(struct seq_file *s, void *data)
> +{
> + struct airoha_eth *eth = s->private;
> + int i;
> +
> + seq_puts(s, " queue | hw-queued | head | tail |\n");
> + airoha_qdma_for_each_q_rx(eth, i) {
> + struct airoha_queue *q = &eth->q_rx[i];
> +
> + seq_printf(s, " %9d | %9d | %9d | %9d |\n",
> + i, q->queued, q->head, q->tail);
> + }
> +
> + return 0;
> +}
> +DEFINE_SHOW_ATTRIBUTE(airoha_rx_queues);
> +
> +static int airoha_xmit_queues_show(struct seq_file *s, void *data)
> +{
> + struct airoha_eth *eth = s->private;
> + int i;
> +
> + seq_puts(s, " queue | hw-queued | head | tail |\n");
> + for (i = 0; i < ARRAY_SIZE(eth->q_tx); i++) {
> + struct airoha_queue *q = &eth->q_tx[i];
> +
> + seq_printf(s, " %9d | %9d | %9d | %9d |\n",
> + i, q->queued, q->head, q->tail);
> + }
> +
> + return 0;
> +}
> +DEFINE_SHOW_ATTRIBUTE(airoha_xmit_queues);
> +
> +static int airoha_register_debugfs(struct airoha_eth *eth)
> +{
> + eth->debugfs_dir = debugfs_create_dir(KBUILD_MODNAME, NULL);
> + if (IS_ERR(eth->debugfs_dir))
> + return PTR_ERR(eth->debugfs_dir);
> +
> + debugfs_create_file("rx-queues", 0400, eth->debugfs_dir, eth,
> + &airoha_rx_queues_fops);
> + debugfs_create_file("xmit-queues", 0400, eth->debugfs_dir, eth,
> + &airoha_xmit_queues_fops);
> +
> + return 0;
> +}
> +
> +static int airoha_probe(struct platform_device *pdev)
> +{
> + struct device_node *np = pdev->dev.of_node;
> + struct net_device *dev;
> + struct airoha_eth *eth;
> + int err;
> +
> + dev = devm_alloc_etherdev_mqs(&pdev->dev, sizeof(*eth),
> + AIROHA_NUM_TX_RING, AIROHA_NUM_RX_RING);
> + if (!dev) {
> + dev_err(&pdev->dev, "alloc_etherdev failed\n");
> + return -ENOMEM;
> + }
> +
> + eth = netdev_priv(dev);
> + eth->net_dev = dev;
> +
> + err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(32));
> + if (err) {
> + dev_err(&pdev->dev, "failed configuring DMA mask\n");
> + return err;
> + }
> +
> + eth->fe_regs = devm_platform_ioremap_resource_byname(pdev, "fe");
> + if (IS_ERR(eth->fe_regs))
> + return dev_err_probe(&pdev->dev, PTR_ERR(eth->fe_regs),
> + "failed to iomap fe regs\n");
> +
> + eth->qdma_regs = devm_platform_ioremap_resource_byname(pdev, "qdma0");
> + if (IS_ERR(eth->qdma_regs))
> + return dev_err_probe(&pdev->dev, PTR_ERR(eth->qdma_regs),
> + "failed to iomap qdma regs\n");
> +
> + eth->rsts[0].id = "fe";
> + eth->rsts[1].id = "pdma";
> + eth->rsts[2].id = "qdma";
> + err = devm_reset_control_bulk_get_exclusive(&pdev->dev,
> + ARRAY_SIZE(eth->rsts),
> + eth->rsts);
> + if (err) {
> + dev_err(&pdev->dev, "failed to get bulk reset lines\n");
> + return err;
> + }
> +
> + eth->xsi_rsts[0].id = "xsi-mac";
> + eth->xsi_rsts[1].id = "hsi0-mac";
> + eth->xsi_rsts[2].id = "hsi1-mac";
> + eth->xsi_rsts[3].id = "hsi-mac";
> + err = devm_reset_control_bulk_get_exclusive(&pdev->dev,
> + ARRAY_SIZE(eth->xsi_rsts),
> + eth->xsi_rsts);
> + if (err) {
> + dev_err(&pdev->dev, "failed to get bulk xsi reset lines\n");
> + return err;
> + }
> +
> + spin_lock_init(&eth->irq_lock);
> + eth->irq = platform_get_irq(pdev, 0);
> + if (eth->irq < 0) {
> + dev_err(&pdev->dev, "failed reading irq line\n");
> + return eth->irq;
> + }
> +
> + dev->netdev_ops = &airoha_netdev_ops;
> + dev->max_mtu = AIROHA_MAX_MTU;
> + dev->watchdog_timeo = 5 * HZ;
> + dev->hw_features = NETIF_F_IP_CSUM | NETIF_F_RXCSUM |
> + NETIF_F_TSO6 | NETIF_F_IPV6_CSUM |
> + NETIF_F_SG | NETIF_F_TSO;
> + dev->features |= dev->hw_features;
> + dev->dev.of_node = np;
> + dev->irq = eth->irq;
> + SET_NETDEV_DEV(dev, &pdev->dev);
> +
> + err = of_get_ethdev_address(np, dev);
> + if (err) {
> + if (err == -EPROBE_DEFER)
> + return err;
> +
> + eth_hw_addr_random(dev);
> + dev_err(&pdev->dev, "generated random MAC address %pM\n",
> + dev->dev_addr);
> + }
> +
> + err = airoha_hw_init(eth);
> + if (err)
> + return err;
> +
> + airoha_qdma_start_napi(eth);
> + err = register_netdev(dev);
> + if (err)
> + return err;
> +
> + err = airoha_register_debugfs(eth);
> + if (err)
> + return err;
> +
> + platform_set_drvdata(pdev, eth);
> +
> + return 0;
> +}
> +
> +static void airoha_remove(struct platform_device *pdev)
> +{
> + struct airoha_eth *eth = platform_get_drvdata(pdev);
> + int i;
> +
> + debugfs_remove(eth->debugfs_dir);
> +
> + airoha_qdma_for_each_q_rx(eth, i) {
> + struct airoha_queue *q = &eth->q_rx[i];
> +
> + netif_napi_del(&q->napi);
> + airoha_qdma_clenaup_rx_queue(q);
> + page_pool_destroy(q->page_pool);
> + }
> +
> + for (i = 0; i < ARRAY_SIZE(eth->q_tx_irq); i++)
> + netif_napi_del(&eth->q_tx_irq[i].napi);
> + for (i = 0; i < ARRAY_SIZE(eth->q_tx); i++)
> + airoha_qdma_clenaup_tx_queue(&eth->q_tx[i]);
> +}
> +
> +const struct of_device_id of_airoha_match[] = {
> + { .compatible = "airoha,en7581-eth" },
> + { /* sentinel */ }
> +};
> +
> +static struct platform_driver airoha_driver = {
> + .probe = airoha_probe,
> + .remove_new = airoha_remove,
> + .driver = {
> + .name = KBUILD_MODNAME,
> + .of_match_table = of_airoha_match,
> + },
> +};
> +module_platform_driver(airoha_driver);
> +
> +MODULE_LICENSE("GPL");
> +MODULE_AUTHOR("Lorenzo Bianconi <lorenzo@...nel.org>");
> +MODULE_DESCRIPTION("Ethernet driver for Airoha SoC");
> diff --git a/drivers/net/ethernet/mediatek/airoha_eth.h b/drivers/net/ethernet/mediatek/airoha_eth.h
> new file mode 100644
> index 000000000000..e88fecfac44f
> --- /dev/null
> +++ b/drivers/net/ethernet/mediatek/airoha_eth.h
> @@ -0,0 +1,719 @@
> +// SPDX-License-Identifier: GPL-2.0
> +/*
> + * Copyright (C) 2024 Lorenzo Bianconi <lorenzo@...nel.org>
> + */
> +
> +#define AIROHA_MAX_NUM_RSTS 3
> +#define AIROHA_MAX_NUM_XSI_RSTS 4
> +#define AIROHA_MAX_MTU 2000
> +#define AIROHA_MAX_PACKET_SIZE 2048
> +#define AIROHA_NUM_TX_RING 32
> +#define AIROHA_NUM_RX_RING 32
> +#define AIROHA_FE_MC_MAX_VLAN_TABLE 64
> +#define AIROHA_FE_MC_MAX_VLAN_PORT 16
> +#define AIROHA_NUM_TX_IRQ 2
> +#define HW_DSCP_NUM 2048
> +#define IRQ_QUEUE_LEN(_n) ((_n) ? 1024 : 2048)
> +#define TX_DSCP_NUM 1024
> +#define RX_DSCP_NUM(_n) \
> + ((_n) == 2 ? 128 : \
> + (_n) == 11 ? 128 : \
> + (_n) == 15 ? 128 : \
> + (_n) == 0 ? 1024 : 16)
> +
> +/* FE */
> +#define PSE_BASE 0x0100
> +#define CSR_IFC_BASE 0x0200
> +#define CDM1_BASE 0x0400
> +#define GDM1_BASE 0x0500
> +#define PPE1_BASE 0x0c00
> +
> +#define CDM2_BASE 0x1400
> +#define GDM2_BASE 0x1500
> +
> +#define GDM3_BASE 0x1100
> +#define GDM4_BASE 0x2400
> +
> +#define REG_FE_DMA_GLO_CFG 0x0000
> +#define FE_DMA_GLO_L2_SPACE_MASK GENMASK(7, 4)
> +#define FE_DMA_GLO_PG_SZ_MASK BIT(3)
> +
> +#define REG_FE_RST_GLO_CFG 0x0004
> +#define FE_RST_GDM4_MBI_ARB_MASK BIT(3)
> +#define FE_RST_GDM3_MBI_ARB_MASK BIT(2)
> +#define FE_RST_CORE_MASK BIT(0)
> +
> +#define REG_FE_LAN_MAC_H 0x0040
> +#define REG_FE_LAN_MAC_LMIN 0x0044
> +#define REG_FE_LAN_MAC_LMAX 0x0048
> +
> +#define REG_FE_CDM1_OQ_MAP0 0x0050
> +#define REG_FE_CDM1_OQ_MAP1 0x0054
> +#define REG_FE_CDM1_OQ_MAP2 0x0058
> +#define REG_FE_CDM1_OQ_MAP3 0x005c
> +
> +#define REG_FE_PCE_CFG 0x0070
> +#define PCE_DPI_EN BIT(2)
> +#define PCE_KA_EN BIT(1)
> +#define PCE_MC_EN BIT(0)
> +
> +#define PSE_PORT0_QUEUE 6
> +#define PSE_PORT1_QUEUE 6
> +#define PSE_PORT2_QUEUE 32
> +#define PSE_PORT3_QUEUE 6
> +#define PSE_PORT4_QUEUE 4
> +#define PSE_PORT5_QUEUE 6
> +#define PSE_PORT6_QUEUE 8
> +#define PSE_PORT7_QUEUE 10
> +#define PSE_PORT8_QUEUE 4
> +#define PSE_PORT9_QUEUE 2
> +#define PSE_PORT10_QUEUE 2
> +#define PSE_PORT11_QUEUE 0
> +#define PSE_PORT12_QUEUE 0
> +#define PSE_PORT13_QUEUE 0
> +#define PSE_PORT14_QUEUE 0
> +#define PSE_PORT15_QUEUE 0
> +
> +#define REG_FE_PSE_QUEUE_CFG_WR 0x0080
> +#define PSE_CFG_PORT_ID_MASK GENMASK(27, 24)
> +#define PSE_CFG_QUEUE_ID_MASK GENMASK(20, 16)
> +#define PSE_CFG_WR_EN_MASK BIT(8)
> +#define PSE_CFG_OQRSV_SEL_MASK BIT(0)
> +
> +#define REG_FE_PSE_QUEUE_CFG_VAL 0x0084
> +#define PSE_CFG_OQ_RSV_MASK GENMASK(13, 0)
> +
> +#define PSE_FQ_CFG 0x008c
> +#define PSE_FQ_LIMIT_MASK GENMASK(14, 0)
> +
> +#define REG_FE_PSE_BUF_SET 0x0090
> +#define PSE_SHARE_USED_LTHD_MASK GENMASK(31, 16)
> +#define PSE_ALLRSV_MASK GENMASK(14, 0)
> +
> +#define REG_PSE_SHARE_USED_THD 0x0094
> +#define PSE_SHARE_USED_MTHD_MASK GENMASK(31, 16)
> +#define PSE_SHARE_USED_HTHD_MASK GENMASK(15, 0)
> +
> +#define REG_GDM_MISC_CFG 0x0148
> +#define GDM2_RDM_ACK_WAIT_PREF_MASK BIT(9)
> +#define GDM2_CHN_VLD_MODE_MASK BIT(5)
> +
> +#define REG_FE_CSR_IFC_CFG CSR_IFC_BASE
> +#define FE_IFC_EN_MASK BIT(0)
> +
> +#define REG_FE_VIP_PORT_EN 0x01f0
> +#define REG_FE_IFC_PORT_EN 0x01f4
> +
> +#define REG_PSE_IQ_REV1 (PSE_BASE + 0x08)
> +#define PSE_IQ_RES1_P2_MASK GENMASK(23, 16)
> +
> +#define REG_PSE_IQ_REV2 (PSE_BASE + 0x0c)
> +#define PSE_IQ_RES2_P5_MASK GENMASK(15, 8)
> +#define PSE_IQ_RES2_P4_MASK GENMASK(7, 0)
> +
> +#define REG_FE_VIP_EN(_n) (0x0300 + ((_n) << 3))
> +#define PATN_FCPU_EN_MASK BIT(7)
> +#define PATN_SWP_EN_MASK BIT(6)
> +#define PATN_DP_EN_MASK BIT(5)
> +#define PATN_SP_EN_MASK BIT(4)
> +#define PATN_TYPE_MASK GENMASK(3, 1)
> +#define PATN_EN_MASK BIT(0)
> +
> +#define REG_FE_VIP_PATN(_n) (0x0304 + ((_n) << 3))
> +#define PATN_DP_MASK GENMASK(31, 16)
> +#define PATN_SP_MASK GENMASK(15, 0)
> +
> +#define REG_CDM1_VLAN_CTRL CDM1_BASE
> +#define CDM1_VLAN_MASK GENMASK(31, 16)
> +
> +#define REG_CDM1_FWD_CFG (CDM1_BASE + 0x08)
> +#define CDM1_VIP_QSEL_MASK GENMASK(24, 20)
> +
> +#define REG_CDM1_CRSN_QSEL(_n) (CDM1_BASE + 0x10 + ((_n) << 2))
> +#define CDM1_CRSN_QSEL_REASON_MASK(_n) \
> + GENMASK(4 + (((_n) % 4) << 3), (((_n) % 4 ) << 3))
> +
> +#define REG_CDM2_FWD_CFG (CDM2_BASE + 0x08)
> +#define CDM2_OAM_QSEL_MASK GENMASK(31, 27)
> +#define CDM2_VIP_QSEL_MASK GENMASK(24, 20)
> +
> +#define REG_CDM2_CRSN_QSEL(_n) (CDM2_BASE + 0x10 + ((_n) << 2))
> +#define CDM2_CRSN_QSEL_REASON_MASK(_n) \
> + GENMASK(4 + (((_n) % 4) << 3), (((_n) % 4 ) << 3))
> +
> +#define REG_GDM1_FWD_CFG GDM1_BASE
> +#define GDM1_DROP_CRC_ERR BIT(23)
> +#define GDM1_IP4_CKSUM BIT(22)
> +#define GDM1_TCP_CKSUM BIT(21)
> +#define GDM1_UDP_CKSUM BIT(20)
> +#define GDM1_UCFQ_MASK GENMASK(15, 12)
> +#define GDM1_BCFQ_MASK GENMASK(11, 8)
> +#define GDM1_MCFQ_MASK GENMASK(7, 4)
> +#define GDM1_OCFQ_MASK GENMASK(3, 0)
> +
> +#define REG_GDM1_INGRESS_CFG (GDM1_BASE + 0x10)
> +#define GDM1_INGRESS_FC_EN_MASK BIT(1)
> +#define GDM1_STAG_EN_MASK BIT(0)
> +
> +#define REG_GDM1_LEN_CFG (GDM1_BASE + 0x14)
> +#define GDM1_SHORT_LEN_MASK GENMASK(13, 0)
> +#define GDM1_LONG_LEN_MASK GENMASK(29, 16)
> +
> +#define REG_FE_CPORT_CFG (GDM1_BASE + 0x40)
> +#define FE_CPORT_PAD BIT(26)
> +#define FE_CPORT_PORT_XFC_MASK BIT(25)
> +#define FE_CPORT_QUEUE_XFC_MASK BIT(24)
> +
> +#define REG_PPE1_TB_HASH_CFG (PPE1_BASE + 0x250)
> +#define PPE1_SRAM_TABLE_EN_MASK BIT(0)
> +#define PPE1_SRAM_HASH1_EN_MASK BIT(8)
> +#define PPE1_DRAM_TABLE_EN_MASK BIT(16)
> +#define PPE1_DRAM_HASH1_EN_MASK BIT(24)
> +
> +#define REG_GDM2_CHN_RLS (GDM2_BASE + 0x20)
> +#define MBI_RX_AGE_SEL_MASK GENMASK(18, 17)
> +#define MBI_TX_AGE_SEL_MASK GENMASK(18, 17)
> +
> +#define REG_GDM3_FWD_CFG GDM3_BASE
> +#define GDM3_PAD_EN_MASK BIT(28)
> +
> +#define REG_GDM4_FWD_CFG (GDM4_BASE + 0x100)
> +#define GDM4_PAD_EN_MASK BIT(28)
> +#define GDM4_SPORT_OFFSET0_MASK GENMASK(11, 8)
> +
> +#define REG_GDM4_SRC_PORT_SET (GDM4_BASE + 0x33c)
> +#define GDM4_SPORT_OFF2_MASK GENMASK(19, 16)
> +#define GDM4_SPORT_OFF1_MASK GENMASK(15, 12)
> +#define GDM4_SPORT_OFF0_MASK GENMASK(11, 8)
> +
> +#define REG_IP_FRAG_FP 0x2010
> +#define IP_ASSEMBLE_PORT_MASK GENMASK(24, 21)
> +#define IP_ASSEMBLE_NBQ_MASK GENMASK(20, 16)
> +#define IP_FRAGMENT_PORT_MASK GENMASK(8, 5)
> +#define IP_FRAGMENT_NBQ_MASK GENMASK(4, 0)
> +
> +#define REG_MC_VLAN_EN 0x2100
> +#define MC_VLAN_EN_MASK BIT(0)
> +
> +#define REG_MC_VLAN_CFG 0x2104
> +#define MC_VLAN_CFG_CMD_DONE_MASK BIT(31)
> +#define MC_VLAN_CFG_TABLE_ID_MASK GENMASK(21, 16)
> +#define MC_VLAN_CFG_PORT_ID_MASK GENMASK(11, 8)
> +#define MC_VLAN_CFG_TABLE_SEL_MASK BIT(4)
> +#define MC_VLAN_CFG_RW_MASK BIT(0)
> +
> +#define REG_MC_VLAN_DATA 0x2108
> +
> +#define REG_CDM5_RX_OQ1_DROP_CNT 0x29d4
> +
> +/* QDMA */
> +#define REG_QDMA_GLOBAL_CFG 0x0004
> +#define GLOBAL_CFG_RX_2B_OFFSET BIT(31)
> +#define GLOBAL_CFG_DMA_PREFERENCE_MASK GENMASK(30, 29)
> +#define GLOBAL_CFG_CPU_TXR_ROUND_ROBIN BIT(28)
> +#define GLOBAL_CFG_DSCP_BYTE_SWAP BIT(27)
> +#define GLOBAL_CFG_PAYLOAD_BYTE_SWAP BIT(26)
> +#define GLOBAL_CFG_MULTICAST_MODIFY_FP BIT(25)
> +#define GLOBAL_CFG_OAM_MODIFY_MASK BIT(24)
> +#define GLOBAL_CFG_RESET_MASK BIT(23)
> +#define GLOBAL_CFG_RESET_DONE_MASK BIT(22)
> +#define GLOBAL_CFG_MULTICAST_EN_MASK BIT(21)
> +#define GLOBAL_CFG_IRQ1_EN BIT(20)
> +#define GLOBAL_CFG_IRQ0_EN BIT(19)
> +#define GLOBAL_CFG_LOOPCNT_EN BIT(18)
> +#define GLOBAL_CFG_RD_BYPASS_WR BIT(17)
> +#define GLOBAL_CFG_QDMA_LOOPBACK BIT(16)
> +#define GLOBAL_CFG_LPBK_RXQ_SEL_MASK GENMASK(13, 8)
> +#define GLOBAL_CFG_CHECK_DONE BIT(7)
> +#define GLOBAL_CFG_TX_WB_DONE BIT(6)
> +#define GLOBAL_CFG_MAX_ISSUE_NUM_MASK GENMASK(5, 4)
> +#define GLOBAL_CFG_RX_DMA_BUSY BIT(3)
> +#define GLOBAL_CFG_RX_DMA_EN BIT(2)
> +#define GLOBAL_CFG_TX_DMA_BUSY BIT(1)
> +#define GLOBAL_CFG_TX_DMA_EN BIT(0)
> +
> +#define REG_FWD_DSCP_BASE 0x0010
> +#define REG_FWD_BUF_BASE 0x0014
> +
> +#define REG_HW_FWD_DSCP_CFG 0x0018
> +#define HW_FWD_DSCP_PAYLOAD_SIZE_MASK GENMASK(29, 28)
> +#define HW_FWD_DSCP_SCATTER_LEN_MASK GENMASK(17, 16)
> +#define HW_FWD_DSCP_MIN_SCATTER_LEN_MASK GENMASK(15, 0)
> +
> +#define REG_INT_STATUS(_n) \
> + (((_n) == 4) ? 0x0730 : \
> + ((_n) == 3) ? 0x0724 : \
> + ((_n) == 2) ? 0x0720 : \
> + ((_n) == 1) ? 0x0024 : 0x0020)
> +
> +#define REG_INT_ENABLE(_n) \
> + (((_n) == 4) ? 0x0750 : \
> + ((_n) == 3) ? 0x0744 : \
> + ((_n) == 2) ? 0x0740 : \
> + ((_n) == 1) ? 0x002c : 0x0028)
> +
> +/* QDMA_CSR_INT_ENABLE1 */
> +#define RX15_COHERENT_INT_MASK BIT(31)
> +#define RX14_COHERENT_INT_MASK BIT(30)
> +#define RX13_COHERENT_INT_MASK BIT(29)
> +#define RX12_COHERENT_INT_MASK BIT(28)
> +#define RX11_COHERENT_INT_MASK BIT(27)
> +#define RX10_COHERENT_INT_MASK BIT(26)
> +#define RX9_COHERENT_INT_MASK BIT(25)
> +#define RX8_COHERENT_INT_MASK BIT(24)
> +#define RX7_COHERENT_INT_MASK BIT(23)
> +#define RX6_COHERENT_INT_MASK BIT(22)
> +#define RX5_COHERENT_INT_MASK BIT(21)
> +#define RX4_COHERENT_INT_MASK BIT(20)
> +#define RX3_COHERENT_INT_MASK BIT(19)
> +#define RX2_COHERENT_INT_MASK BIT(18)
> +#define RX1_COHERENT_INT_MASK BIT(17)
> +#define RX0_COHERENT_INT_MASK BIT(16)
> +#define TX7_COHERENT_INT_MASK BIT(15)
> +#define TX6_COHERENT_INT_MASK BIT(14)
> +#define TX5_COHERENT_INT_MASK BIT(13)
> +#define TX4_COHERENT_INT_MASK BIT(12)
> +#define TX3_COHERENT_INT_MASK BIT(11)
> +#define TX2_COHERENT_INT_MASK BIT(10)
> +#define TX1_COHERENT_INT_MASK BIT(9)
> +#define TX0_COHERENT_INT_MASK BIT(8)
> +#define CNT_OVER_FLOW_INT_MASK BIT(7)
> +#define IRQ1_FULL_INT_MASK BIT(5)
> +#define IRQ1_INT_MASK BIT(4)
> +#define HWFWD_DSCP_LOW_INT_MASK BIT(3)
> +#define HWFWD_DSCP_EMPTY_INT_MASK BIT(2)
> +#define IRQ0_FULL_INT_MASK BIT(1)
> +#define IRQ0_INT_MASK BIT(0)
> +
> +#define TX_DONE_INT_MASK(_n) \
> + ((_n) ? IRQ1_INT_MASK | IRQ1_FULL_INT_MASK \
> + : IRQ0_INT_MASK | IRQ0_FULL_INT_MASK)
> +
> +#define INT_TX_MASK \
> + (IRQ1_INT_MASK | IRQ1_FULL_INT_MASK | \
> + IRQ0_INT_MASK | IRQ0_FULL_INT_MASK)
> +
> +#define INT_IDX0_MASK \
> + (TX0_COHERENT_INT_MASK | TX1_COHERENT_INT_MASK | \
> + TX2_COHERENT_INT_MASK | TX3_COHERENT_INT_MASK | \
> + TX4_COHERENT_INT_MASK | TX5_COHERENT_INT_MASK | \
> + TX6_COHERENT_INT_MASK | TX7_COHERENT_INT_MASK | \
> + RX0_COHERENT_INT_MASK | RX1_COHERENT_INT_MASK | \
> + RX2_COHERENT_INT_MASK | RX3_COHERENT_INT_MASK | \
> + RX4_COHERENT_INT_MASK | RX7_COHERENT_INT_MASK | \
> + RX8_COHERENT_INT_MASK | RX9_COHERENT_INT_MASK | \
> + RX15_COHERENT_INT_MASK | INT_TX_MASK)
> +
> +/* QDMA_CSR_INT_ENABLE2 */
> +#define RX15_NO_CPU_DSCP_INT_MASK BIT(31)
> +#define RX14_NO_CPU_DSCP_INT_MASK BIT(30)
> +#define RX13_NO_CPU_DSCP_INT_MASK BIT(29)
> +#define RX12_NO_CPU_DSCP_INT_MASK BIT(28)
> +#define RX11_NO_CPU_DSCP_INT_MASK BIT(27)
> +#define RX10_NO_CPU_DSCP_INT_MASK BIT(26)
> +#define RX9_NO_CPU_DSCP_INT_MASK BIT(25)
> +#define RX8_NO_CPU_DSCP_INT_MASK BIT(24)
> +#define RX7_NO_CPU_DSCP_INT_MASK BIT(23)
> +#define RX6_NO_CPU_DSCP_INT_MASK BIT(22)
> +#define RX5_NO_CPU_DSCP_INT_MASK BIT(21)
> +#define RX4_NO_CPU_DSCP_INT_MASK BIT(20)
> +#define RX3_NO_CPU_DSCP_INT_MASK BIT(19)
> +#define RX2_NO_CPU_DSCP_INT_MASK BIT(18)
> +#define RX1_NO_CPU_DSCP_INT_MASK BIT(17)
> +#define RX0_NO_CPU_DSCP_INT_MASK BIT(16)
> +#define RX15_DONE_INT_MASK BIT(15)
> +#define RX14_DONE_INT_MASK BIT(14)
> +#define RX13_DONE_INT_MASK BIT(13)
> +#define RX12_DONE_INT_MASK BIT(12)
> +#define RX11_DONE_INT_MASK BIT(11)
> +#define RX10_DONE_INT_MASK BIT(10)
> +#define RX9_DONE_INT_MASK BIT(9)
> +#define RX8_DONE_INT_MASK BIT(8)
> +#define RX7_DONE_INT_MASK BIT(7)
> +#define RX6_DONE_INT_MASK BIT(6)
> +#define RX5_DONE_INT_MASK BIT(5)
> +#define RX4_DONE_INT_MASK BIT(4)
> +#define RX3_DONE_INT_MASK BIT(3)
> +#define RX2_DONE_INT_MASK BIT(2)
> +#define RX1_DONE_INT_MASK BIT(1)
> +#define RX0_DONE_INT_MASK BIT(0)
> +
> +#define RX_DONE_INT_MASK \
> + (RX0_DONE_INT_MASK | RX1_DONE_INT_MASK | \
> + RX2_DONE_INT_MASK | RX3_DONE_INT_MASK | \
> + RX4_DONE_INT_MASK | RX7_DONE_INT_MASK | \
> + RX8_DONE_INT_MASK | RX9_DONE_INT_MASK | \
> + RX15_DONE_INT_MASK)
> +#define INT_IDX1_MASK \
> + (RX_DONE_INT_MASK | \
> + RX0_NO_CPU_DSCP_INT_MASK | RX1_NO_CPU_DSCP_INT_MASK | \
> + RX2_NO_CPU_DSCP_INT_MASK | RX3_NO_CPU_DSCP_INT_MASK | \
> + RX4_NO_CPU_DSCP_INT_MASK | RX7_NO_CPU_DSCP_INT_MASK | \
> + RX8_NO_CPU_DSCP_INT_MASK | RX9_NO_CPU_DSCP_INT_MASK | \
> + RX15_NO_CPU_DSCP_INT_MASK)
> +
> +/* QDMA_CSR_INT_ENABLE5 */
> +#define TX31_COHERENT_INT_MASK BIT(31)
> +#define TX30_COHERENT_INT_MASK BIT(30)
> +#define TX29_COHERENT_INT_MASK BIT(29)
> +#define TX28_COHERENT_INT_MASK BIT(28)
> +#define TX27_COHERENT_INT_MASK BIT(27)
> +#define TX26_COHERENT_INT_MASK BIT(26)
> +#define TX25_COHERENT_INT_MASK BIT(25)
> +#define TX24_COHERENT_INT_MASK BIT(24)
> +#define TX23_COHERENT_INT_MASK BIT(23)
> +#define TX22_COHERENT_INT_MASK BIT(22)
> +#define TX21_COHERENT_INT_MASK BIT(21)
> +#define TX20_COHERENT_INT_MASK BIT(20)
> +#define TX19_COHERENT_INT_MASK BIT(19)
> +#define TX18_COHERENT_INT_MASK BIT(18)
> +#define TX17_COHERENT_INT_MASK BIT(17)
> +#define TX16_COHERENT_INT_MASK BIT(16)
> +#define TX15_COHERENT_INT_MASK BIT(15)
> +#define TX14_COHERENT_INT_MASK BIT(14)
> +#define TX13_COHERENT_INT_MASK BIT(13)
> +#define TX12_COHERENT_INT_MASK BIT(12)
> +#define TX11_COHERENT_INT_MASK BIT(11)
> +#define TX10_COHERENT_INT_MASK BIT(10)
> +#define TX9_COHERENT_INT_MASK BIT(9)
> +#define TX8_COHERENT_INT_MASK BIT(8)
> +
> +#define INT_IDX4_MASK \
> + (TX8_COHERENT_INT_MASK | TX9_COHERENT_INT_MASK | \
> + TX10_COHERENT_INT_MASK | TX11_COHERENT_INT_MASK | \
> + TX12_COHERENT_INT_MASK | TX13_COHERENT_INT_MASK | \
> + TX14_COHERENT_INT_MASK | TX15_COHERENT_INT_MASK | \
> + TX16_COHERENT_INT_MASK | TX17_COHERENT_INT_MASK | \
> + TX18_COHERENT_INT_MASK | TX19_COHERENT_INT_MASK | \
> + TX20_COHERENT_INT_MASK | TX21_COHERENT_INT_MASK | \
> + TX20_COHERENT_INT_MASK | TX21_COHERENT_INT_MASK | \
> + TX22_COHERENT_INT_MASK | TX23_COHERENT_INT_MASK | \
> + TX24_COHERENT_INT_MASK | TX25_COHERENT_INT_MASK | \
> + TX26_COHERENT_INT_MASK | TX27_COHERENT_INT_MASK | \
> + TX28_COHERENT_INT_MASK | TX29_COHERENT_INT_MASK | \
> + TX30_COHERENT_INT_MASK | TX31_COHERENT_INT_MASK)
> +
> +#define REG_TX_IRQ_BASE(_n) ((_n) ? 0x0048 : 0x0050)
> +
> +#define REG_TX_IRQ_CFG(_n) ((_n) ? 0x004c : 0x0054)
> +#define TX_IRQ_THR_MASK GENMASK(27, 16)
> +#define TX_IRQ_DEPTH_MASK GENMASK(11, 0)
> +
> +#define REG_IRQ_CLEAR_LEN(_n) ((_n) ? 0x0064 : 0x0058)
> +#define IRQ_CLEAR_LEN_MASK GENMASK(7, 0)
> +
> +#define REG_IRQ_STATUS(_n) ((_n) ? 0x0068 : 0x005c)
> +#define IRQ_ENTRY_LEN_MASK GENMASK(27, 16)
> +#define IRQ_HEAD_IDX_MASK GENMASK(11, 0)
> +
> +#define REG_TX_RING_BASE(_n) \
> + (((_n) < 8) ? 0x0100 + ((_n) << 5) : 0x0b00 + (((_n) - 8) << 5))
> +
> +#define REG_TX_RING_BLOCKING(_n) \
> + (((_n) < 8) ? 0x0104 + ((_n) << 5) : 0x0b04 + (((_n) - 8) << 5))
> +
> +#define TX_RING_IRQ_BLOCKING_MAP_MASK BIT(6)
> +#define TX_RING_IRQ_BLOCKING_CFG_MASK BIT(4)
> +#define TX_RING_IRQ_BLOCKING_TX_DROP_EN_MASK BIT(2)
> +#define TX_RING_IRQ_BLOCKING_MAX_TH_TXRING_EN_MASK BIT(1)
> +#define TX_RING_IRQ_BLOCKING_MIN_TH_TXRING_EN_MASK BIT(0)
> +
> +#define REG_TX_CPU_IDX(_n) \
> + (((_n) < 8) ? 0x0108 + ((_n) << 5) : 0x0b08 + (((_n) - 8) << 5))
> +
> +#define TX_RING_CPU_IDX_MASK GENMASK(15, 0)
> +
> +#define REG_TX_DMA_IDX(_n) \
> + (((_n) < 8) ? 0x010c + ((_n) << 5) : 0x0b0c + (((_n) - 8) << 5))
> +
> +#define TX_RING_DMA_IDX_MASK GENMASK(15, 0)
> +
> +#define IRQ_RING_IDX_MASK GENMASK(20, 16)
> +#define IRQ_DESC_IDX_MASK GENMASK(15, 0)
> +
> +#define REG_RX_RING_BASE(_n) \
> + (((_n) < 16) ? 0x0200 + ((_n) << 5) : 0x0e00 + (((_n) - 16) << 5))
> +
> +#define REG_RX_RING_SIZE(_n) \
> + (((_n) < 16) ? 0x0204 + ((_n) << 5) : 0x0e04 + (((_n) - 16) << 5))
> +
> +#define RX_RING_THR_MASK GENMASK(31, 16)
> +#define RX_RING_SIZE_MASK GENMASK(15, 0)
> +
> +#define REG_RX_CPU_IDX(_n) \
> + (((_n) < 16) ? 0x0208 + ((_n) << 5) : 0x0e08 + (((_n) - 16) << 5))
> +
> +#define RX_RING_CPU_IDX_MASK GENMASK(15, 0)
> +
> +#define REG_RX_DMA_IDX(_n) \
> + (((_n) < 16) ? 0x020c + ((_n) << 5) : 0x0e0c + (((_n) - 16) << 5))
> +
> +#define REG_RX_DELAY_INT_IDX(_n) \
> + (((_n) < 16) ? 0x0210 + ((_n) << 5) : 0x0e10 + (((_n) - 16) << 5))
> +
> +#define RX_DELAY_INT_MASK GENMASK(15, 0)
> +
> +#define RX_RING_DMA_IDX_MASK GENMASK(15, 0)
> +
> +#define REG_INGRESS_TRTCM_CFG 0x0070
> +#define INGRESS_TRTCM_EN_MASK BIT(31)
> +#define INGRESS_TRTCM_MODE_MASK BIT(30)
> +#define INGRESS_SLOW_TICK_RATIO_MASK GENMASK(29, 16)
> +#define INGRESS_FAST_TICK_MASK GENMASK(15, 0)
> +
> +#define REG_TXQ_DIS_CFG_BASE(_n) ((_n) ? 0x20a0 : 0x00a0)
> +#define REG_TXQ_DIS_CFG(_n, _m) (REG_TXQ_DIS_CFG_BASE((_n)) + (_m) << 2)
> +
> +#define REG_LMGR_INIT_CFG 0x1000
> +#define LMGR_INIT_START BIT(31)
> +#define LMGR_SRAM_MODE_MASK BIT(30)
> +#define HW_FWD_PKTSIZE_OVERHEAD_MASK GENMASK(27, 20)
> +#define HW_FWD_DESC_NUM_MASK GENMASK(16, 0)
> +
> +#define REG_FWD_DSCP_LOW_THR 0x1004
> +#define FWD_DSCP_LOW_THR_MASK GENMASK(17, 0)
> +
> +#define REG_EGRESS_RATE_METER_CFG 0x100c
> +#define EGRESS_RATE_METER_EN_MASK BIT(29)
> +#define EGRESS_RATE_METER_EQ_RATE_EN_MASK BIT(17)
> +#define EGRESS_RATE_METER_WINDOW_SZ_MASK GENMASK(16, 12)
> +#define EGRESS_RATE_METER_TIMESLICE_MASK GENMASK(10, 0)
> +
> +#define REG_EGRESS_TRTCM_CFG 0x1010
> +#define EGRESS_TRTCM_EN_MASK BIT(31)
> +#define EGRESS_TRTCM_MODE_MASK BIT(30)
> +#define EGRESS_SLOW_TICK_RATIO_MASK GENMASK(29, 16)
> +#define EGRESS_FAST_TICK_MASK GENMASK(15, 0)
> +
> +#define REG_TXWRR_MODE_CFG 0x1020
> +#define TWRR_WEIGHT_SCALE_MASK BIT(31)
> +#define TWRR_WEIGHT_BASE_MASK BIT(3)
> +
> +#define REG_PSE_BUF_USAGE_CFG 0x1028
> +#define PSE_BUF_ESTIMATE_EN_MASK BIT(29)
> +
> +#define REG_GLB_TRTCM_CFG 0x1080
> +#define GLB_TRTCM_EN_MASK BIT(31)
> +#define GLB_TRTCM_MODE_MASK BIT(30)
> +#define GLB_SLOW_TICK_RATIO_MASK GENMASK(29, 16)
> +#define GLB_FAST_TICK_MASK GENMASK(15, 0)
> +
> +#define REG_TXQ_CNGST_CFG 0x10a0
> +#define TXQ_CNGST_DROP_EN BIT(31)
> +#define TXQ_CNGST_DEI_DROP_EN BIT(30)
> +
> +#define REG_SLA_TRTCM_CFG 0x1150
> +#define SLA_TRTCM_EN_MASK BIT(31)
> +#define SLA_TRTCM_MODE_MASK BIT(30)
> +#define SLA_SLOW_TICK_RATIO_MASK GENMASK(29, 16)
> +#define SLA_FAST_TICK_MASK GENMASK(15, 0)
> +
> +/* CTRL */
> +#define QDMA_DESC_DONE_MASK BIT(31)
> +#define QDMA_DESC_DROP_MASK BIT(30) /* tx: drop pkt - rx: overflow */
> +#define QDMA_DESC_MORE_MASK BIT(29) /* more SG elements */
> +#define QDMA_DESC_DEI_MASK BIT(25)
> +#define QDMA_DESC_NO_DROP_MASK BIT(24)
> +#define QDMA_DESC_LEN_MASK GENMASK(15, 0)
> +/* DATA */
> +#define QDMA_DESC_NEXT_ID_MASK GENMASK(15, 0)
> +/* MSG0 */
> +#define QDMA_ETH_TXMSG_MIC_IDX_MASK BIT(30)
> +#define QDMA_ETH_TXMSG_SP_TAG_MASK GENMASK(29, 14)
> +#define QDMA_ETH_TXMSG_ICO_MASK BIT(13)
> +#define QDMA_ETH_TXMSG_UCO_MASK BIT(12)
> +#define QDMA_ETH_TXMSG_TCO_MASK BIT(11)
> +#define QDMA_ETH_TXMSG_TSO_MASK BIT(10)
> +#define QDMA_ETH_TXMSG_FAST_MASK BIT(9)
> +#define QDMA_ETH_TXMSG_OAM_MASK BIT(8)
> +#define QDMA_ETH_TXMSG_CHAN_MASK GENMASK(7, 3)
> +#define QDMA_ETH_TXMSG_QUEUE_MASK GENMASK(2, 0)
> +/* MSG1 */
> +#define QDMA_ETH_TXMSG_NO_DROP BIT(31)
> +#define QDMA_ETH_TXMSG_METER_MASK GENMASK(30, 24) /* 0x7f means do not apply meters */
> +#define QDMA_ETH_TXMSG_FPORT_MASK GENMASK(23, 20)
> +#define QDMA_ETH_TXMSG_NBOQ_MASK GENMASK(19, 15)
> +#define QDMA_ETH_TXMSG_HWF_MASK BIT(14)
> +#define QDMA_ETH_TXMSG_HOP_MASK BIT(13)
> +#define QDMA_ETH_TXMSG_PTP_MASK BIT(12)
> +#define QDMA_ETH_TXMSG_ACNT_G1_MASK GENMASK(10, 6) /* 0x1f means do not count */
> +#define QDMA_ETH_TXMSG_ACNT_G0_MASK GENMASK(5, 0) /* 0x3f means do not count */
> +
> +struct airoha_qdma_desc {
> + __le32 rsv;
> + __le32 ctrl;
> + __le32 addr;
> + __le32 data;
> + __le32 msg0;
> + __le32 msg1;
> + __le32 msg2;
> + __le32 msg3;
> +};
> +
> +/* CTRL0 */
> +#define QDMA_FWD_DESC_CTX_MASK BIT(31)
> +#define QDMA_FWD_DESC_RING_MASK GENMASK(30, 28)
> +#define QDMA_FWD_DESC_IDX_MASK GENMASK(27, 16)
> +#define QDMA_FWD_DESC_LEN_MASK GENMASK(15, 0)
> +/* CTRL1 */
> +#define QDMA_FWD_DESC_FIRST_IDX_MASK GENMASK(15, 0)
> +/* CTRL2 */
> +#define QDMA_FWD_DESC_MORE_PKT_NUM_MASK GENMASK(2, 0)
> +
> +struct airoha_qdma_fwd_desc {
> + __le32 addr;
> + __le32 ctrl0;
> + __le32 ctrl1;
> + __le32 ctrl2;
> + __le32 msg0;
> + __le32 msg1;
> + __le32 rsv0;
> + __le32 rsv1;
> +};
> +
> +enum {
> + QDMA_INT_REG_IDX0,
> + QDMA_INT_REG_IDX1,
> + QDMA_INT_REG_IDX2,
> + QDMA_INT_REG_IDX3,
> + QDMA_INT_REG_IDX4,
> + QDMA_INT_REG_MAX
> +};
> +
> +enum airoha_dport {
> + DPORT_PDMA,
> + DPORT_GDM1,
> + DPORT_GDM2,
> + DPORT_GDM3,
> + DPORT_PPE,
> + DPORT_QDMA,
> + DPORT_QDMA_HW,
> + DPORT_DISCARD,
> + DPORT_GDM4 = 9,
> +};
> +
> +enum {
> + FE_DP_CPU,
> + FE_DP_GDM1,
> + FE_DP_GDM2,
> + FE_DP_QDMA1_HWF,
> + FE_DP_GDMA3_HWF = 3,
> + FE_DP_PPE,
> + FE_DP_QDMA2_CPU,
> + FE_DP_QDMA2_HWF,
> + FE_DP_DISCARD,
> + FE_DP_PPE2 = 8,
> + FE_DP_DROP = 15,
> +};
> +
> +enum {
> + CDM_CRSN_QSEL_Q1 = 1,
> + CDM_CRSN_QSEL_Q5 = 5,
> + CDM_CRSN_QSEL_Q6 = 6,
> + CDM_CRSN_QSEL_Q15 = 15,
> +};
> +
> +enum {
> + CRSN_08 = 0x8,
> + CRSN_21 = 0x15, /* KA */
> + CRSN_22 = 0x16, /* hit bind and force route to CPU */
> + CRSN_24 = 0x18,
> + CRSN_25 = 0x19,
> +};
> +
> +enum {
> + DEV_STATE_INITIALIZED,
> +};
> +
> +struct airoha_queue_entry {
> + union {
> + void *buf;
> + struct sk_buff *skb;
> + };
> + dma_addr_t dma_addr;
> + u16 dma_len;
> +};
> +
> +struct airoha_queue {
> + struct airoha_eth *eth;
> +
> + spinlock_t lock;
> + struct airoha_queue_entry *entry;
> + struct airoha_qdma_desc *desc;
> + u16 head;
> + u16 tail;
> +
> + int queued;
> + int ndesc;
> + int free_thr;
> + int buf_size;
> +
> + struct napi_struct napi;
> + struct page_pool *page_pool;
> +};
> +
> +struct airoha_tx_irq_queue {
> + struct airoha_eth *eth;
> +
> + struct napi_struct napi;
> + u32 *q;
> +
> + int size;
> + int queued;
> + u16 head;
> +};
> +
> +struct airoha_eth {
> + struct net_device *net_dev;
> +
> + unsigned long state;
> +
> + void __iomem *qdma_regs;
> + void __iomem *fe_regs;
> +
> + spinlock_t irq_lock;
> + u32 irqmask[QDMA_INT_REG_MAX];
> + int irq;
> +
> + struct reset_control_bulk_data rsts[AIROHA_MAX_NUM_RSTS];
> + struct reset_control_bulk_data xsi_rsts[AIROHA_MAX_NUM_XSI_RSTS];
> +
> + struct airoha_queue q_tx[AIROHA_NUM_TX_RING];
> + struct airoha_queue q_rx[AIROHA_NUM_RX_RING];
> +
> + struct airoha_tx_irq_queue q_tx_irq[AIROHA_NUM_TX_IRQ];
> +
> + /* descriptor and packet buffers for qdma hw forward */
> + struct {
> + void *desc;
> + void *q;
> + } hfwd;
> +
> + struct dentry *debugfs_dir;
> +};
> +
> +#define airoha_qdma_for_each_q_rx(eth, i) \
> + for (i = 0; i < ARRAY_SIZE((eth)->q_rx); i++) \
> + if ((eth)->q_rx[i].ndesc)
> +
> +static inline void airoha_qdma_start_napi(struct airoha_eth *eth)
> +{
> + int i;
> +
> + for (i = 0; i < ARRAY_SIZE(eth->q_tx_irq); i++)
> + napi_enable(&eth->q_tx_irq[i].napi);
> +
> + airoha_qdma_for_each_q_rx(eth, i)
> + napi_enable(&eth->q_rx[i].napi);
> +}
> +
> +static inline void airoha_qdma_stop_napi(struct airoha_eth *eth)
> +{
> + int i;
> +
> + for (i = 0; i < ARRAY_SIZE(eth->q_tx_irq); i++)
> + napi_disable(&eth->q_tx_irq[i].napi);
> +
> + airoha_qdma_for_each_q_rx(eth, i)
> + napi_disable(&eth->q_rx[i].napi);
> +}
> --
> 2.45.1
>