Re: [PATCH net-next 3/3] net: airoha: Introduce ethernet support for EN7581 SoC

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



> On 2024-05-31 at 15:52:20, Lorenzo Bianconi (lorenzo@xxxxxxxxxx) wrote:
> > +
> > +static int airoha_qdma_fill_rx_queue(struct airoha_queue *q)
> > +{
> > +	struct airoha_eth *eth = q->eth;
> > +	struct device *dev = eth->net_dev->dev.parent;
> > +	int qid = q - &eth->q_rx[0], nframes = 0;
> > +
> > +	spin_lock_bh(&q->lock);
> > +	while (q->queued < q->ndesc - 1) {
> > +		struct airoha_queue_entry *e = &q->entry[q->head];
> > +		struct airoha_qdma_desc *desc = &q->desc[q->head];
> > +		enum dma_data_direction dir;
> > +		struct page *page;
> > +		int offset;
> > +		u32 val;
> > +
> > +		page = page_pool_dev_alloc_frag(q->page_pool, &offset,
> > +						q->buf_size);
> > +		if (!page)
> > +			break;
> > +
> > +		q->head = (q->head + 1) % q->ndesc;
> q-ndesc is a multiple of 2 ? (q->head + 1)& ~(q-ndesc - 1) would yeild less instruction
> and would suffice right ?

maybe we can just leave as it is if in the future we would change the queue
size?

> > +		q->queued++;
> > +		nframes++;
> > +
> > +		e->buf = page_address(page) + offset;
> > +		e->dma_addr = page_pool_get_dma_addr(page) + offset;
> > +		e->dma_len = SKB_WITH_OVERHEAD(q->buf_size);
> > +		dir = page_pool_get_dma_dir(q->page_pool);
> can we move this out from while loop ? as it will be same for the queue

ack, I will do in v2.

> > +		dma_sync_single_for_device(dev, e->dma_addr, e->dma_len, dir);
> > +
> > +		val = FIELD_PREP(QDMA_DESC_LEN_MASK, e->dma_len);
> > +		WRITE_ONCE(desc->ctrl, cpu_to_le32(val));
> > +		WRITE_ONCE(desc->addr, cpu_to_le32(e->dma_addr));
> > +		val = FIELD_PREP(QDMA_DESC_NEXT_ID_MASK, q->head);
> > +		WRITE_ONCE(desc->data, cpu_to_le32(val));
> > +		WRITE_ONCE(desc->msg0, 0);
> > +		WRITE_ONCE(desc->msg1, 0);
> > +		WRITE_ONCE(desc->msg2, 0);
> > +		WRITE_ONCE(desc->msg3, 0);
> > +
> > +		wmb();
> > +		airoha_qdma_rmw(eth, REG_RX_CPU_IDX(qid), RX_RING_CPU_IDX_MASK,
> > +				FIELD_PREP(RX_RING_CPU_IDX_MASK, q->head));
> > +	}
> > +	spin_unlock_bh(&q->lock);
> > +
> > +	return nframes;
> > +}
> > +
> > +static int airoha_qdma_rx_process(struct airoha_queue *q, int budget)
> > +{
> > +	struct airoha_eth *eth = q->eth;
> > +	struct device *dev = eth->net_dev->dev.parent;
> > +	int done = 0, qid = q - &eth->q_rx[0];
> Reverse xmas tree.

ack, I will do in v2.

> 
> > +
> > +	spin_lock_bh(&q->lock);
> > +	while (done < budget) {
> > +		struct airoha_queue_entry *e = &q->entry[q->tail];
> > +		struct airoha_qdma_desc *desc = &q->desc[q->tail];
> > +		dma_addr_t dma_addr = le32_to_cpu(desc->addr);
> > +		u32 desc_ctrl = le32_to_cpu(desc->ctrl);
> > +		struct sk_buff *skb;
> > +		int len;
> > +
> > +		if (!(desc_ctrl & QDMA_DESC_DONE_MASK))
> > +			break;
> > +
> > +		len = FIELD_GET(QDMA_DESC_LEN_MASK, desc_ctrl);
> > +		if (!dma_addr || !len)
> > +			break;
> > +
> > +		q->tail = (q->tail + 1) % q->ndesc;
> > +		q->queued--;
> > +
> > +		dma_sync_single_for_cpu(dev, dma_addr,
> > +					SKB_WITH_OVERHEAD(q->buf_size),
> > +					page_pool_get_dma_dir(q->page_pool));
> > +
> > +		skb = napi_build_skb(e->buf, q->buf_size);
> > +		if (!skb) {
> > +			page_pool_put_full_page(q->page_pool,
> > +						virt_to_head_page(e->buf),
> > +						true);
> > +			continue;
> How while loop exist as done is not getting incremented in case is nap_build_skb() keeps
> failing ?

ack, right. I will fix it in v2

> > +		}
> > +
> > +		skb_reserve(skb, 2);
> > +		__skb_put(skb, len);
> > +
> > +		skb_mark_for_recycle(skb);
> > +		skb->dev = eth->net_dev;
> > +		skb->protocol = eth_type_trans(skb, eth->net_dev);
> > +		skb->ip_summed = CHECKSUM_UNNECESSARY;
> > +		skb_record_rx_queue(skb, qid);
> > +		napi_gro_receive(&q->napi, skb);
> > +
> > +		done++;
> > +	}
> > +	spin_unlock_bh(&q->lock);
> > +
> > +	airoha_qdma_fill_rx_queue(q);
> > +
> > +	return done;
> > +}
> > +
> > +static int airoha_qdma_rx_napi_poll(struct napi_struct *napi, int budget)
> > +{
> > +	struct airoha_queue *q = container_of(napi, struct airoha_queue, napi);
> > +	struct airoha_eth *eth = q->eth;
> > +	int cur, done = 0;
> > +
> > +	do {
> > +		cur = airoha_qdma_rx_process(q, budget - done);
> > +		done += cur;
> > +	} while (cur && done < budget);
> > +
> > +	if (done < budget && napi_complete(napi))
> > +		airoha_qdma_irq_enable(eth, QDMA_INT_REG_IDX1,
> > +				       RX_DONE_INT_MASK);
> > +
> > +	return done;
> > +}
> > +
> > +static int airoha_qdma_init_rx_queue(struct airoha_eth *eth,
> > +				     struct airoha_queue *q, int ndesc)
> > +{
> > +	struct device *dev = eth->net_dev->dev.parent;
> > +	struct page_pool_params pp_params = {
> > +		.order = 0,
> > +		.pool_size = 256,
> > +		.flags = PP_FLAG_DMA_MAP | PP_FLAG_DMA_SYNC_DEV,
> > +		.dma_dir = DMA_FROM_DEVICE,
> > +		.max_len = PAGE_SIZE,
> > +		.nid = NUMA_NO_NODE,
> > +		.dev = dev,
> > +		.napi = &q->napi,
> > +	};
> > +	int qid = q - &eth->q_rx[0], thr;
> > +	dma_addr_t dma_addr;
> > +
> > +	spin_lock_init(&q->lock);
> > +	q->buf_size = PAGE_SIZE / 2;
> > +	q->ndesc = ndesc;
> > +	q->eth = eth;
> > +
> > +	q->entry = devm_kzalloc(dev, q->ndesc * sizeof(*q->entry),
> > +				GFP_KERNEL);
> > +	if (!q->entry)
> > +		return -ENOMEM;
> > +
> > +	q->page_pool = page_pool_create(&pp_params);
> > +	if (IS_ERR(q->page_pool)) {
> > +		int err = PTR_ERR(q->page_pool);
> > +
> > +		q->page_pool = NULL;
> > +		return err;
> > +	}
> > +
> > +	q->desc = dmam_alloc_coherent(dev, q->ndesc * sizeof(*q->desc),
> > +				      &dma_addr, GFP_KERNEL);
> > +	if (!q->desc)
> Dont we need to destroy the page pool ?

ack, right. I will fix it in v2

> > +		return -ENOMEM;
> > +
> > +	netif_napi_add(eth->net_dev, &q->napi, airoha_qdma_rx_napi_poll);
> > +
> > +	airoha_qdma_wr(eth, REG_RX_RING_BASE(qid), dma_addr);
> > +	airoha_qdma_rmw(eth, REG_RX_RING_SIZE(qid), RX_RING_SIZE_MASK,
> > +			FIELD_PREP(RX_RING_SIZE_MASK, ndesc));
> > +
> > +	thr = clamp(ndesc >> 3, 1, 32);
> > +	airoha_qdma_rmw(eth, REG_RX_RING_SIZE(qid), RX_RING_THR_MASK,
> > +			FIELD_PREP(RX_RING_THR_MASK, thr));
> > +	airoha_qdma_rmw(eth, REG_RX_DMA_IDX(qid), RX_RING_DMA_IDX_MASK,
> > +			FIELD_PREP(RX_RING_DMA_IDX_MASK, q->head));
> > +
> > +	airoha_qdma_fill_rx_queue(q);
> > +
> > +	return 0;
> > +}
> > +
> > +static void airoha_qdma_clenaup_rx_queue(struct airoha_queue *q)
> > +{
> > +	struct airoha_eth *eth = q->eth;
> > +	struct device *dev = eth->net_dev->dev.parent;
> Reverse xmas tree.

ack, right. I will do it in v2

> > +
> > +	spin_lock_bh(&q->lock);
> > +
> > +	while (q->queued) {
> > +		struct airoha_queue_entry *e = &q->entry[q->tail];
> > +		struct page *page = virt_to_head_page(e->buf);
> > +		enum dma_data_direction dir;
> > +
> > +		dir = page_pool_get_dma_dir(q->page_pool);
> can we move this out of while loop ?

ack, right. I will do it in v2

Regards,
Lorenzo

> 
> > +		dma_sync_single_for_cpu(dev, e->dma_addr, e->dma_len, dir);
> > +		page_pool_put_full_page(q->page_pool, page, false);
> > +		q->tail = (q->tail + 1) % q->ndesc;
> > +		q->queued--;
> > +	}
> > +
> > +	spin_unlock_bh(&q->lock);
> > +}
> > +
> > +static int airoha_qdma_init_rx(struct airoha_eth *eth)
> > +{
> > +	int i;
> > +
> > +	for (i = 0; i < ARRAY_SIZE(eth->q_rx); i++) {
> > +		int err;
> > +
> > +		if (!(RX_DONE_INT_MASK & BIT(i))) {
> > +			/* rx-queue not binded to irq */
> > +			continue;
> > +		}
> > +
> > +		err = airoha_qdma_init_rx_queue(eth, &eth->q_rx[i],
> > +						RX_DSCP_NUM(i));
> > +		if (err)
> > +			return err;
> > +	}
> > +
> > +	return 0;
> > +}
> > +
> > +static int airoha_qdma_tx_napi_poll(struct napi_struct *napi, int budget)
> > +{
> > +	struct airoha_tx_irq_queue *irq_q;
> > +	struct airoha_eth *eth;
> > +	struct device *dev;
> > +	int id, done = 0;
> > +
> > +	irq_q = container_of(napi, struct airoha_tx_irq_queue, napi);
> > +	eth = irq_q->eth;
> > +	id = irq_q - &eth->q_tx_irq[0];
> > +	dev = eth->net_dev->dev.parent;
> > +
> > +	while (irq_q->queued > 0 && done < budget) {
> > +		u32 qid, last, val = irq_q->q[irq_q->head];
> > +		struct airoha_queue *q;
> > +
> > +		if (val == 0xff)
> > +			break;
> > +
> > +		irq_q->q[irq_q->head] = 0xff; /* mark as done */
> > +		irq_q->head = (irq_q->head + 1) % irq_q->size;
> > +		irq_q->queued--;
> > +		done++;
> > +
> > +		last = FIELD_GET(IRQ_DESC_IDX_MASK, val);
> > +		qid = FIELD_GET(IRQ_RING_IDX_MASK, val);
> > +
> > +		if (qid >= ARRAY_SIZE(eth->q_tx))
> > +			continue;
> > +
> > +		q = &eth->q_tx[qid];
> > +		spin_lock_bh(&q->lock);
> > +
> > +		while (q->queued > 0) {
> > +			struct airoha_qdma_desc *desc = &q->desc[q->tail];
> > +			struct airoha_queue_entry *e = &q->entry[q->tail];
> > +			u32 desc_ctrl = le32_to_cpu(desc->ctrl);
> > +			u16 index = q->tail;
> > +
> > +			if (!(desc_ctrl & QDMA_DESC_DONE_MASK) &&
> > +			    !(desc_ctrl & QDMA_DESC_DROP_MASK))
> > +				break;
> > +
> > +			q->tail = (q->tail + 1) % q->ndesc;
> > +			q->queued--;
> > +
> > +			dma_unmap_single(dev, e->dma_addr, e->dma_len,
> > +					 DMA_TO_DEVICE);
> > +			dev_kfree_skb_any(e->skb);
> > +			e->skb = NULL;
> > +
> > +			WRITE_ONCE(desc->msg0, 0);
> > +			WRITE_ONCE(desc->msg1, 0);
> > +
> > +			if (index == last)
> > +				break;
> > +		}
> > +
> > +		if (__netif_subqueue_stopped(eth->net_dev, qid) &&
> > +		    q->queued + q->free_thr < q->ndesc)
> > +			netif_wake_subqueue(eth->net_dev, qid);
> > +
> > +		spin_unlock_bh(&q->lock);
> > +	}
> > +
> > +	if (done) {
> > +		int i, len = done >> 7;
> > +
> > +		for (i = 0; i < len; i++)
> > +			airoha_qdma_rmw(eth, REG_IRQ_CLEAR_LEN(id),
> > +					IRQ_CLEAR_LEN_MASK, 0x80);
> > +		airoha_qdma_rmw(eth, REG_IRQ_CLEAR_LEN(id),
> > +				IRQ_CLEAR_LEN_MASK, (done & 0x7f));
> > +	}
> > +
> > +	if (done < budget && napi_complete(napi))
> > +		airoha_qdma_irq_enable(eth, QDMA_INT_REG_IDX0,
> > +				       TX_DONE_INT_MASK(id));
> > +
> > +	return done;
> > +}
> > +
> > +static int airoha_qdma_init_tx_queue(struct airoha_eth *eth,
> > +				     struct airoha_queue *q, int size)
> > +{
> > +	struct device *dev = eth->net_dev->dev.parent;
> > +	int i, qid = q - &eth->q_tx[0];
> > +	dma_addr_t dma_addr;
> > +
> > +	spin_lock_init(&q->lock);
> > +	q->ndesc = size;
> > +	q->eth = eth;
> > +	q->free_thr = MAX_SKB_FRAGS;
> > +
> > +	q->entry = devm_kzalloc(dev, q->ndesc * sizeof(*q->entry),
> > +				GFP_KERNEL);
> > +	if (!q->entry)
> > +		return -ENOMEM;
> > +
> > +	q->desc = dmam_alloc_coherent(dev, q->ndesc * sizeof(*q->desc),
> > +				      &dma_addr, GFP_KERNEL);
> > +	if (!q->desc)
> > +		return -ENOMEM;
> > +
> > +	for (i = 0; i < q->ndesc; i++) {
> > +		u32 val;
> > +
> > +		val = FIELD_PREP(QDMA_DESC_DONE_MASK, 1);
> > +		WRITE_ONCE(q->desc[i].ctrl, cpu_to_le32(val));
> > +	}
> > +
> > +	airoha_qdma_wr(eth, REG_TX_RING_BASE(qid), dma_addr);
> > +	airoha_qdma_rmw(eth, REG_TX_CPU_IDX(qid), TX_RING_CPU_IDX_MASK,
> > +			FIELD_PREP(TX_RING_CPU_IDX_MASK, q->head));
> > +	airoha_qdma_rmw(eth, REG_TX_DMA_IDX(qid), TX_RING_DMA_IDX_MASK,
> > +			FIELD_PREP(TX_RING_DMA_IDX_MASK, q->head));
> > +
> > +	return 0;
> > +}
> > +
> > +static int airoha_qdma_tx_irq_init(struct airoha_eth *eth,
> > +				   struct airoha_tx_irq_queue *irq_q,
> > +				   int size)
> > +{
> > +	struct device *dev = eth->net_dev->dev.parent;
> > +	int id = irq_q - &eth->q_tx_irq[0];
> > +	dma_addr_t dma_addr;
> > +
> > +	netif_napi_add(eth->net_dev, &irq_q->napi, airoha_qdma_tx_napi_poll);
> > +	irq_q->q = dmam_alloc_coherent(dev, size * sizeof(u32), &dma_addr,
> > +				       GFP_KERNEL);
> > +	if (!irq_q->q)
> > +		return -ENOMEM;
> > +
> > +	memset(irq_q->q, 0xff, size * sizeof(u32));
> > +	irq_q->size = size;
> > +	irq_q->eth = eth;
> > +
> > +	airoha_qdma_wr(eth, REG_TX_IRQ_BASE(id), dma_addr);
> > +	airoha_qdma_rmw(eth, REG_TX_IRQ_CFG(id), TX_IRQ_DEPTH_MASK,
> > +			FIELD_PREP(TX_IRQ_DEPTH_MASK, size));
> > +	airoha_qdma_rmw(eth, REG_TX_IRQ_CFG(id), TX_IRQ_THR_MASK,
> > +			FIELD_PREP(TX_IRQ_THR_MASK, 32));
> > +
> > +	return 0;
> > +}
> > +
> > +static int airoha_qdma_init_tx(struct airoha_eth *eth)
> > +{
> > +	int i, err;
> > +
> > +	for (i = 0; i < ARRAY_SIZE(eth->q_tx_irq); i++) {
> > +		err = airoha_qdma_tx_irq_init(eth, &eth->q_tx_irq[i],
> > +					      IRQ_QUEUE_LEN(i));
> > +		if (err)
> > +			return err;
> > +	}
> > +
> > +	for (i = 0; i < ARRAY_SIZE(eth->q_tx); i++) {
> > +		err = airoha_qdma_init_tx_queue(eth, &eth->q_tx[i],
> > +						TX_DSCP_NUM);
> > +		if (err)
> > +			return err;
> > +	}
> > +
> > +	return 0;
> > +}
> > +
> > +static void airoha_qdma_clenaup_tx_queue(struct airoha_queue *q)
> > +{
> > +	struct airoha_eth *eth = q->eth;
> > +	struct device *dev = eth->net_dev->dev.parent;
> > +
> > +	spin_lock_bh(&q->lock);
> > +
> > +	while (q->queued) {
> > +		struct airoha_queue_entry *e = &q->entry[q->tail];
> > +
> > +		dma_unmap_single(dev, e->dma_addr, e->dma_len, DMA_TO_DEVICE);
> > +		dev_kfree_skb_any(e->skb);
> > +		e->skb = NULL;
> > +
> > +		q->tail = (q->tail + 1) % q->ndesc;
> > +		q->queued--;
> > +	}
> > +
> > +	spin_unlock_bh(&q->lock);
> > +}
> > +
> > +static int airoha_qdma_init_hfwd_queues(struct airoha_eth *eth)
> > +{
> > +	struct device *dev = eth->net_dev->dev.parent;
> > +	dma_addr_t dma_addr;
> > +	u32 status;
> > +	int size;
> > +
> > +	size = HW_DSCP_NUM * sizeof(struct airoha_qdma_fwd_desc);
> > +	eth->hfwd.desc = dmam_alloc_coherent(dev, size, &dma_addr,
> > +					     GFP_KERNEL);
> > +	if (!eth->hfwd.desc)
> > +		return -ENOMEM;
> > +
> > +	airoha_qdma_wr(eth, REG_FWD_DSCP_BASE, dma_addr);
> > +
> > +	size = AIROHA_MAX_PACKET_SIZE * HW_DSCP_NUM;
> > +	eth->hfwd.q = dmam_alloc_coherent(dev, size, &dma_addr, GFP_KERNEL);
> > +	if (!eth->hfwd.q)
> > +		return -ENOMEM;
> > +
> > +	airoha_qdma_wr(eth, REG_FWD_BUF_BASE, dma_addr);
> > +
> > +	airoha_qdma_rmw(eth, REG_HW_FWD_DSCP_CFG,
> > +			HW_FWD_DSCP_PAYLOAD_SIZE_MASK,
> > +			FIELD_PREP(HW_FWD_DSCP_PAYLOAD_SIZE_MASK, 0));
> > +	airoha_qdma_rmw(eth, REG_FWD_DSCP_LOW_THR, FWD_DSCP_LOW_THR_MASK,
> > +			FIELD_PREP(FWD_DSCP_LOW_THR_MASK, 128));
> > +	airoha_qdma_rmw(eth, REG_LMGR_INIT_CFG,
> > +			LMGR_INIT_START | LMGR_SRAM_MODE_MASK |
> > +			HW_FWD_DESC_NUM_MASK,
> > +			FIELD_PREP(HW_FWD_DESC_NUM_MASK, HW_DSCP_NUM) |
> > +			LMGR_INIT_START);
> > +
> > +	return read_poll_timeout(airoha_qdma_rr, status,
> > +				 !(status & LMGR_INIT_START), USEC_PER_MSEC,
> > +				 30 * USEC_PER_MSEC, true, eth,
> > +				 REG_LMGR_INIT_CFG);
> > +}
> > +
> > +static void airoha_qdma_init_qos(struct airoha_eth *eth)
> > +{
> > +	airoha_qdma_clear(eth, REG_TXWRR_MODE_CFG, TWRR_WEIGHT_SCALE_MASK);
> > +	airoha_qdma_set(eth, REG_TXWRR_MODE_CFG, TWRR_WEIGHT_BASE_MASK);
> > +
> > +	airoha_qdma_clear(eth, REG_PSE_BUF_USAGE_CFG,
> > +			  PSE_BUF_ESTIMATE_EN_MASK);
> > +
> > +	airoha_qdma_set(eth, REG_EGRESS_RATE_METER_CFG,
> > +			EGRESS_RATE_METER_EN_MASK |
> > +			EGRESS_RATE_METER_EQ_RATE_EN_MASK);
> > +	/* 2047us x 31 = 63.457ms */
> > +	airoha_qdma_rmw(eth, REG_EGRESS_RATE_METER_CFG,
> > +			EGRESS_RATE_METER_WINDOW_SZ_MASK,
> > +			FIELD_PREP(EGRESS_RATE_METER_WINDOW_SZ_MASK, 0x1f));
> > +	airoha_qdma_rmw(eth, REG_EGRESS_RATE_METER_CFG,
> > +			EGRESS_RATE_METER_TIMESLICE_MASK,
> > +			FIELD_PREP(EGRESS_RATE_METER_TIMESLICE_MASK, 0x7ff));
> > +
> > +	/* ratelimit init */
> > +	airoha_qdma_set(eth, REG_GLB_TRTCM_CFG, GLB_TRTCM_EN_MASK);
> > +	airoha_qdma_rmw(eth, REG_GLB_TRTCM_CFG, GLB_FAST_TICK_MASK,
> > +			FIELD_PREP(GLB_FAST_TICK_MASK, 25)); /* fast-tick 25us */
> > +	airoha_qdma_rmw(eth, REG_GLB_TRTCM_CFG, GLB_SLOW_TICK_RATIO_MASK,
> > +			FIELD_PREP(GLB_SLOW_TICK_RATIO_MASK, 40));
> > +
> > +	airoha_qdma_set(eth, REG_EGRESS_TRTCM_CFG, EGRESS_TRTCM_EN_MASK);
> > +	airoha_qdma_rmw(eth, REG_EGRESS_TRTCM_CFG, EGRESS_FAST_TICK_MASK,
> > +			FIELD_PREP(EGRESS_FAST_TICK_MASK, 25));
> > +	airoha_qdma_rmw(eth, REG_EGRESS_TRTCM_CFG,
> > +			EGRESS_SLOW_TICK_RATIO_MASK,
> > +			FIELD_PREP(EGRESS_SLOW_TICK_RATIO_MASK, 40));
> > +
> > +	airoha_qdma_set(eth, REG_INGRESS_TRTCM_CFG, INGRESS_TRTCM_EN_MASK);
> > +	airoha_qdma_clear(eth, REG_INGRESS_TRTCM_CFG,
> > +			  INGRESS_TRTCM_MODE_MASK);
> > +	airoha_qdma_rmw(eth, REG_INGRESS_TRTCM_CFG, INGRESS_FAST_TICK_MASK,
> > +			FIELD_PREP(INGRESS_FAST_TICK_MASK, 125));
> > +	airoha_qdma_rmw(eth, REG_INGRESS_TRTCM_CFG,
> > +			INGRESS_SLOW_TICK_RATIO_MASK,
> > +			FIELD_PREP(INGRESS_SLOW_TICK_RATIO_MASK, 8));
> > +
> > +	airoha_qdma_set(eth, REG_SLA_TRTCM_CFG, SLA_TRTCM_EN_MASK);
> > +	airoha_qdma_rmw(eth, REG_SLA_TRTCM_CFG, SLA_FAST_TICK_MASK,
> > +			FIELD_PREP(SLA_FAST_TICK_MASK, 25));
> > +	airoha_qdma_rmw(eth, REG_SLA_TRTCM_CFG, SLA_SLOW_TICK_RATIO_MASK,
> > +			FIELD_PREP(SLA_SLOW_TICK_RATIO_MASK, 40));
> > +}
> > +
> > +static int airoha_qdma_hw_init(struct airoha_eth *eth)
> > +{
> > +	int i;
> > +
> > +	/* clear pending irqs */
> > +	for (i = 0; i < ARRAY_SIZE(eth->irqmask); i++)
> > +		airoha_qdma_wr(eth, REG_INT_STATUS(i), 0xffffffff);
> > +
> > +	/* setup irqs */
> > +	airoha_qdma_irq_enable(eth, QDMA_INT_REG_IDX0, INT_IDX0_MASK);
> > +	airoha_qdma_irq_enable(eth, QDMA_INT_REG_IDX1, INT_IDX1_MASK);
> > +	airoha_qdma_irq_enable(eth, QDMA_INT_REG_IDX4, INT_IDX4_MASK);
> > +
> > +	/* setup irq binding */
> > +	for (i = 0; i < ARRAY_SIZE(eth->q_tx); i++) {
> > +		if (TX_RING_IRQ_BLOCKING_MAP_MASK & BIT(i))
> > +			airoha_qdma_set(eth, REG_TX_RING_BLOCKING(i),
> > +					TX_RING_IRQ_BLOCKING_CFG_MASK);
> > +		else
> > +			airoha_qdma_clear(eth, REG_TX_RING_BLOCKING(i),
> > +					  TX_RING_IRQ_BLOCKING_CFG_MASK);
> > +	}
> > +
> > +	airoha_qdma_wr(eth, REG_QDMA_GLOBAL_CFG,
> > +		       GLOBAL_CFG_RX_2B_OFFSET |
> > +		       FIELD_PREP(GLOBAL_CFG_DMA_PREFERENCE_MASK, 3) |
> > +		       GLOBAL_CFG_CPU_TXR_ROUND_ROBIN |
> > +		       GLOBAL_CFG_PAYLOAD_BYTE_SWAP |
> > +		       GLOBAL_CFG_MULTICAST_MODIFY_FP |
> > +		       GLOBAL_CFG_MULTICAST_EN_MASK |
> > +		       GLOBAL_CFG_IRQ0_EN | GLOBAL_CFG_IRQ1_EN |
> > +		       GLOBAL_CFG_TX_WB_DONE |
> > +		       FIELD_PREP(GLOBAL_CFG_MAX_ISSUE_NUM_MASK, 2));
> > +
> > +	airoha_qdma_init_qos(eth);
> > +
> > +	/* disable qdma rx delay interrupt */
> > +	airoha_qdma_for_each_q_rx(eth, i)
> > +		airoha_qdma_clear(eth, REG_RX_DELAY_INT_IDX(i),
> > +				  RX_DELAY_INT_MASK);
> > +
> > +	airoha_qdma_set(eth, REG_TXQ_CNGST_CFG,
> > +			TXQ_CNGST_DROP_EN | TXQ_CNGST_DEI_DROP_EN);
> > +
> > +	return 0;
> > +}
> > +
> > +static irqreturn_t airoha_irq_handler(int irq, void *dev_instance)
> > +{
> > +	struct airoha_eth *eth = dev_instance;
> > +	u32 intr[ARRAY_SIZE(eth->irqmask)];
> > +	int i;
> > +
> > +	for (i = 0; i < ARRAY_SIZE(eth->irqmask); i++) {
> > +		intr[i] = airoha_qdma_rr(eth, REG_INT_STATUS(i));
> > +		intr[i] &= eth->irqmask[i];
> > +		airoha_qdma_wr(eth, REG_INT_STATUS(i), intr[i]);
> > +	}
> > +
> > +	if (!test_bit(DEV_STATE_INITIALIZED, &eth->state))
> > +		return IRQ_NONE;
> > +
> > +	if (intr[1] & RX_DONE_INT_MASK) {
> > +		airoha_qdma_irq_disable(eth, QDMA_INT_REG_IDX1,
> > +					RX_DONE_INT_MASK);
> > +		airoha_qdma_for_each_q_rx(eth, i) {
> > +			if (intr[1] & BIT(i))
> > +				napi_schedule(&eth->q_rx[i].napi);
> > +		}
> > +	}
> > +
> > +	if (intr[0] & INT_TX_MASK) {
> > +		for (i = 0; i < ARRAY_SIZE(eth->q_tx_irq); i++) {
> > +			struct airoha_tx_irq_queue *irq_q = &eth->q_tx_irq[i];
> > +			u32 status, head;
> > +
> > +			if (!(intr[0] & TX_DONE_INT_MASK(i)))
> > +				continue;
> > +
> > +			airoha_qdma_irq_disable(eth, QDMA_INT_REG_IDX0,
> > +						TX_DONE_INT_MASK(i));
> > +
> > +			status = airoha_qdma_rr(eth, REG_IRQ_STATUS(i));
> > +			head = FIELD_GET(IRQ_HEAD_IDX_MASK, status);
> > +			irq_q->head = head % irq_q->size;
> > +			irq_q->queued = FIELD_GET(IRQ_ENTRY_LEN_MASK, status);
> > +
> > +			napi_schedule(&eth->q_tx_irq[i].napi);
> > +		}
> > +	}
> > +
> > +	return IRQ_HANDLED;
> > +}
> > +
> > +static int airoha_qdma_init(struct airoha_eth *eth)
> > +{
> > +	struct device *dev = eth->net_dev->dev.parent;
> > +	int err;
> > +
> > +	err = devm_request_irq(dev, eth->irq, airoha_irq_handler,
> > +			       IRQF_SHARED, KBUILD_MODNAME, eth);
> > +	if (err)
> > +		return err;
> > +
> > +	err = airoha_qdma_init_rx(eth);
> > +	if (err)
> > +		return err;
> > +
> > +	err = airoha_qdma_init_tx(eth);
> > +	if (err)
> > +		return err;
> > +
> > +	err = airoha_qdma_init_hfwd_queues(eth);
> > +	if (err)
> > +		return err;
> > +
> > +	err = airoha_qdma_hw_init(eth);
> > +	if (err)
> > +		return err;
> > +
> > +	set_bit(DEV_STATE_INITIALIZED, &eth->state);
> > +
> > +	return 0;
> > +}
> > +
> > +static int airoha_hw_init(struct airoha_eth *eth)
> > +{
> > +	int err;
> > +
> > +	/* disable xsi */
> > +	reset_control_bulk_assert(ARRAY_SIZE(eth->xsi_rsts), eth->xsi_rsts);
> > +
> > +	reset_control_bulk_assert(ARRAY_SIZE(eth->rsts), eth->rsts);
> > +	msleep(20);
> > +	reset_control_bulk_deassert(ARRAY_SIZE(eth->rsts), eth->rsts);
> > +	msleep(20);
> > +
> > +	err = airoha_fe_init(eth);
> > +	if (err)
> > +		return err;
> > +
> > +	return airoha_qdma_init(eth);
> > +}
> > +
> > +static int airoha_dev_open(struct net_device *dev)
> > +{
> > +	struct airoha_eth *eth = netdev_priv(dev);
> > +	int err;
> > +
> > +	if (netdev_uses_dsa(dev))
> > +		airoha_fe_set(eth, REG_GDM1_INGRESS_CFG, GDM1_STAG_EN_MASK);
> > +	else
> > +		airoha_fe_clear(eth, REG_GDM1_INGRESS_CFG, GDM1_STAG_EN_MASK);
> > +
> > +	netif_tx_start_all_queues(dev);
> > +	err = airoha_set_gdma_ports(eth, true);
> > +	if (err)
> > +		return err;
> > +
> > +	airoha_qdma_set(eth, REG_QDMA_GLOBAL_CFG, GLOBAL_CFG_TX_DMA_EN);
> > +	airoha_qdma_set(eth, REG_QDMA_GLOBAL_CFG, GLOBAL_CFG_RX_DMA_EN);
> > +
> > +	return 0;
> > +}
> > +
> > +static int airoha_dev_stop(struct net_device *dev)
> > +{
> > +	struct airoha_eth *eth = netdev_priv(dev);
> > +	int err;
> > +
> > +	netif_tx_disable(dev);
> > +	err = airoha_set_gdma_ports(eth, false);
> > +	if (err)
> > +		return err;
> > +
> > +	airoha_qdma_clear(eth, REG_QDMA_GLOBAL_CFG, GLOBAL_CFG_TX_DMA_EN);
> > +	airoha_qdma_clear(eth, REG_QDMA_GLOBAL_CFG, GLOBAL_CFG_RX_DMA_EN);
> > +
> > +	return 0;
> > +}
> > +
> > +static int airoha_dev_set_macaddr(struct net_device *dev, void *p)
> > +{
> > +	struct airoha_eth *eth = netdev_priv(dev);
> > +	int err;
> > +
> > +	err = eth_mac_addr(dev, p);
> > +	if (err)
> > +		return err;
> > +
> > +	airoha_set_macaddr(eth, dev->dev_addr);
> > +
> > +	return 0;
> > +}
> > +
> > +static int airoha_dev_init(struct net_device *dev)
> > +{
> > +	struct airoha_eth *eth = netdev_priv(dev);
> > +
> > +	airoha_set_macaddr(eth, dev->dev_addr);
> > +
> > +	return 0;
> > +}
> > +
> > +static netdev_tx_t airoha_dev_xmit(struct sk_buff *skb,
> > +				   struct net_device *dev)
> > +{
> > +	struct skb_shared_info *sinfo = skb_shinfo(skb);
> > +	u32 nr_frags = 1 + sinfo->nr_frags, msg0 = 0, msg1;
> > +	struct airoha_eth *eth = netdev_priv(dev);
> > +	int i, qid = skb_get_queue_mapping(skb);
> > +	u32 len = skb_headlen(skb);
> > +	struct airoha_queue *q;
> > +	void *data = skb->data;
> > +	u16 index;
> > +
> > +	if (skb->ip_summed == CHECKSUM_PARTIAL)
> > +		msg0 |= FIELD_PREP(QDMA_ETH_TXMSG_TCO_MASK, 1) |
> > +			FIELD_PREP(QDMA_ETH_TXMSG_UCO_MASK, 1) |
> > +			FIELD_PREP(QDMA_ETH_TXMSG_ICO_MASK, 1);
> > +
> > +	/* TSO: fill MSS info in tcp checksum field */
> > +	if (skb_is_gso(skb)) {
> > +		if (skb_cow_head(skb, 0))
> > +			goto error;
> > +
> > +		if (sinfo->gso_type & (SKB_GSO_TCPV4 | SKB_GSO_TCPV6)) {
> > +			tcp_hdr(skb)->check = cpu_to_be16(sinfo->gso_size);
> > +			msg0 |= FIELD_PREP(QDMA_ETH_TXMSG_TSO_MASK, 1);
> > +		}
> > +	}
> > +
> > +	msg1 = FIELD_PREP(QDMA_ETH_TXMSG_FPORT_MASK, DPORT_GDM1) |
> > +	       FIELD_PREP(QDMA_ETH_TXMSG_METER_MASK, 0x7f);
> > +
> > +	if (WARN_ON_ONCE(qid >= ARRAY_SIZE(eth->q_tx)))
> > +		qid = 0;
> > +
> > +	q = &eth->q_tx[qid];
> > +	spin_lock_bh(&q->lock);
> > +
> > +	if (q->queued + nr_frags > q->ndesc) {
> > +		/* not enough space in the queue */
> > +		spin_unlock_bh(&q->lock);
> > +		return NETDEV_TX_BUSY;
> > +	}
> > +
> > +	index = q->head;
> > +	for (i = 0; i < nr_frags; i++) {
> > +		struct airoha_qdma_desc *desc = &q->desc[index];
> > +		struct airoha_queue_entry *e = &q->entry[index];
> > +		skb_frag_t *frag = &sinfo->frags[i];
> > +		dma_addr_t addr;
> > +		u32 val;
> > +
> > +		addr = dma_map_single(dev->dev.parent, data, len,
> > +				      DMA_TO_DEVICE);
> > +		if (unlikely(dma_mapping_error(dev->dev.parent, addr)))
> > +			goto error_unmap;
> > +
> > +		index = (index + 1) % q->ndesc;
> > +
> > +		val = FIELD_PREP(QDMA_DESC_LEN_MASK, len);
> > +		if (i < nr_frags - 1)
> > +			val |= FIELD_PREP(QDMA_DESC_MORE_MASK, 1);
> > +		WRITE_ONCE(desc->ctrl, cpu_to_le32(val));
> > +		WRITE_ONCE(desc->addr, cpu_to_le32(addr));
> > +		val = FIELD_PREP(QDMA_DESC_NEXT_ID_MASK, index);
> > +		WRITE_ONCE(desc->data, cpu_to_le32(val));
> > +		WRITE_ONCE(desc->msg0, cpu_to_le32(msg0));
> > +		WRITE_ONCE(desc->msg1, cpu_to_le32(msg1));
> > +		WRITE_ONCE(desc->msg2, cpu_to_le32(0xffff));
> > +
> > +		e->skb = i ? NULL : skb;
> > +		e->dma_addr = addr;
> > +		e->dma_len = len;
> > +
> > +		wmb();
> > +		airoha_qdma_rmw(eth, REG_TX_CPU_IDX(qid), TX_RING_CPU_IDX_MASK,
> > +				FIELD_PREP(TX_RING_CPU_IDX_MASK, index));
> > +
> > +		data = skb_frag_address(frag);
> > +		len = skb_frag_size(frag);
> > +	}
> > +
> > +	q->head = index;
> > +	q->queued += i;
> > +
> > +	if (q->queued + q->free_thr >= q->ndesc)
> > +		netif_stop_subqueue(dev, qid);
> > +
> > +	spin_unlock_bh(&q->lock);
> > +
> > +	return NETDEV_TX_OK;
> > +
> > +error_unmap:
> > +	for (; i >= 0; i++)
> > +		dma_unmap_single(dev->dev.parent, q->entry[i].dma_addr,
> > +				 q->entry[i].dma_len, DMA_TO_DEVICE);
> > +
> > +	spin_unlock_bh(&q->lock);
> > +error:
> > +	dev_kfree_skb_any(skb);
> > +	dev->stats.tx_dropped++;
> > +
> > +	return NETDEV_TX_OK;
> > +}
> > +
> > +static int airoha_dev_change_mtu(struct net_device *dev, int new_mtu)
> > +{
> > +	dev->mtu = new_mtu;
> > +
> > +	return 0;
> > +}
> > +
> > +static const struct net_device_ops airoha_netdev_ops = {
> > +	.ndo_init		= airoha_dev_init,
> > +	.ndo_open		= airoha_dev_open,
> > +	.ndo_stop		= airoha_dev_stop,
> > +	.ndo_start_xmit		= airoha_dev_xmit,
> > +	.ndo_change_mtu		= airoha_dev_change_mtu,
> > +	.ndo_set_mac_address	= airoha_dev_set_macaddr,
> > +};
> > +
> > +static int airoha_rx_queues_show(struct seq_file *s, void *data)
> > +{
> > +	struct airoha_eth *eth = s->private;
> > +	int i;
> > +
> > +	seq_puts(s, "     queue | hw-queued |      head |      tail |\n");
> > +	airoha_qdma_for_each_q_rx(eth, i) {
> > +		struct airoha_queue *q = &eth->q_rx[i];
> > +
> > +		seq_printf(s, " %9d | %9d | %9d | %9d |\n",
> > +			   i, q->queued, q->head, q->tail);
> > +	}
> > +
> > +	return 0;
> > +}
> > +DEFINE_SHOW_ATTRIBUTE(airoha_rx_queues);
> > +
> > +static int airoha_xmit_queues_show(struct seq_file *s, void *data)
> > +{
> > +	struct airoha_eth *eth = s->private;
> > +	int i;
> > +
> > +	seq_puts(s, "     queue | hw-queued |      head |      tail |\n");
> > +	for (i = 0; i < ARRAY_SIZE(eth->q_tx); i++) {
> > +		struct airoha_queue *q = &eth->q_tx[i];
> > +
> > +		seq_printf(s, " %9d | %9d | %9d | %9d |\n",
> > +			   i, q->queued, q->head, q->tail);
> > +	}
> > +
> > +	return 0;
> > +}
> > +DEFINE_SHOW_ATTRIBUTE(airoha_xmit_queues);
> > +
> > +static int airoha_register_debugfs(struct airoha_eth *eth)
> > +{
> > +	eth->debugfs_dir = debugfs_create_dir(KBUILD_MODNAME, NULL);
> > +	if (IS_ERR(eth->debugfs_dir))
> > +		return PTR_ERR(eth->debugfs_dir);
> > +
> > +	debugfs_create_file("rx-queues", 0400, eth->debugfs_dir, eth,
> > +			    &airoha_rx_queues_fops);
> > +	debugfs_create_file("xmit-queues", 0400, eth->debugfs_dir, eth,
> > +			    &airoha_xmit_queues_fops);
> > +
> > +	return 0;
> > +}
> > +
> > +static int airoha_probe(struct platform_device *pdev)
> > +{
> > +	struct device_node *np = pdev->dev.of_node;
> > +	struct net_device *dev;
> > +	struct airoha_eth *eth;
> > +	int err;
> > +
> > +	dev = devm_alloc_etherdev_mqs(&pdev->dev, sizeof(*eth),
> > +				      AIROHA_NUM_TX_RING, AIROHA_NUM_RX_RING);
> > +	if (!dev) {
> > +		dev_err(&pdev->dev, "alloc_etherdev failed\n");
> > +		return -ENOMEM;
> > +	}
> > +
> > +	eth = netdev_priv(dev);
> > +	eth->net_dev = dev;
> > +
> > +	err = dma_set_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(32));
> > +	if (err) {
> > +		dev_err(&pdev->dev, "failed configuring DMA mask\n");
> > +		return err;
> > +	}
> > +
> > +	eth->fe_regs = devm_platform_ioremap_resource_byname(pdev, "fe");
> > +	if (IS_ERR(eth->fe_regs))
> > +		return dev_err_probe(&pdev->dev, PTR_ERR(eth->fe_regs),
> > +				     "failed to iomap fe regs\n");
> > +
> > +	eth->qdma_regs = devm_platform_ioremap_resource_byname(pdev, "qdma0");
> > +	if (IS_ERR(eth->qdma_regs))
> > +		return dev_err_probe(&pdev->dev, PTR_ERR(eth->qdma_regs),
> > +				     "failed to iomap qdma regs\n");
> > +
> > +	eth->rsts[0].id = "fe";
> > +	eth->rsts[1].id = "pdma";
> > +	eth->rsts[2].id = "qdma";
> > +	err = devm_reset_control_bulk_get_exclusive(&pdev->dev,
> > +						    ARRAY_SIZE(eth->rsts),
> > +						    eth->rsts);
> > +	if (err) {
> > +		dev_err(&pdev->dev, "failed to get bulk reset lines\n");
> > +		return err;
> > +	}
> > +
> > +	eth->xsi_rsts[0].id = "xsi-mac";
> > +	eth->xsi_rsts[1].id = "hsi0-mac";
> > +	eth->xsi_rsts[2].id = "hsi1-mac";
> > +	eth->xsi_rsts[3].id = "hsi-mac";
> > +	err = devm_reset_control_bulk_get_exclusive(&pdev->dev,
> > +						    ARRAY_SIZE(eth->xsi_rsts),
> > +						    eth->xsi_rsts);
> > +	if (err) {
> > +		dev_err(&pdev->dev, "failed to get bulk xsi reset lines\n");
> > +		return err;
> > +	}
> > +
> > +	spin_lock_init(&eth->irq_lock);
> > +	eth->irq = platform_get_irq(pdev, 0);
> > +	if (eth->irq < 0) {
> > +		dev_err(&pdev->dev, "failed reading irq line\n");
> > +		return eth->irq;
> > +	}
> > +
> > +	dev->netdev_ops = &airoha_netdev_ops;
> > +	dev->max_mtu = AIROHA_MAX_MTU;
> > +	dev->watchdog_timeo = 5 * HZ;
> > +	dev->hw_features = NETIF_F_IP_CSUM | NETIF_F_RXCSUM |
> > +			   NETIF_F_TSO6 | NETIF_F_IPV6_CSUM |
> > +			   NETIF_F_SG | NETIF_F_TSO;
> > +	dev->features |= dev->hw_features;
> > +	dev->dev.of_node = np;
> > +	dev->irq = eth->irq;
> > +	SET_NETDEV_DEV(dev, &pdev->dev);
> > +
> > +	err = of_get_ethdev_address(np, dev);
> > +	if (err) {
> > +		if (err == -EPROBE_DEFER)
> > +			return err;
> > +
> > +		eth_hw_addr_random(dev);
> > +		dev_err(&pdev->dev, "generated random MAC address %pM\n",
> > +			dev->dev_addr);
> > +	}
> > +
> > +	err = airoha_hw_init(eth);
> > +	if (err)
> > +		return err;
> > +
> > +	airoha_qdma_start_napi(eth);
> > +	err = register_netdev(dev);
> > +	if (err)
> > +		return err;
> > +
> > +	err = airoha_register_debugfs(eth);
> > +	if (err)
> > +		return err;
> > +
> > +	platform_set_drvdata(pdev, eth);
> > +
> > +	return 0;
> > +}
> > +
> > +static void airoha_remove(struct platform_device *pdev)
> > +{
> > +	struct airoha_eth *eth = platform_get_drvdata(pdev);
> > +	int i;
> > +
> > +	debugfs_remove(eth->debugfs_dir);
> > +
> > +	airoha_qdma_for_each_q_rx(eth, i) {
> > +		struct airoha_queue *q = &eth->q_rx[i];
> > +
> > +		netif_napi_del(&q->napi);
> > +		airoha_qdma_clenaup_rx_queue(q);
> > +		page_pool_destroy(q->page_pool);
> > +	}
> > +
> > +	for (i = 0; i < ARRAY_SIZE(eth->q_tx_irq); i++)
> > +		netif_napi_del(&eth->q_tx_irq[i].napi);
> > +	for (i = 0; i < ARRAY_SIZE(eth->q_tx); i++)
> > +		airoha_qdma_clenaup_tx_queue(&eth->q_tx[i]);
> > +}
> > +
> > +const struct of_device_id of_airoha_match[] = {
> > +	{ .compatible = "airoha,en7581-eth" },
> > +	{ /* sentinel */ }
> > +};
> > +
> > +static struct platform_driver airoha_driver = {
> > +	.probe = airoha_probe,
> > +	.remove_new = airoha_remove,
> > +	.driver = {
> > +		.name = KBUILD_MODNAME,
> > +		.of_match_table = of_airoha_match,
> > +	},
> > +};
> > +module_platform_driver(airoha_driver);
> > +
> > +MODULE_LICENSE("GPL");
> > +MODULE_AUTHOR("Lorenzo Bianconi <lorenzo@xxxxxxxxxx>");
> > +MODULE_DESCRIPTION("Ethernet driver for Airoha SoC");
> > diff --git a/drivers/net/ethernet/mediatek/airoha_eth.h b/drivers/net/ethernet/mediatek/airoha_eth.h
> > new file mode 100644
> > index 000000000000..e88fecfac44f
> > --- /dev/null
> > +++ b/drivers/net/ethernet/mediatek/airoha_eth.h
> > @@ -0,0 +1,719 @@
> > +// SPDX-License-Identifier: GPL-2.0
> > +/*
> > + * Copyright (C) 2024 Lorenzo Bianconi <lorenzo@xxxxxxxxxx>
> > + */
> > +
> > +#define AIROHA_MAX_NUM_RSTS		3
> > +#define AIROHA_MAX_NUM_XSI_RSTS		4
> > +#define AIROHA_MAX_MTU			2000
> > +#define AIROHA_MAX_PACKET_SIZE		2048
> > +#define AIROHA_NUM_TX_RING		32
> > +#define AIROHA_NUM_RX_RING		32
> > +#define AIROHA_FE_MC_MAX_VLAN_TABLE	64
> > +#define AIROHA_FE_MC_MAX_VLAN_PORT	16
> > +#define AIROHA_NUM_TX_IRQ		2
> > +#define HW_DSCP_NUM			2048
> > +#define IRQ_QUEUE_LEN(_n)		((_n) ? 1024 : 2048)
> > +#define TX_DSCP_NUM			1024
> > +#define RX_DSCP_NUM(_n)			\
> > +	((_n) ==  2 ? 128 :		\
> > +	 (_n) == 11 ? 128 :		\
> > +	 (_n) == 15 ? 128 :		\
> > +	 (_n) ==  0 ? 1024 : 16)
> > +
> > +/* FE */
> > +#define PSE_BASE			0x0100
> > +#define CSR_IFC_BASE			0x0200
> > +#define CDM1_BASE			0x0400
> > +#define GDM1_BASE			0x0500
> > +#define PPE1_BASE			0x0c00
> > +
> > +#define CDM2_BASE			0x1400
> > +#define GDM2_BASE			0x1500
> > +
> > +#define GDM3_BASE			0x1100
> > +#define GDM4_BASE			0x2400
> > +
> > +#define REG_FE_DMA_GLO_CFG		0x0000
> > +#define FE_DMA_GLO_L2_SPACE_MASK	GENMASK(7, 4)
> > +#define FE_DMA_GLO_PG_SZ_MASK		BIT(3)
> > +
> > +#define REG_FE_RST_GLO_CFG		0x0004
> > +#define FE_RST_GDM4_MBI_ARB_MASK	BIT(3)
> > +#define FE_RST_GDM3_MBI_ARB_MASK	BIT(2)
> > +#define FE_RST_CORE_MASK		BIT(0)
> > +
> > +#define REG_FE_LAN_MAC_H		0x0040
> > +#define REG_FE_LAN_MAC_LMIN		0x0044
> > +#define REG_FE_LAN_MAC_LMAX		0x0048
> > +
> > +#define REG_FE_CDM1_OQ_MAP0		0x0050
> > +#define REG_FE_CDM1_OQ_MAP1		0x0054
> > +#define REG_FE_CDM1_OQ_MAP2		0x0058
> > +#define REG_FE_CDM1_OQ_MAP3		0x005c
> > +
> > +#define REG_FE_PCE_CFG			0x0070
> > +#define PCE_DPI_EN			BIT(2)
> > +#define PCE_KA_EN			BIT(1)
> > +#define PCE_MC_EN			BIT(0)
> > +
> > +#define PSE_PORT0_QUEUE			6
> > +#define PSE_PORT1_QUEUE			6
> > +#define PSE_PORT2_QUEUE			32
> > +#define PSE_PORT3_QUEUE			6
> > +#define PSE_PORT4_QUEUE			4
> > +#define PSE_PORT5_QUEUE			6
> > +#define PSE_PORT6_QUEUE			8
> > +#define PSE_PORT7_QUEUE			10
> > +#define PSE_PORT8_QUEUE			4
> > +#define PSE_PORT9_QUEUE			2
> > +#define PSE_PORT10_QUEUE		2
> > +#define PSE_PORT11_QUEUE		0
> > +#define PSE_PORT12_QUEUE		0
> > +#define PSE_PORT13_QUEUE		0
> > +#define PSE_PORT14_QUEUE		0
> > +#define PSE_PORT15_QUEUE		0
> > +
> > +#define REG_FE_PSE_QUEUE_CFG_WR		0x0080
> > +#define PSE_CFG_PORT_ID_MASK		GENMASK(27, 24)
> > +#define PSE_CFG_QUEUE_ID_MASK		GENMASK(20, 16)
> > +#define PSE_CFG_WR_EN_MASK		BIT(8)
> > +#define PSE_CFG_OQRSV_SEL_MASK		BIT(0)
> > +
> > +#define REG_FE_PSE_QUEUE_CFG_VAL	0x0084
> > +#define PSE_CFG_OQ_RSV_MASK		GENMASK(13, 0)
> > +
> > +#define PSE_FQ_CFG			0x008c
> > +#define PSE_FQ_LIMIT_MASK		GENMASK(14, 0)
> > +
> > +#define REG_FE_PSE_BUF_SET		0x0090
> > +#define PSE_SHARE_USED_LTHD_MASK	GENMASK(31, 16)
> > +#define PSE_ALLRSV_MASK			GENMASK(14, 0)
> > +
> > +#define REG_PSE_SHARE_USED_THD		0x0094
> > +#define PSE_SHARE_USED_MTHD_MASK	GENMASK(31, 16)
> > +#define PSE_SHARE_USED_HTHD_MASK	GENMASK(15, 0)
> > +
> > +#define REG_GDM_MISC_CFG		0x0148
> > +#define GDM2_RDM_ACK_WAIT_PREF_MASK	BIT(9)
> > +#define GDM2_CHN_VLD_MODE_MASK		BIT(5)
> > +
> > +#define REG_FE_CSR_IFC_CFG		CSR_IFC_BASE
> > +#define FE_IFC_EN_MASK			BIT(0)
> > +
> > +#define REG_FE_VIP_PORT_EN		0x01f0
> > +#define REG_FE_IFC_PORT_EN		0x01f4
> > +
> > +#define REG_PSE_IQ_REV1			(PSE_BASE + 0x08)
> > +#define PSE_IQ_RES1_P2_MASK		GENMASK(23, 16)
> > +
> > +#define REG_PSE_IQ_REV2			(PSE_BASE + 0x0c)
> > +#define PSE_IQ_RES2_P5_MASK		GENMASK(15, 8)
> > +#define PSE_IQ_RES2_P4_MASK		GENMASK(7, 0)
> > +
> > +#define REG_FE_VIP_EN(_n)		(0x0300 + ((_n) << 3))
> > +#define PATN_FCPU_EN_MASK		BIT(7)
> > +#define PATN_SWP_EN_MASK		BIT(6)
> > +#define PATN_DP_EN_MASK			BIT(5)
> > +#define PATN_SP_EN_MASK			BIT(4)
> > +#define PATN_TYPE_MASK			GENMASK(3, 1)
> > +#define PATN_EN_MASK			BIT(0)
> > +
> > +#define REG_FE_VIP_PATN(_n)		(0x0304 + ((_n) << 3))
> > +#define PATN_DP_MASK			GENMASK(31, 16)
> > +#define PATN_SP_MASK			GENMASK(15, 0)
> > +
> > +#define REG_CDM1_VLAN_CTRL		CDM1_BASE
> > +#define CDM1_VLAN_MASK			GENMASK(31, 16)
> > +
> > +#define REG_CDM1_FWD_CFG		(CDM1_BASE + 0x08)
> > +#define CDM1_VIP_QSEL_MASK		GENMASK(24, 20)
> > +
> > +#define REG_CDM1_CRSN_QSEL(_n)		(CDM1_BASE + 0x10 + ((_n) << 2))
> > +#define CDM1_CRSN_QSEL_REASON_MASK(_n)	\
> > +	GENMASK(4 + (((_n) % 4) << 3), (((_n) % 4 ) << 3))
> > +
> > +#define REG_CDM2_FWD_CFG		(CDM2_BASE + 0x08)
> > +#define CDM2_OAM_QSEL_MASK		GENMASK(31, 27)
> > +#define CDM2_VIP_QSEL_MASK		GENMASK(24, 20)
> > +
> > +#define REG_CDM2_CRSN_QSEL(_n)		(CDM2_BASE + 0x10 + ((_n) << 2))
> > +#define CDM2_CRSN_QSEL_REASON_MASK(_n)	\
> > +	GENMASK(4 + (((_n) % 4) << 3), (((_n) % 4 ) << 3))
> > +
> > +#define REG_GDM1_FWD_CFG		GDM1_BASE
> > +#define GDM1_DROP_CRC_ERR		BIT(23)
> > +#define GDM1_IP4_CKSUM			BIT(22)
> > +#define GDM1_TCP_CKSUM			BIT(21)
> > +#define GDM1_UDP_CKSUM			BIT(20)
> > +#define GDM1_UCFQ_MASK			GENMASK(15, 12)
> > +#define GDM1_BCFQ_MASK			GENMASK(11, 8)
> > +#define GDM1_MCFQ_MASK			GENMASK(7, 4)
> > +#define GDM1_OCFQ_MASK			GENMASK(3, 0)
> > +
> > +#define REG_GDM1_INGRESS_CFG		(GDM1_BASE + 0x10)
> > +#define GDM1_INGRESS_FC_EN_MASK		BIT(1)
> > +#define GDM1_STAG_EN_MASK		BIT(0)
> > +
> > +#define REG_GDM1_LEN_CFG		(GDM1_BASE + 0x14)
> > +#define GDM1_SHORT_LEN_MASK		GENMASK(13, 0)
> > +#define GDM1_LONG_LEN_MASK		GENMASK(29, 16)
> > +
> > +#define REG_FE_CPORT_CFG		(GDM1_BASE + 0x40)
> > +#define FE_CPORT_PAD			BIT(26)
> > +#define FE_CPORT_PORT_XFC_MASK		BIT(25)
> > +#define FE_CPORT_QUEUE_XFC_MASK		BIT(24)
> > +
> > +#define REG_PPE1_TB_HASH_CFG		(PPE1_BASE + 0x250)
> > +#define PPE1_SRAM_TABLE_EN_MASK		BIT(0)
> > +#define PPE1_SRAM_HASH1_EN_MASK		BIT(8)
> > +#define PPE1_DRAM_TABLE_EN_MASK		BIT(16)
> > +#define PPE1_DRAM_HASH1_EN_MASK		BIT(24)
> > +
> > +#define REG_GDM2_CHN_RLS		(GDM2_BASE + 0x20)
> > +#define MBI_RX_AGE_SEL_MASK		GENMASK(18, 17)
> > +#define MBI_TX_AGE_SEL_MASK		GENMASK(18, 17)
> > +
> > +#define REG_GDM3_FWD_CFG		GDM3_BASE
> > +#define GDM3_PAD_EN_MASK		BIT(28)
> > +
> > +#define REG_GDM4_FWD_CFG		(GDM4_BASE + 0x100)
> > +#define GDM4_PAD_EN_MASK		BIT(28)
> > +#define GDM4_SPORT_OFFSET0_MASK		GENMASK(11, 8)
> > +
> > +#define REG_GDM4_SRC_PORT_SET		(GDM4_BASE + 0x33c)
> > +#define GDM4_SPORT_OFF2_MASK		GENMASK(19, 16)
> > +#define GDM4_SPORT_OFF1_MASK		GENMASK(15, 12)
> > +#define GDM4_SPORT_OFF0_MASK		GENMASK(11, 8)
> > +
> > +#define REG_IP_FRAG_FP			0x2010
> > +#define IP_ASSEMBLE_PORT_MASK		GENMASK(24, 21)
> > +#define IP_ASSEMBLE_NBQ_MASK		GENMASK(20, 16)
> > +#define IP_FRAGMENT_PORT_MASK		GENMASK(8, 5)
> > +#define IP_FRAGMENT_NBQ_MASK		GENMASK(4, 0)
> > +
> > +#define REG_MC_VLAN_EN			0x2100
> > +#define MC_VLAN_EN_MASK			BIT(0)
> > +
> > +#define REG_MC_VLAN_CFG			0x2104
> > +#define MC_VLAN_CFG_CMD_DONE_MASK	BIT(31)
> > +#define MC_VLAN_CFG_TABLE_ID_MASK	GENMASK(21, 16)
> > +#define MC_VLAN_CFG_PORT_ID_MASK	GENMASK(11, 8)
> > +#define MC_VLAN_CFG_TABLE_SEL_MASK	BIT(4)
> > +#define MC_VLAN_CFG_RW_MASK		BIT(0)
> > +
> > +#define REG_MC_VLAN_DATA		0x2108
> > +
> > +#define REG_CDM5_RX_OQ1_DROP_CNT	0x29d4
> > +
> > +/* QDMA */
> > +#define REG_QDMA_GLOBAL_CFG		0x0004
> > +#define GLOBAL_CFG_RX_2B_OFFSET		BIT(31)
> > +#define GLOBAL_CFG_DMA_PREFERENCE_MASK	GENMASK(30, 29)
> > +#define GLOBAL_CFG_CPU_TXR_ROUND_ROBIN	BIT(28)
> > +#define GLOBAL_CFG_DSCP_BYTE_SWAP	BIT(27)
> > +#define GLOBAL_CFG_PAYLOAD_BYTE_SWAP	BIT(26)
> > +#define GLOBAL_CFG_MULTICAST_MODIFY_FP	BIT(25)
> > +#define GLOBAL_CFG_OAM_MODIFY_MASK	BIT(24)
> > +#define GLOBAL_CFG_RESET_MASK		BIT(23)
> > +#define GLOBAL_CFG_RESET_DONE_MASK	BIT(22)
> > +#define GLOBAL_CFG_MULTICAST_EN_MASK	BIT(21)
> > +#define GLOBAL_CFG_IRQ1_EN		BIT(20)
> > +#define GLOBAL_CFG_IRQ0_EN		BIT(19)
> > +#define GLOBAL_CFG_LOOPCNT_EN		BIT(18)
> > +#define GLOBAL_CFG_RD_BYPASS_WR		BIT(17)
> > +#define GLOBAL_CFG_QDMA_LOOPBACK	BIT(16)
> > +#define GLOBAL_CFG_LPBK_RXQ_SEL_MASK	GENMASK(13, 8)
> > +#define GLOBAL_CFG_CHECK_DONE		BIT(7)
> > +#define GLOBAL_CFG_TX_WB_DONE		BIT(6)
> > +#define GLOBAL_CFG_MAX_ISSUE_NUM_MASK	GENMASK(5, 4)
> > +#define GLOBAL_CFG_RX_DMA_BUSY		BIT(3)
> > +#define GLOBAL_CFG_RX_DMA_EN		BIT(2)
> > +#define GLOBAL_CFG_TX_DMA_BUSY		BIT(1)
> > +#define GLOBAL_CFG_TX_DMA_EN		BIT(0)
> > +
> > +#define REG_FWD_DSCP_BASE		0x0010
> > +#define REG_FWD_BUF_BASE		0x0014
> > +
> > +#define REG_HW_FWD_DSCP_CFG			0x0018
> > +#define HW_FWD_DSCP_PAYLOAD_SIZE_MASK		GENMASK(29, 28)
> > +#define HW_FWD_DSCP_SCATTER_LEN_MASK		GENMASK(17, 16)
> > +#define HW_FWD_DSCP_MIN_SCATTER_LEN_MASK	GENMASK(15, 0)
> > +
> > +#define REG_INT_STATUS(_n)		\
> > +	(((_n) == 4) ? 0x0730 :		\
> > +	 ((_n) == 3) ? 0x0724 :		\
> > +	 ((_n) == 2) ? 0x0720 :		\
> > +	 ((_n) == 1) ? 0x0024 : 0x0020)
> > +
> > +#define REG_INT_ENABLE(_n)		\
> > +	(((_n) == 4) ? 0x0750 :		\
> > +	 ((_n) == 3) ? 0x0744 :		\
> > +	 ((_n) == 2) ? 0x0740 :		\
> > +	 ((_n) == 1) ? 0x002c : 0x0028)
> > +
> > +/* QDMA_CSR_INT_ENABLE1 */
> > +#define RX15_COHERENT_INT_MASK		BIT(31)
> > +#define RX14_COHERENT_INT_MASK		BIT(30)
> > +#define RX13_COHERENT_INT_MASK		BIT(29)
> > +#define RX12_COHERENT_INT_MASK		BIT(28)
> > +#define RX11_COHERENT_INT_MASK		BIT(27)
> > +#define RX10_COHERENT_INT_MASK		BIT(26)
> > +#define RX9_COHERENT_INT_MASK		BIT(25)
> > +#define RX8_COHERENT_INT_MASK		BIT(24)
> > +#define RX7_COHERENT_INT_MASK		BIT(23)
> > +#define RX6_COHERENT_INT_MASK		BIT(22)
> > +#define RX5_COHERENT_INT_MASK		BIT(21)
> > +#define RX4_COHERENT_INT_MASK		BIT(20)
> > +#define RX3_COHERENT_INT_MASK		BIT(19)
> > +#define RX2_COHERENT_INT_MASK		BIT(18)
> > +#define RX1_COHERENT_INT_MASK		BIT(17)
> > +#define RX0_COHERENT_INT_MASK		BIT(16)
> > +#define TX7_COHERENT_INT_MASK		BIT(15)
> > +#define TX6_COHERENT_INT_MASK		BIT(14)
> > +#define TX5_COHERENT_INT_MASK		BIT(13)
> > +#define TX4_COHERENT_INT_MASK		BIT(12)
> > +#define TX3_COHERENT_INT_MASK		BIT(11)
> > +#define TX2_COHERENT_INT_MASK		BIT(10)
> > +#define TX1_COHERENT_INT_MASK		BIT(9)
> > +#define TX0_COHERENT_INT_MASK		BIT(8)
> > +#define CNT_OVER_FLOW_INT_MASK		BIT(7)
> > +#define IRQ1_FULL_INT_MASK		BIT(5)
> > +#define IRQ1_INT_MASK			BIT(4)
> > +#define HWFWD_DSCP_LOW_INT_MASK		BIT(3)
> > +#define HWFWD_DSCP_EMPTY_INT_MASK	BIT(2)
> > +#define IRQ0_FULL_INT_MASK		BIT(1)
> > +#define IRQ0_INT_MASK			BIT(0)
> > +
> > +#define TX_DONE_INT_MASK(_n)					\
> > +	((_n) ? IRQ1_INT_MASK | IRQ1_FULL_INT_MASK		\
> > +	      : IRQ0_INT_MASK | IRQ0_FULL_INT_MASK)
> > +
> > +#define INT_TX_MASK						\
> > +	(IRQ1_INT_MASK | IRQ1_FULL_INT_MASK |			\
> > +	 IRQ0_INT_MASK | IRQ0_FULL_INT_MASK)
> > +
> > +#define INT_IDX0_MASK						\
> > +	(TX0_COHERENT_INT_MASK | TX1_COHERENT_INT_MASK |	\
> > +	 TX2_COHERENT_INT_MASK | TX3_COHERENT_INT_MASK |	\
> > +	 TX4_COHERENT_INT_MASK | TX5_COHERENT_INT_MASK |	\
> > +	 TX6_COHERENT_INT_MASK | TX7_COHERENT_INT_MASK |	\
> > +	 RX0_COHERENT_INT_MASK | RX1_COHERENT_INT_MASK |	\
> > +	 RX2_COHERENT_INT_MASK | RX3_COHERENT_INT_MASK |	\
> > +	 RX4_COHERENT_INT_MASK | RX7_COHERENT_INT_MASK |	\
> > +	 RX8_COHERENT_INT_MASK | RX9_COHERENT_INT_MASK |	\
> > +	 RX15_COHERENT_INT_MASK | INT_TX_MASK)
> > +
> > +/* QDMA_CSR_INT_ENABLE2 */
> > +#define RX15_NO_CPU_DSCP_INT_MASK	BIT(31)
> > +#define RX14_NO_CPU_DSCP_INT_MASK	BIT(30)
> > +#define RX13_NO_CPU_DSCP_INT_MASK	BIT(29)
> > +#define RX12_NO_CPU_DSCP_INT_MASK	BIT(28)
> > +#define RX11_NO_CPU_DSCP_INT_MASK	BIT(27)
> > +#define RX10_NO_CPU_DSCP_INT_MASK	BIT(26)
> > +#define RX9_NO_CPU_DSCP_INT_MASK	BIT(25)
> > +#define RX8_NO_CPU_DSCP_INT_MASK	BIT(24)
> > +#define RX7_NO_CPU_DSCP_INT_MASK	BIT(23)
> > +#define RX6_NO_CPU_DSCP_INT_MASK	BIT(22)
> > +#define RX5_NO_CPU_DSCP_INT_MASK	BIT(21)
> > +#define RX4_NO_CPU_DSCP_INT_MASK	BIT(20)
> > +#define RX3_NO_CPU_DSCP_INT_MASK	BIT(19)
> > +#define RX2_NO_CPU_DSCP_INT_MASK	BIT(18)
> > +#define RX1_NO_CPU_DSCP_INT_MASK	BIT(17)
> > +#define RX0_NO_CPU_DSCP_INT_MASK	BIT(16)
> > +#define RX15_DONE_INT_MASK		BIT(15)
> > +#define RX14_DONE_INT_MASK		BIT(14)
> > +#define RX13_DONE_INT_MASK		BIT(13)
> > +#define RX12_DONE_INT_MASK		BIT(12)
> > +#define RX11_DONE_INT_MASK		BIT(11)
> > +#define RX10_DONE_INT_MASK		BIT(10)
> > +#define RX9_DONE_INT_MASK		BIT(9)
> > +#define RX8_DONE_INT_MASK		BIT(8)
> > +#define RX7_DONE_INT_MASK		BIT(7)
> > +#define RX6_DONE_INT_MASK		BIT(6)
> > +#define RX5_DONE_INT_MASK		BIT(5)
> > +#define RX4_DONE_INT_MASK		BIT(4)
> > +#define RX3_DONE_INT_MASK		BIT(3)
> > +#define RX2_DONE_INT_MASK		BIT(2)
> > +#define RX1_DONE_INT_MASK		BIT(1)
> > +#define RX0_DONE_INT_MASK		BIT(0)
> > +
> > +#define RX_DONE_INT_MASK					\
> > +	(RX0_DONE_INT_MASK | RX1_DONE_INT_MASK |		\
> > +	 RX2_DONE_INT_MASK | RX3_DONE_INT_MASK |		\
> > +	 RX4_DONE_INT_MASK | RX7_DONE_INT_MASK |		\
> > +	 RX8_DONE_INT_MASK | RX9_DONE_INT_MASK |		\
> > +	 RX15_DONE_INT_MASK)
> > +#define INT_IDX1_MASK						\
> > +	(RX_DONE_INT_MASK |					\
> > +	 RX0_NO_CPU_DSCP_INT_MASK | RX1_NO_CPU_DSCP_INT_MASK |	\
> > +	 RX2_NO_CPU_DSCP_INT_MASK | RX3_NO_CPU_DSCP_INT_MASK |	\
> > +	 RX4_NO_CPU_DSCP_INT_MASK | RX7_NO_CPU_DSCP_INT_MASK |	\
> > +	 RX8_NO_CPU_DSCP_INT_MASK | RX9_NO_CPU_DSCP_INT_MASK |	\
> > +	 RX15_NO_CPU_DSCP_INT_MASK)
> > +
> > +/* QDMA_CSR_INT_ENABLE5 */
> > +#define TX31_COHERENT_INT_MASK		BIT(31)
> > +#define TX30_COHERENT_INT_MASK		BIT(30)
> > +#define TX29_COHERENT_INT_MASK		BIT(29)
> > +#define TX28_COHERENT_INT_MASK		BIT(28)
> > +#define TX27_COHERENT_INT_MASK		BIT(27)
> > +#define TX26_COHERENT_INT_MASK		BIT(26)
> > +#define TX25_COHERENT_INT_MASK		BIT(25)
> > +#define TX24_COHERENT_INT_MASK		BIT(24)
> > +#define TX23_COHERENT_INT_MASK		BIT(23)
> > +#define TX22_COHERENT_INT_MASK		BIT(22)
> > +#define TX21_COHERENT_INT_MASK		BIT(21)
> > +#define TX20_COHERENT_INT_MASK		BIT(20)
> > +#define TX19_COHERENT_INT_MASK		BIT(19)
> > +#define TX18_COHERENT_INT_MASK		BIT(18)
> > +#define TX17_COHERENT_INT_MASK		BIT(17)
> > +#define TX16_COHERENT_INT_MASK		BIT(16)
> > +#define TX15_COHERENT_INT_MASK		BIT(15)
> > +#define TX14_COHERENT_INT_MASK		BIT(14)
> > +#define TX13_COHERENT_INT_MASK		BIT(13)
> > +#define TX12_COHERENT_INT_MASK		BIT(12)
> > +#define TX11_COHERENT_INT_MASK		BIT(11)
> > +#define TX10_COHERENT_INT_MASK		BIT(10)
> > +#define TX9_COHERENT_INT_MASK		BIT(9)
> > +#define TX8_COHERENT_INT_MASK		BIT(8)
> > +
> > +#define INT_IDX4_MASK						\
> > +	(TX8_COHERENT_INT_MASK | TX9_COHERENT_INT_MASK |	\
> > +	 TX10_COHERENT_INT_MASK | TX11_COHERENT_INT_MASK |	\
> > +	 TX12_COHERENT_INT_MASK | TX13_COHERENT_INT_MASK |	\
> > +	 TX14_COHERENT_INT_MASK | TX15_COHERENT_INT_MASK |	\
> > +	 TX16_COHERENT_INT_MASK | TX17_COHERENT_INT_MASK |	\
> > +	 TX18_COHERENT_INT_MASK | TX19_COHERENT_INT_MASK |	\
> > +	 TX20_COHERENT_INT_MASK | TX21_COHERENT_INT_MASK |	\
> > +	 TX20_COHERENT_INT_MASK | TX21_COHERENT_INT_MASK |	\
> > +	 TX22_COHERENT_INT_MASK | TX23_COHERENT_INT_MASK |	\
> > +	 TX24_COHERENT_INT_MASK | TX25_COHERENT_INT_MASK |	\
> > +	 TX26_COHERENT_INT_MASK | TX27_COHERENT_INT_MASK |	\
> > +	 TX28_COHERENT_INT_MASK | TX29_COHERENT_INT_MASK |	\
> > +	 TX30_COHERENT_INT_MASK | TX31_COHERENT_INT_MASK)
> > +
> > +#define REG_TX_IRQ_BASE(_n)		((_n) ? 0x0048 : 0x0050)
> > +
> > +#define REG_TX_IRQ_CFG(_n)		((_n) ? 0x004c : 0x0054)
> > +#define TX_IRQ_THR_MASK			GENMASK(27, 16)
> > +#define TX_IRQ_DEPTH_MASK		GENMASK(11, 0)
> > +
> > +#define REG_IRQ_CLEAR_LEN(_n)		((_n) ? 0x0064 : 0x0058)
> > +#define IRQ_CLEAR_LEN_MASK		GENMASK(7, 0)
> > +
> > +#define REG_IRQ_STATUS(_n)		((_n) ? 0x0068 : 0x005c)
> > +#define IRQ_ENTRY_LEN_MASK		GENMASK(27, 16)
> > +#define IRQ_HEAD_IDX_MASK		GENMASK(11, 0)
> > +
> > +#define REG_TX_RING_BASE(_n)	\
> > +	(((_n) < 8) ? 0x0100 + ((_n) << 5) : 0x0b00 + (((_n) - 8) << 5))
> > +
> > +#define REG_TX_RING_BLOCKING(_n)	\
> > +	(((_n) < 8) ? 0x0104 + ((_n) << 5) : 0x0b04 + (((_n) - 8) << 5))
> > +
> > +#define TX_RING_IRQ_BLOCKING_MAP_MASK			BIT(6)
> > +#define TX_RING_IRQ_BLOCKING_CFG_MASK			BIT(4)
> > +#define TX_RING_IRQ_BLOCKING_TX_DROP_EN_MASK		BIT(2)
> > +#define TX_RING_IRQ_BLOCKING_MAX_TH_TXRING_EN_MASK	BIT(1)
> > +#define TX_RING_IRQ_BLOCKING_MIN_TH_TXRING_EN_MASK	BIT(0)
> > +
> > +#define REG_TX_CPU_IDX(_n)	\
> > +	(((_n) < 8) ? 0x0108 + ((_n) << 5) : 0x0b08 + (((_n) - 8) << 5))
> > +
> > +#define TX_RING_CPU_IDX_MASK		GENMASK(15, 0)
> > +
> > +#define REG_TX_DMA_IDX(_n)	\
> > +	(((_n) < 8) ? 0x010c + ((_n) << 5) : 0x0b0c + (((_n) - 8) << 5))
> > +
> > +#define TX_RING_DMA_IDX_MASK		GENMASK(15, 0)
> > +
> > +#define IRQ_RING_IDX_MASK		GENMASK(20, 16)
> > +#define IRQ_DESC_IDX_MASK		GENMASK(15, 0)
> > +
> > +#define REG_RX_RING_BASE(_n)	\
> > +	(((_n) < 16) ? 0x0200 + ((_n) << 5) : 0x0e00 + (((_n) - 16) << 5))
> > +
> > +#define REG_RX_RING_SIZE(_n)	\
> > +	(((_n) < 16) ? 0x0204 + ((_n) << 5) : 0x0e04 + (((_n) - 16) << 5))
> > +
> > +#define RX_RING_THR_MASK		GENMASK(31, 16)
> > +#define RX_RING_SIZE_MASK		GENMASK(15, 0)
> > +
> > +#define REG_RX_CPU_IDX(_n)	\
> > +	(((_n) < 16) ? 0x0208 + ((_n) << 5) : 0x0e08 + (((_n) - 16) << 5))
> > +
> > +#define RX_RING_CPU_IDX_MASK		GENMASK(15, 0)
> > +
> > +#define REG_RX_DMA_IDX(_n)	\
> > +	(((_n) < 16) ? 0x020c + ((_n) << 5) : 0x0e0c + (((_n) - 16) << 5))
> > +
> > +#define REG_RX_DELAY_INT_IDX(_n)	\
> > +	(((_n) < 16) ? 0x0210 + ((_n) << 5) : 0x0e10 + (((_n) - 16) << 5))
> > +
> > +#define RX_DELAY_INT_MASK		GENMASK(15, 0)
> > +
> > +#define RX_RING_DMA_IDX_MASK		GENMASK(15, 0)
> > +
> > +#define REG_INGRESS_TRTCM_CFG		0x0070
> > +#define INGRESS_TRTCM_EN_MASK		BIT(31)
> > +#define INGRESS_TRTCM_MODE_MASK		BIT(30)
> > +#define INGRESS_SLOW_TICK_RATIO_MASK	GENMASK(29, 16)
> > +#define INGRESS_FAST_TICK_MASK		GENMASK(15, 0)
> > +
> > +#define REG_TXQ_DIS_CFG_BASE(_n)	((_n) ? 0x20a0 : 0x00a0)
> > +#define REG_TXQ_DIS_CFG(_n, _m)		(REG_TXQ_DIS_CFG_BASE((_n)) + (_m) << 2)
> > +
> > +#define REG_LMGR_INIT_CFG		0x1000
> > +#define LMGR_INIT_START			BIT(31)
> > +#define LMGR_SRAM_MODE_MASK		BIT(30)
> > +#define HW_FWD_PKTSIZE_OVERHEAD_MASK	GENMASK(27, 20)
> > +#define HW_FWD_DESC_NUM_MASK		GENMASK(16, 0)
> > +
> > +#define REG_FWD_DSCP_LOW_THR		0x1004
> > +#define FWD_DSCP_LOW_THR_MASK		GENMASK(17, 0)
> > +
> > +#define REG_EGRESS_RATE_METER_CFG		0x100c
> > +#define EGRESS_RATE_METER_EN_MASK		BIT(29)
> > +#define EGRESS_RATE_METER_EQ_RATE_EN_MASK	BIT(17)
> > +#define EGRESS_RATE_METER_WINDOW_SZ_MASK	GENMASK(16, 12)
> > +#define EGRESS_RATE_METER_TIMESLICE_MASK	GENMASK(10, 0)
> > +
> > +#define REG_EGRESS_TRTCM_CFG		0x1010
> > +#define EGRESS_TRTCM_EN_MASK		BIT(31)
> > +#define EGRESS_TRTCM_MODE_MASK		BIT(30)
> > +#define EGRESS_SLOW_TICK_RATIO_MASK	GENMASK(29, 16)
> > +#define EGRESS_FAST_TICK_MASK		GENMASK(15, 0)
> > +
> > +#define REG_TXWRR_MODE_CFG		0x1020
> > +#define TWRR_WEIGHT_SCALE_MASK		BIT(31)
> > +#define TWRR_WEIGHT_BASE_MASK		BIT(3)
> > +
> > +#define REG_PSE_BUF_USAGE_CFG		0x1028
> > +#define PSE_BUF_ESTIMATE_EN_MASK	BIT(29)
> > +
> > +#define REG_GLB_TRTCM_CFG		0x1080
> > +#define GLB_TRTCM_EN_MASK		BIT(31)
> > +#define GLB_TRTCM_MODE_MASK		BIT(30)
> > +#define GLB_SLOW_TICK_RATIO_MASK	GENMASK(29, 16)
> > +#define GLB_FAST_TICK_MASK		GENMASK(15, 0)
> > +
> > +#define REG_TXQ_CNGST_CFG		0x10a0
> > +#define TXQ_CNGST_DROP_EN		BIT(31)
> > +#define TXQ_CNGST_DEI_DROP_EN		BIT(30)
> > +
> > +#define REG_SLA_TRTCM_CFG		0x1150
> > +#define SLA_TRTCM_EN_MASK		BIT(31)
> > +#define SLA_TRTCM_MODE_MASK		BIT(30)
> > +#define SLA_SLOW_TICK_RATIO_MASK	GENMASK(29, 16)
> > +#define SLA_FAST_TICK_MASK		GENMASK(15, 0)
> > +
> > +/* CTRL */
> > +#define QDMA_DESC_DONE_MASK		BIT(31)
> > +#define QDMA_DESC_DROP_MASK		BIT(30) /* tx: drop pkt - rx: overflow */
> > +#define QDMA_DESC_MORE_MASK		BIT(29) /* more SG elements */
> > +#define QDMA_DESC_DEI_MASK		BIT(25)
> > +#define QDMA_DESC_NO_DROP_MASK		BIT(24)
> > +#define QDMA_DESC_LEN_MASK		GENMASK(15, 0)
> > +/* DATA */
> > +#define QDMA_DESC_NEXT_ID_MASK		GENMASK(15, 0)
> > +/* MSG0 */
> > +#define QDMA_ETH_TXMSG_MIC_IDX_MASK	BIT(30)
> > +#define QDMA_ETH_TXMSG_SP_TAG_MASK	GENMASK(29, 14)
> > +#define QDMA_ETH_TXMSG_ICO_MASK		BIT(13)
> > +#define QDMA_ETH_TXMSG_UCO_MASK		BIT(12)
> > +#define QDMA_ETH_TXMSG_TCO_MASK		BIT(11)
> > +#define QDMA_ETH_TXMSG_TSO_MASK		BIT(10)
> > +#define QDMA_ETH_TXMSG_FAST_MASK	BIT(9)
> > +#define QDMA_ETH_TXMSG_OAM_MASK		BIT(8)
> > +#define QDMA_ETH_TXMSG_CHAN_MASK	GENMASK(7, 3)
> > +#define QDMA_ETH_TXMSG_QUEUE_MASK	GENMASK(2, 0)
> > +/* MSG1 */
> > +#define QDMA_ETH_TXMSG_NO_DROP		BIT(31)
> > +#define QDMA_ETH_TXMSG_METER_MASK	GENMASK(30, 24)	/* 0x7f means do not apply meters */
> > +#define QDMA_ETH_TXMSG_FPORT_MASK	GENMASK(23, 20)
> > +#define QDMA_ETH_TXMSG_NBOQ_MASK	GENMASK(19, 15)
> > +#define QDMA_ETH_TXMSG_HWF_MASK		BIT(14)
> > +#define QDMA_ETH_TXMSG_HOP_MASK		BIT(13)
> > +#define QDMA_ETH_TXMSG_PTP_MASK		BIT(12)
> > +#define QDMA_ETH_TXMSG_ACNT_G1_MASK	GENMASK(10, 6)	/* 0x1f means do not count */
> > +#define QDMA_ETH_TXMSG_ACNT_G0_MASK	GENMASK(5, 0)	/* 0x3f means do not count */
> > +
> > +struct airoha_qdma_desc {
> > +	__le32 rsv;
> > +	__le32 ctrl;
> > +	__le32 addr;
> > +	__le32 data;
> > +	__le32 msg0;
> > +	__le32 msg1;
> > +	__le32 msg2;
> > +	__le32 msg3;
> > +};
> > +
> > +/* CTRL0 */
> > +#define QDMA_FWD_DESC_CTX_MASK		BIT(31)
> > +#define QDMA_FWD_DESC_RING_MASK		GENMASK(30, 28)
> > +#define QDMA_FWD_DESC_IDX_MASK		GENMASK(27, 16)
> > +#define QDMA_FWD_DESC_LEN_MASK		GENMASK(15, 0)
> > +/* CTRL1 */
> > +#define QDMA_FWD_DESC_FIRST_IDX_MASK	GENMASK(15, 0)
> > +/* CTRL2 */
> > +#define QDMA_FWD_DESC_MORE_PKT_NUM_MASK	GENMASK(2, 0)
> > +
> > +struct airoha_qdma_fwd_desc {
> > +	__le32 addr;
> > +	__le32 ctrl0;
> > +	__le32 ctrl1;
> > +	__le32 ctrl2;
> > +	__le32 msg0;
> > +	__le32 msg1;
> > +	__le32 rsv0;
> > +	__le32 rsv1;
> > +};
> > +
> > +enum {
> > +	QDMA_INT_REG_IDX0,
> > +	QDMA_INT_REG_IDX1,
> > +	QDMA_INT_REG_IDX2,
> > +	QDMA_INT_REG_IDX3,
> > +	QDMA_INT_REG_IDX4,
> > +	QDMA_INT_REG_MAX
> > +};
> > +
> > +enum airoha_dport {
> > +	DPORT_PDMA,
> > +	DPORT_GDM1,
> > +	DPORT_GDM2,
> > +	DPORT_GDM3,
> > +	DPORT_PPE,
> > +	DPORT_QDMA,
> > +	DPORT_QDMA_HW,
> > +	DPORT_DISCARD,
> > +	DPORT_GDM4 = 9,
> > +};
> > +
> > +enum {
> > +	FE_DP_CPU,
> > +	FE_DP_GDM1,
> > +	FE_DP_GDM2,
> > +	FE_DP_QDMA1_HWF,
> > +	FE_DP_GDMA3_HWF = 3,
> > +	FE_DP_PPE,
> > +	FE_DP_QDMA2_CPU,
> > +	FE_DP_QDMA2_HWF,
> > +	FE_DP_DISCARD,
> > +	FE_DP_PPE2 = 8,
> > +	FE_DP_DROP = 15,
> > +};
> > +
> > +enum {
> > +	CDM_CRSN_QSEL_Q1 = 1,
> > +	CDM_CRSN_QSEL_Q5 = 5,
> > +	CDM_CRSN_QSEL_Q6 = 6,
> > +	CDM_CRSN_QSEL_Q15 = 15,
> > +};
> > +
> > +enum {
> > +	CRSN_08 = 0x8,
> > +	CRSN_21 = 0x15, /* KA */
> > +	CRSN_22 = 0x16, /* hit bind and force route to CPU */
> > +	CRSN_24 = 0x18,
> > +	CRSN_25 = 0x19,
> > +};
> > +
> > +enum {
> > +	DEV_STATE_INITIALIZED,
> > +};
> > +
> > +struct airoha_queue_entry {
> > +	union {
> > +		void *buf;
> > +		struct sk_buff *skb;
> > +	};
> > +	dma_addr_t dma_addr;
> > +	u16 dma_len;
> > +};
> > +
> > +struct airoha_queue {
> > +	struct airoha_eth *eth;
> > +
> > +	spinlock_t lock;
> > +	struct airoha_queue_entry *entry;
> > +	struct airoha_qdma_desc *desc;
> > +	u16 head;
> > +	u16 tail;
> > +
> > +	int queued;
> > +	int ndesc;
> > +	int free_thr;
> > +	int buf_size;
> > +
> > +	struct napi_struct napi;
> > +	struct page_pool *page_pool;
> > +};
> > +
> > +struct airoha_tx_irq_queue {
> > +	struct airoha_eth *eth;
> > +
> > +	struct napi_struct napi;
> > +	u32 *q;
> > +
> > +	int size;
> > +	int queued;
> > +	u16 head;
> > +};
> > +
> > +struct airoha_eth {
> > +	struct net_device *net_dev;
> > +
> > +	unsigned long state;
> > +
> > +	void __iomem *qdma_regs;
> > +	void __iomem *fe_regs;
> > +
> > +	spinlock_t irq_lock;
> > +	u32 irqmask[QDMA_INT_REG_MAX];
> > +	int irq;
> > +
> > +	struct reset_control_bulk_data rsts[AIROHA_MAX_NUM_RSTS];
> > +	struct reset_control_bulk_data xsi_rsts[AIROHA_MAX_NUM_XSI_RSTS];
> > +
> > +	struct airoha_queue q_tx[AIROHA_NUM_TX_RING];
> > +	struct airoha_queue q_rx[AIROHA_NUM_RX_RING];
> > +
> > +	struct airoha_tx_irq_queue q_tx_irq[AIROHA_NUM_TX_IRQ];
> > +
> > +	/* descriptor and packet buffers for qdma hw forward */
> > +	struct {
> > +		void *desc;
> > +		void *q;
> > +	} hfwd;
> > +
> > +	struct dentry *debugfs_dir;
> > +};
> > +
> > +#define airoha_qdma_for_each_q_rx(eth, i)		\
> > +	for (i = 0; i < ARRAY_SIZE((eth)->q_rx); i++)	\
> > +		if ((eth)->q_rx[i].ndesc)
> > +
> > +static inline void airoha_qdma_start_napi(struct airoha_eth *eth)
> > +{
> > +	int i;
> > +
> > +	for (i = 0; i < ARRAY_SIZE(eth->q_tx_irq); i++)
> > +		napi_enable(&eth->q_tx_irq[i].napi);
> > +
> > +	airoha_qdma_for_each_q_rx(eth, i)
> > +		napi_enable(&eth->q_rx[i].napi);
> > +}
> > +
> > +static inline void airoha_qdma_stop_napi(struct airoha_eth *eth)
> > +{
> > +	int i;
> > +
> > +	for (i = 0; i < ARRAY_SIZE(eth->q_tx_irq); i++)
> > +		napi_disable(&eth->q_tx_irq[i].napi);
> > +
> > +	airoha_qdma_for_each_q_rx(eth, i)
> > +		napi_disable(&eth->q_rx[i].napi);
> > +}
> > --
> > 2.45.1
> >

Attachment: signature.asc
Description: PGP signature


[Index of Archives]     [Device Tree Compilter]     [Device Tree Spec]     [Linux Driver Backports]     [Video for Linux]     [Linux USB Devel]     [Linux PCI Devel]     [Linux Audio Users]     [Linux Kernel]     [Linux SCSI]     [XFree86]     [Yosemite Backpacking]


  Powered by Linux