* [PATCH 0/2] net: macb: fix dma usage
@ 2023-11-28 16:29 Steffen Trumtrar
2023-11-28 16:29 ` [PATCH 1/2] net: macb: fix dma_alloc for rx_buffer Steffen Trumtrar
2023-11-28 16:29 ` [PATCH 2/2] net: macb: convert to volatile accesses Steffen Trumtrar
0 siblings, 2 replies; 7+ messages in thread
From: Steffen Trumtrar @ 2023-11-28 16:29 UTC (permalink / raw)
To: barebox
The rx_buffer is only dma_alloc'ed but never properly flushed.
Fix that.
While at it, also use proper volatile access instead of sw barriers.
Signed-off-by: Steffen Trumtrar <s.trumtrar@pengutronix.de>
---
Steffen Trumtrar (2):
net: macb: fix dma_alloc for rx_buffer
net: macb: convert to volatile accesses
drivers/net/macb.c | 90 ++++++++++++++++++++++++++++++------------------------
1 file changed, 50 insertions(+), 40 deletions(-)
---
base-commit: 5f200dd534c848dfa5d948334b6373f0310b8f73
change-id: 20231128-v2023-08-0-topic-macb-0c13ed91179d
Best regards,
--
Steffen Trumtrar <s.trumtrar@pengutronix.de>
^ permalink raw reply [flat|nested] 7+ messages in thread
* [PATCH 1/2] net: macb: fix dma_alloc for rx_buffer
2023-11-28 16:29 [PATCH 0/2] net: macb: fix dma usage Steffen Trumtrar
@ 2023-11-28 16:29 ` Steffen Trumtrar
2023-11-28 16:56 ` Lucas Stach
2023-11-29 6:25 ` Ahmad Fatoum
2023-11-28 16:29 ` [PATCH 2/2] net: macb: convert to volatile accesses Steffen Trumtrar
1 sibling, 2 replies; 7+ messages in thread
From: Steffen Trumtrar @ 2023-11-28 16:29 UTC (permalink / raw)
To: barebox
rx_buffer gets dma_alloc'ed but is never dma_map'ed and therefore not
flushed before it is initially used.
Map the rx_buffer when the macb is initialized and unmap it on ether_halt.
While at it, clean up the dma_alloc_coherent rx_ring/tx_ring, too.
Signed-off-by: Steffen Trumtrar <s.trumtrar@pengutronix.de>
---
drivers/net/macb.c | 37 ++++++++++++++++++++++++++++---------
1 file changed, 28 insertions(+), 9 deletions(-)
diff --git a/drivers/net/macb.c b/drivers/net/macb.c
index 260c1e806a..92f78f7253 100644
--- a/drivers/net/macb.c
+++ b/drivers/net/macb.c
@@ -63,10 +63,13 @@ struct macb_device {
unsigned int tx_head;
void *rx_buffer;
+ dma_addr_t rx_buffer_phys;
void *tx_buffer;
void *rx_packet_buf;
struct macb_dma_desc *rx_ring;
+ dma_addr_t rx_ring_phys;
struct macb_dma_desc *tx_ring;
+ dma_addr_t tx_ring_phys;
struct macb_dma_desc *gem_q1_descs;
int rx_buffer_size;
@@ -181,7 +184,7 @@ static int gem_recv(struct eth_device *edev)
barrier();
status = macb->rx_ring[macb->rx_tail].ctrl;
length = MACB_BFEXT(RX_FRMLEN, status);
- buffer = macb->rx_buffer + macb->rx_buffer_size * macb->rx_tail;
+ buffer = (void *)macb->rx_buffer_phys + macb->rx_buffer_size * macb->rx_tail;
dma_sync_single_for_cpu(macb->dev, (unsigned long)buffer, length,
DMA_FROM_DEVICE);
net_receive(edev, buffer, length);
@@ -221,7 +224,7 @@ static int macb_recv(struct eth_device *edev)
}
if (status & MACB_BIT(RX_EOF)) {
- buffer = macb->rx_buffer + macb->rx_buffer_size * macb->rx_tail;
+ buffer = (void *)macb->rx_buffer_phys + macb->rx_buffer_size * macb->rx_tail;
length = MACB_BFEXT(RX_FRMLEN, status);
if (wrapped) {
unsigned int headlen, taillen;
@@ -232,12 +235,12 @@ static int macb_recv(struct eth_device *edev)
dma_sync_single_for_cpu(macb->dev, (unsigned long)buffer,
headlen, DMA_FROM_DEVICE);
memcpy(macb->rx_packet_buf, buffer, headlen);
- dma_sync_single_for_cpu(macb->dev, (unsigned long)macb->rx_buffer,
+ dma_sync_single_for_cpu(macb->dev, (unsigned long)macb->rx_buffer_phys,
taillen, DMA_FROM_DEVICE);
memcpy(macb->rx_packet_buf + headlen, macb->rx_buffer, taillen);
dma_sync_single_for_device(macb->dev, (unsigned long)buffer,
headlen, DMA_FROM_DEVICE);
- dma_sync_single_for_device(macb->dev, (unsigned long)macb->rx_buffer,
+ dma_sync_single_for_device(macb->dev, (unsigned long)macb->rx_buffer_phys,
taillen, DMA_FROM_DEVICE);
net_receive(edev, macb->rx_packet_buf, length);
} else {
@@ -377,7 +380,7 @@ static int gmac_init_dummy_tx_queues(struct macb_device *macb)
return 0;
}
-static void macb_init(struct macb_device *macb)
+static int macb_init(struct macb_device *macb)
{
unsigned long paddr, val = 0;
int i;
@@ -386,6 +389,11 @@ static void macb_init(struct macb_device *macb)
* macb_halt should have been called at some point before now,
* so we'll assume the controller is idle.
*/
+ macb->rx_buffer_phys = dma_map_single(macb->dev, macb->rx_buffer,
+ macb->rx_buffer_size * macb->rx_ring_size,
+ DMA_TO_DEVICE);
+ if (dma_mapping_error(macb->dev, macb->rx_buffer_phys))
+ return -EFAULT;
/* initialize DMA descriptors */
paddr = (ulong)macb->rx_buffer;
@@ -442,6 +450,7 @@ static void macb_init(struct macb_device *macb)
macb_or_gem_writel(macb, USRIO, val);
+ return 0;
}
static void macb_halt(struct eth_device *edev)
@@ -460,6 +469,13 @@ static void macb_halt(struct eth_device *edev)
/* Disable TX and RX, and clear statistics */
macb_writel(macb, NCR, MACB_BIT(CLRSTAT));
+
+ dma_unmap_single(macb->dev, macb->rx_buffer_phys,
+ macb->rx_buffer_size * macb->rx_ring_size,
+ DMA_TO_DEVICE);
+ free(macb->rx_buffer);
+ dma_free_coherent((void *)macb->rx_ring, macb->rx_ring_phys, RX_RING_BYTES(macb));
+ dma_free_coherent((void *)macb->tx_ring, macb->tx_ring_phys, TX_RING_BYTES);
}
static int macb_phy_read(struct mii_bus *bus, int addr, int reg)
@@ -780,6 +796,7 @@ static int macb_probe(struct device *dev)
const char *pclk_name, *hclk_name;
const struct macb_config *config = NULL;
u32 ncfgr;
+ int ret;
macb = xzalloc(sizeof(*macb));
edev = &macb->netdev;
@@ -877,7 +894,7 @@ static int macb_probe(struct device *dev)
clk_enable(macb->rxclk);
if (config) {
- int ret = config->txclk_init(dev, &macb->txclk);
+ ret = config->txclk_init(dev, &macb->txclk);
if (ret)
return ret;
}
@@ -891,8 +908,8 @@ static int macb_probe(struct device *dev)
macb_init_rx_buffer_size(macb, PKTSIZE);
macb->rx_buffer = dma_alloc(macb->rx_buffer_size * macb->rx_ring_size);
- macb->rx_ring = dma_alloc_coherent(RX_RING_BYTES(macb), DMA_ADDRESS_BROKEN);
- macb->tx_ring = dma_alloc_coherent(TX_RING_BYTES, DMA_ADDRESS_BROKEN);
+ macb->rx_ring = dma_alloc_coherent(RX_RING_BYTES(macb), &macb->rx_ring_phys);
+ macb->tx_ring = dma_alloc_coherent(TX_RING_BYTES, &macb->tx_ring_phys);
if (macb->is_gem)
macb->gem_q1_descs = dma_alloc_coherent(GEM_Q1_DESC_BYTES,
@@ -907,7 +924,9 @@ static int macb_probe(struct device *dev)
ncfgr |= macb_dbw(macb);
macb_writel(macb, NCFGR, ncfgr);
- macb_init(macb);
+ ret = macb_init(macb);
+ if (ret)
+ return ret;
mdiobus_register(&macb->miibus);
eth_register(edev);
--
2.40.1
^ permalink raw reply [flat|nested] 7+ messages in thread
* [PATCH 2/2] net: macb: convert to volatile accesses
2023-11-28 16:29 [PATCH 0/2] net: macb: fix dma usage Steffen Trumtrar
2023-11-28 16:29 ` [PATCH 1/2] net: macb: fix dma_alloc for rx_buffer Steffen Trumtrar
@ 2023-11-28 16:29 ` Steffen Trumtrar
2023-11-29 6:31 ` Ahmad Fatoum
1 sibling, 1 reply; 7+ messages in thread
From: Steffen Trumtrar @ 2023-11-28 16:29 UTC (permalink / raw)
To: barebox
Instead of directly reading from memory addresses and inserting
sw barriers to be sure that the compiler will not move loads/stores
behind this point, just use proper volatile writel/readl accesses.
Signed-off-by: Steffen Trumtrar <s.trumtrar@pengutronix.de>
---
drivers/net/macb.c | 53 ++++++++++++++++++++++-------------------------------
1 file changed, 22 insertions(+), 31 deletions(-)
diff --git a/drivers/net/macb.c b/drivers/net/macb.c
index 92f78f7253..c9a7e395d6 100644
--- a/drivers/net/macb.c
+++ b/drivers/net/macb.c
@@ -119,17 +119,15 @@ static int macb_send(struct eth_device *edev, void *packet,
macb->tx_head++;
}
- macb->tx_ring[tx_head].ctrl = ctrl;
- macb->tx_ring[tx_head].addr = (ulong)packet;
- barrier();
+ writel(ctrl, &macb->tx_ring[tx_head].ctrl);
+ writel((ulong)packet, &macb->tx_ring[tx_head].addr);
dma_sync_single_for_device(macb->dev, (unsigned long)packet, length, DMA_TO_DEVICE);
macb_writel(macb, NCR, MACB_BIT(TE) | MACB_BIT(RE) | MACB_BIT(TSTART));
start = get_time_ns();
ret = -ETIMEDOUT;
do {
- barrier();
- ctrl = macb->tx_ring[0].ctrl;
+ ctrl = readl(&macb->tx_ring[0].ctrl);
if (ctrl & MACB_BIT(TX_USED)) {
ret = 0;
break;
@@ -154,18 +152,17 @@ static void reclaim_rx_buffers(struct macb_device *macb,
i = macb->rx_tail;
while (i > new_tail) {
- macb->rx_ring[i].addr &= ~MACB_BIT(RX_USED);
+ clrbits_le32(&macb->rx_ring[i].addr, MACB_BIT(RX_USED));
i++;
if (i > macb->rx_ring_size)
i = 0;
}
while (i < new_tail) {
- macb->rx_ring[i].addr &= ~MACB_BIT(RX_USED);
+ clrbits_le32(&macb->rx_ring[i].addr, MACB_BIT(RX_USED));
i++;
}
- barrier();
macb->rx_tail = new_tail;
}
@@ -177,12 +174,10 @@ static int gem_recv(struct eth_device *edev)
u32 status;
for (;;) {
- barrier();
- if (!(macb->rx_ring[macb->rx_tail].addr & MACB_BIT(RX_USED)))
+ if (!(readl(&macb->rx_ring[macb->rx_tail].addr) & MACB_BIT(RX_USED)))
return -1;
- barrier();
- status = macb->rx_ring[macb->rx_tail].ctrl;
+ status = readl(&macb->rx_ring[macb->rx_tail].ctrl);
length = MACB_BFEXT(RX_FRMLEN, status);
buffer = (void *)macb->rx_buffer_phys + macb->rx_buffer_size * macb->rx_tail;
dma_sync_single_for_cpu(macb->dev, (unsigned long)buffer, length,
@@ -190,8 +185,7 @@ static int gem_recv(struct eth_device *edev)
net_receive(edev, buffer, length);
dma_sync_single_for_device(macb->dev, (unsigned long)buffer, length,
DMA_FROM_DEVICE);
- macb->rx_ring[macb->rx_tail].addr &= ~MACB_BIT(RX_USED);
- barrier();
+ clrbits_le32(&macb->rx_ring[macb->rx_tail].addr, MACB_BIT(RX_USED));
macb->rx_tail++;
if (macb->rx_tail >= macb->rx_ring_size)
@@ -211,12 +205,10 @@ static int macb_recv(struct eth_device *edev)
u32 status;
for (;;) {
- barrier();
- if (!(macb->rx_ring[rx_tail].addr & MACB_BIT(RX_USED)))
+ if (!(readl(&macb->rx_ring[rx_tail].addr) & MACB_BIT(RX_USED)))
return -1;
- barrier();
- status = macb->rx_ring[rx_tail].ctrl;
+ status = readl(&macb->rx_ring[rx_tail].ctrl);
if (status & MACB_BIT(RX_SOF)) {
if (rx_tail != macb->rx_tail)
reclaim_rx_buffers(macb, rx_tail);
@@ -250,7 +242,6 @@ static int macb_recv(struct eth_device *edev)
dma_sync_single_for_device(macb->dev, (unsigned long)buffer, length,
DMA_FROM_DEVICE);
}
- barrier();
if (++rx_tail >= macb->rx_ring_size)
rx_tail = 0;
reclaim_rx_buffers(macb, rx_tail);
@@ -370,9 +361,9 @@ static int gmac_init_dummy_tx_queues(struct macb_device *macb)
if (queue_mask & (1 << i))
num_queues++;
- macb->gem_q1_descs[0].addr = 0;
- macb->gem_q1_descs[0].ctrl = MACB_BIT(TX_WRAP) |
- MACB_BIT(TX_LAST) | MACB_BIT(TX_USED);
+ writel(0, &macb->gem_q1_descs[0].addr);
+ setbits_le32(&macb->gem_q1_descs[0].ctrl,
+ MACB_BIT(TX_WRAP) | MACB_BIT(TX_LAST) | MACB_BIT(TX_USED));
for (i = 1; i < num_queues; i++)
gem_writel_queue_TBQP(macb, (ulong)macb->gem_q1_descs, i - 1);
@@ -398,17 +389,17 @@ static int macb_init(struct macb_device *macb)
/* initialize DMA descriptors */
paddr = (ulong)macb->rx_buffer;
for (i = 0; i < macb->rx_ring_size; i++) {
- macb->rx_ring[i].addr = paddr;
- macb->rx_ring[i].ctrl = 0;
+ writel(paddr, &macb->rx_ring[i].addr);
+ writel(0, &macb->rx_ring[i].ctrl);
paddr += macb->rx_buffer_size;
}
- macb->rx_ring[macb->rx_ring_size - 1].addr |= MACB_BIT(RX_WRAP);
+ setbits_le32(&macb->rx_ring[macb->rx_ring_size - 1].addr, MACB_BIT(RX_WRAP));
for (i = 0; i < TX_RING_SIZE; i++) {
- macb->tx_ring[i].addr = 0;
- macb->tx_ring[i].ctrl = MACB_BIT(TX_USED);
+ writel(0, &macb->tx_ring[i].addr);
+ writel(MACB_BIT(TX_USED), &macb->tx_ring[i].ctrl);
}
- macb->tx_ring[TX_RING_SIZE - 1].addr |= MACB_BIT(TX_WRAP);
+ writel(MACB_BIT(TX_WRAP), &macb->tx_ring[TX_RING_SIZE - 1].addr);
macb->rx_tail = macb->tx_head = 0;
@@ -421,9 +412,9 @@ static int macb_init(struct macb_device *macb)
gmac_init_dummy_tx_queues(macb);
/* Disable the second priority rx queue */
- macb->gem_q1_descs[1].addr = MACB_BIT(RX_USED) |
- MACB_BIT(RX_WRAP);
- macb->gem_q1_descs[1].ctrl = 0;
+ setbits_le32(&macb->gem_q1_descs[1].addr,
+ MACB_BIT(RX_USED) | MACB_BIT(RX_WRAP));
+ writel(0, &macb->gem_q1_descs[1].ctrl);
gem_writel(macb, RQ1, (ulong)&macb->gem_q1_descs[1]);
}
--
2.40.1
^ permalink raw reply [flat|nested] 7+ messages in thread
* Re: [PATCH 1/2] net: macb: fix dma_alloc for rx_buffer
2023-11-28 16:29 ` [PATCH 1/2] net: macb: fix dma_alloc for rx_buffer Steffen Trumtrar
@ 2023-11-28 16:56 ` Lucas Stach
2023-11-29 6:48 ` Steffen Trumtrar
2023-11-29 6:25 ` Ahmad Fatoum
1 sibling, 1 reply; 7+ messages in thread
From: Lucas Stach @ 2023-11-28 16:56 UTC (permalink / raw)
To: Steffen Trumtrar, barebox
Am Dienstag, dem 28.11.2023 um 17:29 +0100 schrieb Steffen Trumtrar:
> rx_buffer gets dma_alloc'ed but is never dma_map'ed and therefore not
> flushed before it is initially used.
>
> Map the rx_buffer when the macb is initialized and unmap it on ether_halt.
>
> While at it, clean up the dma_alloc_coherent rx_ring/tx_ring, too.
>
> Signed-off-by: Steffen Trumtrar <s.trumtrar@pengutronix.de>
> ---
> drivers/net/macb.c | 37 ++++++++++++++++++++++++++++---------
> 1 file changed, 28 insertions(+), 9 deletions(-)
>
> diff --git a/drivers/net/macb.c b/drivers/net/macb.c
> index 260c1e806a..92f78f7253 100644
> --- a/drivers/net/macb.c
> +++ b/drivers/net/macb.c
> @@ -63,10 +63,13 @@ struct macb_device {
> unsigned int tx_head;
>
> void *rx_buffer;
> + dma_addr_t rx_buffer_phys;
> void *tx_buffer;
> void *rx_packet_buf;
> struct macb_dma_desc *rx_ring;
> + dma_addr_t rx_ring_phys;
> struct macb_dma_desc *tx_ring;
> + dma_addr_t tx_ring_phys;
> struct macb_dma_desc *gem_q1_descs;
>
> int rx_buffer_size;
> @@ -181,7 +184,7 @@ static int gem_recv(struct eth_device *edev)
> barrier();
> status = macb->rx_ring[macb->rx_tail].ctrl;
> length = MACB_BFEXT(RX_FRMLEN, status);
> - buffer = macb->rx_buffer + macb->rx_buffer_size * macb->rx_tail;
> + buffer = (void *)macb->rx_buffer_phys + macb->rx_buffer_size * macb->rx_tail;
> dma_sync_single_for_cpu(macb->dev, (unsigned long)buffer, length,
> DMA_FROM_DEVICE);
> net_receive(edev, buffer, length);
> @@ -221,7 +224,7 @@ static int macb_recv(struct eth_device *edev)
> }
>
> if (status & MACB_BIT(RX_EOF)) {
> - buffer = macb->rx_buffer + macb->rx_buffer_size * macb->rx_tail;
> + buffer = (void *)macb->rx_buffer_phys + macb->rx_buffer_size * macb->rx_tail;
> length = MACB_BFEXT(RX_FRMLEN, status);
> if (wrapped) {
> unsigned int headlen, taillen;
> @@ -232,12 +235,12 @@ static int macb_recv(struct eth_device *edev)
> dma_sync_single_for_cpu(macb->dev, (unsigned long)buffer,
> headlen, DMA_FROM_DEVICE);
> memcpy(macb->rx_packet_buf, buffer, headlen);
> - dma_sync_single_for_cpu(macb->dev, (unsigned long)macb->rx_buffer,
> + dma_sync_single_for_cpu(macb->dev, (unsigned long)macb->rx_buffer_phys,
You can drop all those (unsigned long) casts in calls to
dma_sync_single, now that you are passing an argument of the proper
dma_addr_t type.
> taillen, DMA_FROM_DEVICE);
> memcpy(macb->rx_packet_buf + headlen, macb->rx_buffer, taillen);
> dma_sync_single_for_device(macb->dev, (unsigned long)buffer,
> headlen, DMA_FROM_DEVICE);
> - dma_sync_single_for_device(macb->dev, (unsigned long)macb->rx_buffer,
> + dma_sync_single_for_device(macb->dev, (unsigned long)macb->rx_buffer_phys,
> taillen, DMA_FROM_DEVICE);
> net_receive(edev, macb->rx_packet_buf, length);
> } else {
> @@ -377,7 +380,7 @@ static int gmac_init_dummy_tx_queues(struct macb_device *macb)
> return 0;
> }
>
> -static void macb_init(struct macb_device *macb)
> +static int macb_init(struct macb_device *macb)
> {
> unsigned long paddr, val = 0;
> int i;
> @@ -386,6 +389,11 @@ static void macb_init(struct macb_device *macb)
> * macb_halt should have been called at some point before now,
> * so we'll assume the controller is idle.
> */
> + macb->rx_buffer_phys = dma_map_single(macb->dev, macb->rx_buffer,
> + macb->rx_buffer_size * macb->rx_ring_size,
> + DMA_TO_DEVICE);
The RX buffer is used to hold data written by the device, so it must be
mapped with DMA_FROM_DEVICE.
Regards,
Lucas
> + if (dma_mapping_error(macb->dev, macb->rx_buffer_phys))
> + return -EFAULT;
>
> /* initialize DMA descriptors */
> paddr = (ulong)macb->rx_buffer;
> @@ -442,6 +450,7 @@ static void macb_init(struct macb_device *macb)
>
> macb_or_gem_writel(macb, USRIO, val);
>
> + return 0;
> }
>
> static void macb_halt(struct eth_device *edev)
> @@ -460,6 +469,13 @@ static void macb_halt(struct eth_device *edev)
>
> /* Disable TX and RX, and clear statistics */
> macb_writel(macb, NCR, MACB_BIT(CLRSTAT));
> +
> + dma_unmap_single(macb->dev, macb->rx_buffer_phys,
> + macb->rx_buffer_size * macb->rx_ring_size,
> + DMA_TO_DEVICE);
> + free(macb->rx_buffer);
> + dma_free_coherent((void *)macb->rx_ring, macb->rx_ring_phys, RX_RING_BYTES(macb));
> + dma_free_coherent((void *)macb->tx_ring, macb->tx_ring_phys, TX_RING_BYTES);
> }
>
> static int macb_phy_read(struct mii_bus *bus, int addr, int reg)
> @@ -780,6 +796,7 @@ static int macb_probe(struct device *dev)
> const char *pclk_name, *hclk_name;
> const struct macb_config *config = NULL;
> u32 ncfgr;
> + int ret;
>
> macb = xzalloc(sizeof(*macb));
> edev = &macb->netdev;
> @@ -877,7 +894,7 @@ static int macb_probe(struct device *dev)
> clk_enable(macb->rxclk);
>
> if (config) {
> - int ret = config->txclk_init(dev, &macb->txclk);
> + ret = config->txclk_init(dev, &macb->txclk);
> if (ret)
> return ret;
> }
> @@ -891,8 +908,8 @@ static int macb_probe(struct device *dev)
>
> macb_init_rx_buffer_size(macb, PKTSIZE);
> macb->rx_buffer = dma_alloc(macb->rx_buffer_size * macb->rx_ring_size);
> - macb->rx_ring = dma_alloc_coherent(RX_RING_BYTES(macb), DMA_ADDRESS_BROKEN);
> - macb->tx_ring = dma_alloc_coherent(TX_RING_BYTES, DMA_ADDRESS_BROKEN);
> + macb->rx_ring = dma_alloc_coherent(RX_RING_BYTES(macb), &macb->rx_ring_phys);
> + macb->tx_ring = dma_alloc_coherent(TX_RING_BYTES, &macb->tx_ring_phys);
>
> if (macb->is_gem)
> macb->gem_q1_descs = dma_alloc_coherent(GEM_Q1_DESC_BYTES,
> @@ -907,7 +924,9 @@ static int macb_probe(struct device *dev)
> ncfgr |= macb_dbw(macb);
> macb_writel(macb, NCFGR, ncfgr);
>
> - macb_init(macb);
> + ret = macb_init(macb);
> + if (ret)
> + return ret;
>
> mdiobus_register(&macb->miibus);
> eth_register(edev);
>
^ permalink raw reply [flat|nested] 7+ messages in thread
* Re: [PATCH 1/2] net: macb: fix dma_alloc for rx_buffer
2023-11-28 16:29 ` [PATCH 1/2] net: macb: fix dma_alloc for rx_buffer Steffen Trumtrar
2023-11-28 16:56 ` Lucas Stach
@ 2023-11-29 6:25 ` Ahmad Fatoum
1 sibling, 0 replies; 7+ messages in thread
From: Ahmad Fatoum @ 2023-11-29 6:25 UTC (permalink / raw)
To: Steffen Trumtrar, barebox
Hello Steffen,
On 28.11.23 17:29, Steffen Trumtrar wrote:
> rx_buffer gets dma_alloc'ed but is never dma_map'ed and therefore not
> flushed before it is initially used.
>
> Map the rx_buffer when the macb is initialized and unmap it on ether_halt.
>
> While at it, clean up the dma_alloc_coherent rx_ring/tx_ring, too.
>
> Signed-off-by: Steffen Trumtrar <s.trumtrar@pengutronix.de>
> ---
> drivers/net/macb.c | 37 ++++++++++++++++++++++++++++---------
> 1 file changed, 28 insertions(+), 9 deletions(-)
>
> diff --git a/drivers/net/macb.c b/drivers/net/macb.c
> index 260c1e806a..92f78f7253 100644
> --- a/drivers/net/macb.c
> +++ b/drivers/net/macb.c
> @@ -63,10 +63,13 @@ struct macb_device {
> unsigned int tx_head;
>
> void *rx_buffer;
> + dma_addr_t rx_buffer_phys;
> void *tx_buffer;
> void *rx_packet_buf;
> struct macb_dma_desc *rx_ring;
> + dma_addr_t rx_ring_phys;
> struct macb_dma_desc *tx_ring;
> + dma_addr_t tx_ring_phys;
> struct macb_dma_desc *gem_q1_descs;
>
> int rx_buffer_size;
> @@ -181,7 +184,7 @@ static int gem_recv(struct eth_device *edev)
> barrier();
> status = macb->rx_ring[macb->rx_tail].ctrl;
> length = MACB_BFEXT(RX_FRMLEN, status);
> - buffer = macb->rx_buffer + macb->rx_buffer_size * macb->rx_tail;
> + buffer = (void *)macb->rx_buffer_phys + macb->rx_buffer_size * macb->rx_tail;
For GEM-type NICs, rx_buffer_size is PKTSIZE (1518 bytes currently), which is not a multiple
of the 64-byte cache line size of the ZynqMP's Cortex-A53, which the driver
is supposed to support.
> dma_sync_single_for_cpu(macb->dev, (unsigned long)buffer, length,
> DMA_FROM_DEVICE);
This means this could potentially invalidate adjacent buffer contents.
> }
> @@ -891,8 +908,8 @@ static int macb_probe(struct device *dev)
>
> macb_init_rx_buffer_size(macb, PKTSIZE);
^ Here's where PKTSIZE comes from. I'd be in favor of changing the global PKTSIZE
definition to be a multiple of 64 bytes (or use DMA_ALIGNMENT, but this isn't
correctly set for ARM yet. I just sent out a patch for that).
Cheers,
Ahmad
--
Pengutronix e.K. | |
Steuerwalder Str. 21 | http://www.pengutronix.de/ |
31137 Hildesheim, Germany | Phone: +49-5121-206917-0 |
Amtsgericht Hildesheim, HRA 2686 | Fax: +49-5121-206917-5555 |
^ permalink raw reply [flat|nested] 7+ messages in thread
* Re: [PATCH 2/2] net: macb: convert to volatile accesses
2023-11-28 16:29 ` [PATCH 2/2] net: macb: convert to volatile accesses Steffen Trumtrar
@ 2023-11-29 6:31 ` Ahmad Fatoum
0 siblings, 0 replies; 7+ messages in thread
From: Ahmad Fatoum @ 2023-11-29 6:31 UTC (permalink / raw)
To: Steffen Trumtrar, barebox
Hello Steffen,
On 28.11.23 17:29, Steffen Trumtrar wrote:
> + writel(ctrl, &macb->tx_ring[tx_head].ctrl);
> + writel((ulong)packet, &macb->tx_ring[tx_head].addr);
> dma_sync_single_for_device(macb->dev, (unsigned long)packet, length, DMA_TO_DEVICE);
For this buffer, dma_map_single is missing. By the way, I just sent out a series
implementing CONFIG_DMA_API_DEBUG, which should catch this (as well as the original
issue in the Rx path).
> - macb->gem_q1_descs[0].addr = 0;
> - macb->gem_q1_descs[0].ctrl = MACB_BIT(TX_WRAP) |
> - MACB_BIT(TX_LAST) | MACB_BIT(TX_USED);
> + writel(0, &macb->gem_q1_descs[0].addr);
> + setbits_le32(&macb->gem_q1_descs[0].ctrl,
> + MACB_BIT(TX_WRAP) | MACB_BIT(TX_LAST) | MACB_BIT(TX_USED));
Should be writel to maintain previous semantics.
> - macb->tx_ring[TX_RING_SIZE - 1].addr |= MACB_BIT(TX_WRAP);
> + writel(MACB_BIT(TX_WRAP), &macb->tx_ring[TX_RING_SIZE - 1].addr);
Should be a setbits_le32 to maintain previous semantics.
> /* Disable the second priority rx queue */
> - macb->gem_q1_descs[1].addr = MACB_BIT(RX_USED) |
> - MACB_BIT(RX_WRAP);
> - macb->gem_q1_descs[1].ctrl = 0;
> + setbits_le32(&macb->gem_q1_descs[1].addr,
> + MACB_BIT(RX_USED) | MACB_BIT(RX_WRAP));
Should be a writel to maintain previous semantics.
> + writel(0, &macb->gem_q1_descs[1].ctrl);
>
> gem_writel(macb, RQ1, (ulong)&macb->gem_q1_descs[1]);
> }
>
Cheers,
Ahmad
--
Pengutronix e.K. | |
Steuerwalder Str. 21 | http://www.pengutronix.de/ |
31137 Hildesheim, Germany | Phone: +49-5121-206917-0 |
Amtsgericht Hildesheim, HRA 2686 | Fax: +49-5121-206917-5555 |
^ permalink raw reply [flat|nested] 7+ messages in thread
* Re: [PATCH 1/2] net: macb: fix dma_alloc for rx_buffer
2023-11-28 16:56 ` Lucas Stach
@ 2023-11-29 6:48 ` Steffen Trumtrar
0 siblings, 0 replies; 7+ messages in thread
From: Steffen Trumtrar @ 2023-11-29 6:48 UTC (permalink / raw)
To: Lucas Stach; +Cc: barebox
On 2023-11-28 at 17:56 +01, Lucas Stach <l.stach@pengutronix.de> wrote:
> Am Dienstag, dem 28.11.2023 um 17:29 +0100 schrieb Steffen Trumtrar:
>> rx_buffer gets dma_alloc'ed but is never dma_map'ed and therefore not
>> flushed before it is initially used.
>>
>> Map the rx_buffer when the macb is initialized and unmap it on ether_halt.
>>
>> While at it, clean up the dma_alloc_coherent rx_ring/tx_ring, too.
>>
>> Signed-off-by: Steffen Trumtrar <s.trumtrar@pengutronix.de>
>> ---
>> drivers/net/macb.c | 37 ++++++++++++++++++++++++++++---------
>> 1 file changed, 28 insertions(+), 9 deletions(-)
>>
>> diff --git a/drivers/net/macb.c b/drivers/net/macb.c
>> index 260c1e806a..92f78f7253 100644
>> --- a/drivers/net/macb.c
>> +++ b/drivers/net/macb.c
>> @@ -63,10 +63,13 @@ struct macb_device {
>> unsigned int tx_head;
>>
>> void *rx_buffer;
>> + dma_addr_t rx_buffer_phys;
>> void *tx_buffer;
>> void *rx_packet_buf;
>> struct macb_dma_desc *rx_ring;
>> + dma_addr_t rx_ring_phys;
>> struct macb_dma_desc *tx_ring;
>> + dma_addr_t tx_ring_phys;
>> struct macb_dma_desc *gem_q1_descs;
>>
>> int rx_buffer_size;
>> @@ -181,7 +184,7 @@ static int gem_recv(struct eth_device *edev)
>> barrier();
>> status = macb->rx_ring[macb->rx_tail].ctrl;
>> length = MACB_BFEXT(RX_FRMLEN, status);
>> - buffer = macb->rx_buffer + macb->rx_buffer_size * macb->rx_tail;
>> + buffer = (void *)macb->rx_buffer_phys + macb->rx_buffer_size * macb->rx_tail;
>> dma_sync_single_for_cpu(macb->dev, (unsigned long)buffer, length,
>> DMA_FROM_DEVICE);
>> net_receive(edev, buffer, length);
>> @@ -221,7 +224,7 @@ static int macb_recv(struct eth_device *edev)
>> }
>>
>> if (status & MACB_BIT(RX_EOF)) {
>> - buffer = macb->rx_buffer + macb->rx_buffer_size * macb->rx_tail;
>> + buffer = (void *)macb->rx_buffer_phys + macb->rx_buffer_size * macb->rx_tail;
>> length = MACB_BFEXT(RX_FRMLEN, status);
>> if (wrapped) {
>> unsigned int headlen, taillen;
>> @@ -232,12 +235,12 @@ static int macb_recv(struct eth_device *edev)
>> dma_sync_single_for_cpu(macb->dev, (unsigned long)buffer,
>> headlen, DMA_FROM_DEVICE);
>> memcpy(macb->rx_packet_buf, buffer, headlen);
>> - dma_sync_single_for_cpu(macb->dev, (unsigned long)macb->rx_buffer,
>> + dma_sync_single_for_cpu(macb->dev, (unsigned long)macb->rx_buffer_phys,
>
> You can drop all those (unsigned long) casts in calls to
> dma_sync_single, now that you are passing an argument of the proper
> dma_addr_t type.
>
Thanks, will drop.
>> taillen, DMA_FROM_DEVICE);
>> memcpy(macb->rx_packet_buf + headlen, macb->rx_buffer, taillen);
>> dma_sync_single_for_device(macb->dev, (unsigned long)buffer,
>> headlen, DMA_FROM_DEVICE);
>> - dma_sync_single_for_device(macb->dev, (unsigned long)macb->rx_buffer,
>> + dma_sync_single_for_device(macb->dev, (unsigned long)macb->rx_buffer_phys,
>> taillen, DMA_FROM_DEVICE);
>> net_receive(edev, macb->rx_packet_buf, length);
>> } else {
>> @@ -377,7 +380,7 @@ static int gmac_init_dummy_tx_queues(struct macb_device *macb)
>> return 0;
>> }
>>
>> -static void macb_init(struct macb_device *macb)
>> +static int macb_init(struct macb_device *macb)
>> {
>> unsigned long paddr, val = 0;
>> int i;
>> @@ -386,6 +389,11 @@ static void macb_init(struct macb_device *macb)
>> * macb_halt should have been called at some point before now,
>> * so we'll assume the controller is idle.
>> */
>> + macb->rx_buffer_phys = dma_map_single(macb->dev, macb->rx_buffer,
>> + macb->rx_buffer_size * macb->rx_ring_size,
>> + DMA_TO_DEVICE);
>
> The RX buffer is used to hold data written by the device, so it must be
> mapped with DMA_FROM_DEVICE.
>
Argh, of course :(
Thanks,
Steffen
--
Pengutronix e.K. | Dipl.-Inform. Steffen Trumtrar |
Steuerwalder Str. 21 | https://www.pengutronix.de/ |
31137 Hildesheim, Germany | Phone: +49-5121-206917-0 |
Amtsgericht Hildesheim, HRA 2686| Fax: +49-5121-206917-5555 |
^ permalink raw reply [flat|nested] 7+ messages in thread
end of thread, other threads:[~2023-11-29 6:51 UTC | newest]
Thread overview: 7+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2023-11-28 16:29 [PATCH 0/2] net: macb: fix dma usage Steffen Trumtrar
2023-11-28 16:29 ` [PATCH 1/2] net: macb: fix dma_alloc for rx_buffer Steffen Trumtrar
2023-11-28 16:56 ` Lucas Stach
2023-11-29 6:48 ` Steffen Trumtrar
2023-11-29 6:25 ` Ahmad Fatoum
2023-11-28 16:29 ` [PATCH 2/2] net: macb: convert to volatile accesses Steffen Trumtrar
2023-11-29 6:31 ` Ahmad Fatoum
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox