Commit a29b6235 authored by Marcin Wojtas, committed by David S. Miller

net: mvneta: add BQL support

Tests showed that when the whole bandwidth is consumed, the latency for
various kinds of traffic can reach high values. With a saturated
link (e.g. with iperf from target to host) a simple ping could take
a significant amount of time. BQL proved to improve this situation
when implemented in the mvneta driver. Measurements of ping latency
for 3 link speeds:
Speed | Latency w/o BQL | Latency with BQL
10    |      7-14 ms    |     3.5 ms
100   |      2-12 ms    |     0.6 ms
1000  |   often timeout |   up to 2ms

Decreasing latency as above results in a slight performance cost - 4kpps
(-1.4%) when pushing 64B packets via two bridged interfaces of Armada 38x.
For 1500B packets in the same setup, the mpstat tool showed +8% of
CPU occupation (default affinity, second CPU idle). Even so, this
cost seems reasonable to accept, considering the other improvements.

This commit adds the byte queue limits (BQL) mechanism to the mvneta driver.
Signed-off-by: Marcin Wojtas <mw@semihalf.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
parent 2a90f7e1
...@@ -1759,8 +1759,10 @@ static struct mvneta_tx_queue *mvneta_tx_done_policy(struct mvneta_port *pp, ...@@ -1759,8 +1759,10 @@ static struct mvneta_tx_queue *mvneta_tx_done_policy(struct mvneta_port *pp,
/* Free tx queue skbuffs */ /* Free tx queue skbuffs */
static void mvneta_txq_bufs_free(struct mvneta_port *pp, static void mvneta_txq_bufs_free(struct mvneta_port *pp,
struct mvneta_tx_queue *txq, int num) struct mvneta_tx_queue *txq, int num,
struct netdev_queue *nq)
{ {
unsigned int bytes_compl = 0, pkts_compl = 0;
int i; int i;
for (i = 0; i < num; i++) { for (i = 0; i < num; i++) {
...@@ -1768,6 +1770,11 @@ static void mvneta_txq_bufs_free(struct mvneta_port *pp, ...@@ -1768,6 +1770,11 @@ static void mvneta_txq_bufs_free(struct mvneta_port *pp,
txq->txq_get_index; txq->txq_get_index;
struct sk_buff *skb = txq->tx_skb[txq->txq_get_index]; struct sk_buff *skb = txq->tx_skb[txq->txq_get_index];
if (skb) {
bytes_compl += skb->len;
pkts_compl++;
}
mvneta_txq_inc_get(txq); mvneta_txq_inc_get(txq);
if (!IS_TSO_HEADER(txq, tx_desc->buf_phys_addr)) if (!IS_TSO_HEADER(txq, tx_desc->buf_phys_addr))
...@@ -1778,6 +1785,8 @@ static void mvneta_txq_bufs_free(struct mvneta_port *pp, ...@@ -1778,6 +1785,8 @@ static void mvneta_txq_bufs_free(struct mvneta_port *pp,
continue; continue;
dev_kfree_skb_any(skb); dev_kfree_skb_any(skb);
} }
netdev_tx_completed_queue(nq, pkts_compl, bytes_compl);
} }
/* Handle end of transmission */ /* Handle end of transmission */
...@@ -1791,7 +1800,7 @@ static void mvneta_txq_done(struct mvneta_port *pp, ...@@ -1791,7 +1800,7 @@ static void mvneta_txq_done(struct mvneta_port *pp,
if (!tx_done) if (!tx_done)
return; return;
mvneta_txq_bufs_free(pp, txq, tx_done); mvneta_txq_bufs_free(pp, txq, tx_done, nq);
txq->count -= tx_done; txq->count -= tx_done;
...@@ -2401,6 +2410,8 @@ static int mvneta_tx(struct sk_buff *skb, struct net_device *dev) ...@@ -2401,6 +2410,8 @@ static int mvneta_tx(struct sk_buff *skb, struct net_device *dev)
struct mvneta_pcpu_stats *stats = this_cpu_ptr(pp->stats); struct mvneta_pcpu_stats *stats = this_cpu_ptr(pp->stats);
struct netdev_queue *nq = netdev_get_tx_queue(dev, txq_id); struct netdev_queue *nq = netdev_get_tx_queue(dev, txq_id);
netdev_tx_sent_queue(nq, len);
txq->count += frags; txq->count += frags;
if (txq->count >= txq->tx_stop_threshold) if (txq->count >= txq->tx_stop_threshold)
netif_tx_stop_queue(nq); netif_tx_stop_queue(nq);
...@@ -2429,9 +2440,10 @@ static void mvneta_txq_done_force(struct mvneta_port *pp, ...@@ -2429,9 +2440,10 @@ static void mvneta_txq_done_force(struct mvneta_port *pp,
struct mvneta_tx_queue *txq) struct mvneta_tx_queue *txq)
{ {
struct netdev_queue *nq = netdev_get_tx_queue(pp->dev, txq->id);
int tx_done = txq->count; int tx_done = txq->count;
mvneta_txq_bufs_free(pp, txq, tx_done); mvneta_txq_bufs_free(pp, txq, tx_done, nq);
/* reset txq */ /* reset txq */
txq->count = 0; txq->count = 0;
...@@ -2957,6 +2969,8 @@ static int mvneta_txq_init(struct mvneta_port *pp, ...@@ -2957,6 +2969,8 @@ static int mvneta_txq_init(struct mvneta_port *pp,
static void mvneta_txq_deinit(struct mvneta_port *pp, static void mvneta_txq_deinit(struct mvneta_port *pp,
struct mvneta_tx_queue *txq) struct mvneta_tx_queue *txq)
{ {
struct netdev_queue *nq = netdev_get_tx_queue(pp->dev, txq->id);
kfree(txq->tx_skb); kfree(txq->tx_skb);
if (txq->tso_hdrs) if (txq->tso_hdrs)
...@@ -2968,6 +2982,8 @@ static void mvneta_txq_deinit(struct mvneta_port *pp, ...@@ -2968,6 +2982,8 @@ static void mvneta_txq_deinit(struct mvneta_port *pp,
txq->size * MVNETA_DESC_ALIGNED_SIZE, txq->size * MVNETA_DESC_ALIGNED_SIZE,
txq->descs, txq->descs_phys); txq->descs, txq->descs_phys);
netdev_tx_reset_queue(nq);
txq->descs = NULL; txq->descs = NULL;
txq->last_desc = 0; txq->last_desc = 0;
txq->next_desc_to_proc = 0; txq->next_desc_to_proc = 0;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment