]> git.ipfire.org Git - thirdparty/kernel/linux.git/commitdiff
net: ntb_netdev: Introduce per-queue context
authorKoichiro Den <den@valinux.co.jp>
Thu, 5 Mar 2026 15:56:36 +0000 (00:56 +0900)
committerJakub Kicinski <kuba@kernel.org>
Sat, 7 Mar 2026 03:15:20 +0000 (19:15 -0800)
Prepare ntb_netdev for multi-queue operation by moving queue-pair state
out of struct ntb_netdev.

Introduce struct ntb_netdev_queue to carry the ntb_transport_qp pointer,
the per-QP TX timer and queue id. Pass this object as the callback
context and convert the RX/TX handlers and link event path accordingly.

The probe path allocates a fixed upper bound for netdev queues while
instantiating only a single ntb_transport queue pair, preserving the
previous behavior. Also store client_dev for future queue pair
creation/removal via the ntb_transport API.

Signed-off-by: Koichiro Den <den@valinux.co.jp>
Link: https://patch.msgid.link/20260305155639.1885517-2-den@valinux.co.jp
Signed-off-by: Jakub Kicinski <kuba@kernel.org>
drivers/net/ntb_netdev.c

index fbeae05817e9ff05692e2ac6fb16a804b853fb36..4b65e938d549fa742bf3b54725338ecd226b5153 100644 (file)
@@ -53,6 +53,7 @@
 #include <linux/pci.h>
 #include <linux/ntb.h>
 #include <linux/ntb_transport.h>
+#include <linux/slab.h>
 
 #define NTB_NETDEV_VER "0.7"
 
@@ -70,11 +71,24 @@ static unsigned int tx_start = 10;
 /* Number of descriptors still available before stop upper layer tx */
 static unsigned int tx_stop = 5;
 
+#define NTB_NETDEV_MAX_QUEUES          64
+#define NTB_NETDEV_DEFAULT_QUEUES      1
+
+struct ntb_netdev;
+
+struct ntb_netdev_queue {
+       struct ntb_netdev *ntdev;
+       struct ntb_transport_qp *qp;
+       struct timer_list tx_timer;
+       u16 qid;
+};
+
 struct ntb_netdev {
        struct pci_dev *pdev;
+       struct device *client_dev;
        struct net_device *ndev;
-       struct ntb_transport_qp *qp;
-       struct timer_list tx_timer;
+       unsigned int num_queues;
+       struct ntb_netdev_queue *queues;
 };
 
 #define        NTB_TX_TIMEOUT_MS       1000
@@ -82,14 +96,17 @@ struct ntb_netdev {
 
 static void ntb_netdev_event_handler(void *data, int link_is_up)
 {
-       struct net_device *ndev = data;
-       struct ntb_netdev *dev = netdev_priv(ndev);
+       struct ntb_netdev_queue *q = data;
+       struct ntb_netdev *dev = q->ntdev;
+       struct net_device *ndev;
+
+       ndev = dev->ndev;
 
-       netdev_dbg(ndev, "Event %x, Link %x\n", link_is_up,
-                  ntb_transport_link_query(dev->qp));
+       netdev_dbg(ndev, "Event %x, Link %x, qp %u\n", link_is_up,
+                  ntb_transport_link_query(q->qp), q->qid);
 
        if (link_is_up) {
-               if (ntb_transport_link_query(dev->qp))
+               if (ntb_transport_link_query(q->qp))
                        netif_carrier_on(ndev);
        } else {
                netif_carrier_off(ndev);
@@ -99,10 +116,13 @@ static void ntb_netdev_event_handler(void *data, int link_is_up)
 static void ntb_netdev_rx_handler(struct ntb_transport_qp *qp, void *qp_data,
                                  void *data, int len)
 {
-       struct net_device *ndev = qp_data;
+       struct ntb_netdev_queue *q = qp_data;
+       struct ntb_netdev *dev = q->ntdev;
+       struct net_device *ndev;
        struct sk_buff *skb;
        int rc;
 
+       ndev = dev->ndev;
        skb = data;
        if (!skb)
                return;
@@ -118,6 +138,7 @@ static void ntb_netdev_rx_handler(struct ntb_transport_qp *qp, void *qp_data,
        skb_put(skb, len);
        skb->protocol = eth_type_trans(skb, ndev);
        skb->ip_summed = CHECKSUM_NONE;
+       skb_record_rx_queue(skb, q->qid);
 
        if (netif_rx(skb) == NET_RX_DROP) {
                ndev->stats.rx_errors++;
@@ -144,42 +165,43 @@ enqueue_again:
 }
 
 static int __ntb_netdev_maybe_stop_tx(struct net_device *netdev,
-                                     struct ntb_transport_qp *qp, int size)
+                                     struct ntb_netdev_queue *q, int size)
 {
-       struct ntb_netdev *dev = netdev_priv(netdev);
+       netif_stop_subqueue(netdev, q->qid);
 
-       netif_stop_queue(netdev);
        /* Make sure to see the latest value of ntb_transport_tx_free_entry()
         * since the queue was last started.
         */
        smp_mb();
 
-       if (likely(ntb_transport_tx_free_entry(qp) < size)) {
-               mod_timer(&dev->tx_timer, jiffies + usecs_to_jiffies(tx_time));
+       if (likely(ntb_transport_tx_free_entry(q->qp) < size)) {
+               mod_timer(&q->tx_timer, jiffies + usecs_to_jiffies(tx_time));
                return -EBUSY;
        }
 
-       netif_start_queue(netdev);
+       netif_start_subqueue(netdev, q->qid);
        return 0;
 }
 
 static int ntb_netdev_maybe_stop_tx(struct net_device *ndev,
-                                   struct ntb_transport_qp *qp, int size)
+                                   struct ntb_netdev_queue *q, int size)
 {
-       if (netif_queue_stopped(ndev) ||
-           (ntb_transport_tx_free_entry(qp) >= size))
+       if (__netif_subqueue_stopped(ndev, q->qid) ||
+           (ntb_transport_tx_free_entry(q->qp) >= size))
                return 0;
 
-       return __ntb_netdev_maybe_stop_tx(ndev, qp, size);
+       return __ntb_netdev_maybe_stop_tx(ndev, q, size);
 }
 
 static void ntb_netdev_tx_handler(struct ntb_transport_qp *qp, void *qp_data,
                                  void *data, int len)
 {
-       struct net_device *ndev = qp_data;
+       struct ntb_netdev_queue *q = qp_data;
+       struct ntb_netdev *dev = q->ntdev;
+       struct net_device *ndev;
        struct sk_buff *skb;
-       struct ntb_netdev *dev = netdev_priv(ndev);
 
+       ndev = dev->ndev;
        skb = data;
        if (!skb || !ndev)
                return;
@@ -194,13 +216,13 @@ static void ntb_netdev_tx_handler(struct ntb_transport_qp *qp, void *qp_data,
 
        dev_kfree_skb_any(skb);
 
-       if (ntb_transport_tx_free_entry(dev->qp) >= tx_start) {
+       if (ntb_transport_tx_free_entry(qp) >= tx_start) {
                /* Make sure anybody stopping the queue after this sees the new
                 * value of ntb_transport_tx_free_entry()
                 */
                smp_mb();
-               if (netif_queue_stopped(ndev))
-                       netif_wake_queue(ndev);
+               if (__netif_subqueue_stopped(ndev, q->qid))
+                       netif_wake_subqueue(ndev, q->qid);
        }
 }
 
@@ -208,16 +230,20 @@ static netdev_tx_t ntb_netdev_start_xmit(struct sk_buff *skb,
                                         struct net_device *ndev)
 {
        struct ntb_netdev *dev = netdev_priv(ndev);
+       u16 qid = skb_get_queue_mapping(skb);
+       struct ntb_netdev_queue *q;
        int rc;
 
-       ntb_netdev_maybe_stop_tx(ndev, dev->qp, tx_stop);
+       q = &dev->queues[qid];
+
+       ntb_netdev_maybe_stop_tx(ndev, q, tx_stop);
 
-       rc = ntb_transport_tx_enqueue(dev->qp, skb, skb->data, skb->len);
+       rc = ntb_transport_tx_enqueue(q->qp, skb, skb->data, skb->len);
        if (rc)
                goto err;
 
        /* check for next submit */
-       ntb_netdev_maybe_stop_tx(ndev, dev->qp, tx_stop);
+       ntb_netdev_maybe_stop_tx(ndev, q, tx_stop);
 
        return NETDEV_TX_OK;
 
@@ -229,80 +255,104 @@ err:
 
 static void ntb_netdev_tx_timer(struct timer_list *t)
 {
-       struct ntb_netdev *dev = timer_container_of(dev, t, tx_timer);
-       struct net_device *ndev = dev->ndev;
+       struct ntb_netdev_queue *q = timer_container_of(q, t, tx_timer);
+       struct ntb_netdev *dev = q->ntdev;
+       struct net_device *ndev;
+
+       ndev = dev->ndev;
 
-       if (ntb_transport_tx_free_entry(dev->qp) < tx_stop) {
-               mod_timer(&dev->tx_timer, jiffies + usecs_to_jiffies(tx_time));
+       if (ntb_transport_tx_free_entry(q->qp) < tx_stop) {
+               mod_timer(&q->tx_timer, jiffies + usecs_to_jiffies(tx_time));
        } else {
                /* Make sure anybody stopping the queue after this sees the new
                 * value of ntb_transport_tx_free_entry()
                 */
                smp_mb();
-               if (netif_queue_stopped(ndev))
-                       netif_wake_queue(ndev);
+               if (__netif_subqueue_stopped(ndev, q->qid))
+                       netif_wake_subqueue(ndev, q->qid);
        }
 }
 
 static int ntb_netdev_open(struct net_device *ndev)
 {
        struct ntb_netdev *dev = netdev_priv(ndev);
+       struct ntb_netdev_queue *queue;
        struct sk_buff *skb;
-       int rc, i, len;
-
-       /* Add some empty rx bufs */
-       for (i = 0; i < NTB_RXQ_SIZE; i++) {
-               skb = netdev_alloc_skb(ndev, ndev->mtu + ETH_HLEN);
-               if (!skb) {
-                       rc = -ENOMEM;
-                       goto err;
-               }
+       int rc = 0, i, len;
+       unsigned int q;
 
-               rc = ntb_transport_rx_enqueue(dev->qp, skb, skb->data,
-                                             ndev->mtu + ETH_HLEN);
-               if (rc) {
-                       dev_kfree_skb(skb);
-                       goto err;
+       /* Add some empty rx bufs for each queue */
+       for (q = 0; q < dev->num_queues; q++) {
+               queue = &dev->queues[q];
+
+               for (i = 0; i < NTB_RXQ_SIZE; i++) {
+                       skb = netdev_alloc_skb(ndev, ndev->mtu + ETH_HLEN);
+                       if (!skb) {
+                               rc = -ENOMEM;
+                               goto err;
+                       }
+
+                       rc = ntb_transport_rx_enqueue(queue->qp, skb, skb->data,
+                                                     ndev->mtu + ETH_HLEN);
+                       if (rc) {
+                               dev_kfree_skb(skb);
+                               goto err;
+                       }
                }
-       }
 
-       timer_setup(&dev->tx_timer, ntb_netdev_tx_timer, 0);
+               timer_setup(&queue->tx_timer, ntb_netdev_tx_timer, 0);
+       }
 
        netif_carrier_off(ndev);
-       ntb_transport_link_up(dev->qp);
+
+       for (q = 0; q < dev->num_queues; q++)
+               ntb_transport_link_up(dev->queues[q].qp);
+
        netif_start_queue(ndev);
 
        return 0;
 
 err:
-       while ((skb = ntb_transport_rx_remove(dev->qp, &len)))
-               dev_kfree_skb(skb);
+       for (q = 0; q < dev->num_queues; q++) {
+               queue = &dev->queues[q];
+
+               while ((skb = ntb_transport_rx_remove(queue->qp, &len)))
+                       dev_kfree_skb(skb);
+       }
        return rc;
 }
 
 static int ntb_netdev_close(struct net_device *ndev)
 {
        struct ntb_netdev *dev = netdev_priv(ndev);
+       struct ntb_netdev_queue *queue;
        struct sk_buff *skb;
+       unsigned int q;
        int len;
 
-       ntb_transport_link_down(dev->qp);
 
-       while ((skb = ntb_transport_rx_remove(dev->qp, &len)))
-               dev_kfree_skb(skb);
+       for (q = 0; q < dev->num_queues; q++) {
+               queue = &dev->queues[q];
+
+               ntb_transport_link_down(queue->qp);
 
-       timer_delete_sync(&dev->tx_timer);
+               while ((skb = ntb_transport_rx_remove(queue->qp, &len)))
+                       dev_kfree_skb(skb);
 
+               timer_delete_sync(&queue->tx_timer);
+       }
        return 0;
 }
 
 static int ntb_netdev_change_mtu(struct net_device *ndev, int new_mtu)
 {
        struct ntb_netdev *dev = netdev_priv(ndev);
+       struct ntb_netdev_queue *queue;
        struct sk_buff *skb;
-       int len, rc;
+       unsigned int q, i;
+       int len, rc = 0;
 
-       if (new_mtu > ntb_transport_max_size(dev->qp) - ETH_HLEN)
+       if (new_mtu > ntb_transport_max_size(dev->queues[0].qp) - ETH_HLEN)
                return -EINVAL;
 
        if (!netif_running(ndev)) {
@@ -311,41 +361,54 @@ static int ntb_netdev_change_mtu(struct net_device *ndev, int new_mtu)
        }
 
        /* Bring down the link and dispose of posted rx entries */
-       ntb_transport_link_down(dev->qp);
+       for (q = 0; q < dev->num_queues; q++)
+               ntb_transport_link_down(dev->queues[q].qp);
 
        if (ndev->mtu < new_mtu) {
-               int i;
-
-               for (i = 0; (skb = ntb_transport_rx_remove(dev->qp, &len)); i++)
-                       dev_kfree_skb(skb);
+               for (q = 0; q < dev->num_queues; q++) {
+                       queue = &dev->queues[q];
 
-               for (; i; i--) {
-                       skb = netdev_alloc_skb(ndev, new_mtu + ETH_HLEN);
-                       if (!skb) {
-                               rc = -ENOMEM;
-                               goto err;
-                       }
-
-                       rc = ntb_transport_rx_enqueue(dev->qp, skb, skb->data,
-                                                     new_mtu + ETH_HLEN);
-                       if (rc) {
+                       for (i = 0;
+                            (skb = ntb_transport_rx_remove(queue->qp, &len));
+                            i++)
                                dev_kfree_skb(skb);
-                               goto err;
+
+                       for (; i; i--) {
+                               skb = netdev_alloc_skb(ndev,
+                                                      new_mtu + ETH_HLEN);
+                               if (!skb) {
+                                       rc = -ENOMEM;
+                                       goto err;
+                               }
+
+                               rc = ntb_transport_rx_enqueue(queue->qp, skb,
+                                                             skb->data,
+                                                             new_mtu +
+                                                             ETH_HLEN);
+                               if (rc) {
+                                       dev_kfree_skb(skb);
+                                       goto err;
+                               }
                        }
                }
        }
 
        WRITE_ONCE(ndev->mtu, new_mtu);
 
-       ntb_transport_link_up(dev->qp);
+       for (q = 0; q < dev->num_queues; q++)
+               ntb_transport_link_up(dev->queues[q].qp);
 
        return 0;
 
 err:
-       ntb_transport_link_down(dev->qp);
+       for (q = 0; q < dev->num_queues; q++) {
+               struct ntb_netdev_queue *queue = &dev->queues[q];
 
-       while ((skb = ntb_transport_rx_remove(dev->qp, &len)))
-               dev_kfree_skb(skb);
+               ntb_transport_link_down(queue->qp);
+
+               while ((skb = ntb_transport_rx_remove(queue->qp, &len)))
+                       dev_kfree_skb(skb);
+       }
 
        netdev_err(ndev, "Error changing MTU, device inoperable\n");
        return rc;
@@ -404,6 +467,7 @@ static int ntb_netdev_probe(struct device *client_dev)
        struct net_device *ndev;
        struct pci_dev *pdev;
        struct ntb_netdev *dev;
+       unsigned int q;
        int rc;
 
        ntb = dev_ntb(client_dev->parent);
@@ -411,7 +475,7 @@ static int ntb_netdev_probe(struct device *client_dev)
        if (!pdev)
                return -ENODEV;
 
-       ndev = alloc_etherdev(sizeof(*dev));
+       ndev = alloc_etherdev_mq(sizeof(*dev), NTB_NETDEV_MAX_QUEUES);
        if (!ndev)
                return -ENOMEM;
 
@@ -420,6 +484,16 @@ static int ntb_netdev_probe(struct device *client_dev)
        dev = netdev_priv(ndev);
        dev->ndev = ndev;
        dev->pdev = pdev;
+       dev->client_dev = client_dev;
+       dev->num_queues = 0;
+
+       dev->queues = kzalloc_objs(*dev->queues, NTB_NETDEV_MAX_QUEUES,
+                                  GFP_KERNEL);
+       if (!dev->queues) {
+               rc = -ENOMEM;
+               goto err_free_netdev;
+       }
+
        ndev->features = NETIF_F_HIGHDMA;
 
        ndev->priv_flags |= IFF_LIVE_ADDR_CHANGE;
@@ -436,26 +510,47 @@ static int ntb_netdev_probe(struct device *client_dev)
        ndev->min_mtu = 0;
        ndev->max_mtu = ETH_MAX_MTU;
 
-       dev->qp = ntb_transport_create_queue(ndev, client_dev,
-                                            &ntb_netdev_handlers);
-       if (!dev->qp) {
+       for (q = 0; q < NTB_NETDEV_DEFAULT_QUEUES; q++) {
+               struct ntb_netdev_queue *queue = &dev->queues[q];
+
+               queue->ntdev = dev;
+               queue->qid = q;
+               queue->qp = ntb_transport_create_queue(queue, client_dev,
+                                                      &ntb_netdev_handlers);
+               if (!queue->qp)
+                       break;
+
+               dev->num_queues++;
+       }
+
+       if (!dev->num_queues) {
                rc = -EIO;
-               goto err;
+               goto err_free_queues;
        }
 
-       ndev->mtu = ntb_transport_max_size(dev->qp) - ETH_HLEN;
+       rc = netif_set_real_num_queues(ndev, dev->num_queues, dev->num_queues);
+       if (rc)
+               goto err_free_qps;
+
+       ndev->mtu = ntb_transport_max_size(dev->queues[0].qp) - ETH_HLEN;
 
        rc = register_netdev(ndev);
        if (rc)
-               goto err1;
+               goto err_free_qps;
 
        dev_set_drvdata(client_dev, ndev);
-       dev_info(&pdev->dev, "%s created\n", ndev->name);
+       dev_info(&pdev->dev, "%s created with %u queue pairs\n",
+                ndev->name, dev->num_queues);
        return 0;
 
-err1:
-       ntb_transport_free_queue(dev->qp);
-err:
+err_free_qps:
+       for (q = 0; q < dev->num_queues; q++)
+               ntb_transport_free_queue(dev->queues[q].qp);
+
+err_free_queues:
+       kfree(dev->queues);
+
+err_free_netdev:
        free_netdev(ndev);
        return rc;
 }
@@ -464,9 +559,13 @@ static void ntb_netdev_remove(struct device *client_dev)
 {
        struct net_device *ndev = dev_get_drvdata(client_dev);
        struct ntb_netdev *dev = netdev_priv(ndev);
+       unsigned int q;
 
        unregister_netdev(ndev);
-       ntb_transport_free_queue(dev->qp);
+       for (q = 0; q < dev->num_queues; q++)
+               ntb_transport_free_queue(dev->queues[q].qp);
+
+       kfree(dev->queues);
        free_netdev(ndev);
 }