Blame SOURCES/0006-net-virtio-implement-Rx-path-for-packed-queues.patch

2c1bf6
From a1168f29a051eba2344407d72267b5d5f648d80c Mon Sep 17 00:00:00 2001
2c1bf6
From: Jens Freimann <jfreimann@redhat.com>
2c1bf6
Date: Mon, 17 Dec 2018 22:31:35 +0100
2c1bf6
Subject: [PATCH 06/18] net/virtio: implement Rx path for packed queues
2c1bf6
2c1bf6
[ upstream commit a76290c8f1cf9c4774c23592921302a04a90bded ]
2c1bf6
2c1bf6
Implement the receive part.
2c1bf6
2c1bf6
Signed-off-by: Jens Freimann <jfreimann@redhat.com>
2c1bf6
Signed-off-by: Tiwei Bie <tiwei.bie@intel.com>
2c1bf6
Reviewed-by: Maxime Coquelin <maxime.coquelin@redhat.com>
2c1bf6
(cherry picked from commit a76290c8f1cf9c4774c23592921302a04a90bded)
2c1bf6
Signed-off-by: Jens Freimann <jfreimann@redhat.com>
2c1bf6
---
2c1bf6
 drivers/net/virtio/virtio_ethdev.c |  56 +++--
2c1bf6
 drivers/net/virtio/virtio_ethdev.h |   5 +
2c1bf6
 drivers/net/virtio/virtio_rxtx.c   | 375 ++++++++++++++++++++++++++++-
2c1bf6
 drivers/net/virtio/virtqueue.c     |  43 +++-
2c1bf6
 4 files changed, 457 insertions(+), 22 deletions(-)
2c1bf6
2c1bf6
diff --git a/drivers/net/virtio/virtio_ethdev.c b/drivers/net/virtio/virtio_ethdev.c
2c1bf6
index 6023d6f2c..4ef1da393 100644
2c1bf6
--- a/drivers/net/virtio/virtio_ethdev.c
2c1bf6
+++ b/drivers/net/virtio/virtio_ethdev.c
2c1bf6
@@ -1363,24 +1363,40 @@ set_rxtx_funcs(struct rte_eth_dev *eth_dev)
2c1bf6
 		}
2c1bf6
 	}
2c1bf6
 
2c1bf6
-	if (hw->use_simple_rx) {
2c1bf6
-		PMD_INIT_LOG(INFO, "virtio: using simple Rx path on port %u",
2c1bf6
-			eth_dev->data->port_id);
2c1bf6
-		eth_dev->rx_pkt_burst = virtio_recv_pkts_vec;
2c1bf6
-	} else if (hw->use_inorder_rx) {
2c1bf6
-		PMD_INIT_LOG(INFO,
2c1bf6
-			"virtio: using inorder mergeable buffer Rx path on port %u",
2c1bf6
-			eth_dev->data->port_id);
2c1bf6
-		eth_dev->rx_pkt_burst = &virtio_recv_mergeable_pkts_inorder;
2c1bf6
-	} else if (vtpci_with_feature(hw, VIRTIO_NET_F_MRG_RXBUF)) {
2c1bf6
-		PMD_INIT_LOG(INFO,
2c1bf6
-			"virtio: using mergeable buffer Rx path on port %u",
2c1bf6
-			eth_dev->data->port_id);
2c1bf6
-		eth_dev->rx_pkt_burst = &virtio_recv_mergeable_pkts;
2c1bf6
+	if (vtpci_packed_queue(hw)) {
2c1bf6
+		if (vtpci_with_feature(hw, VIRTIO_NET_F_MRG_RXBUF)) {
2c1bf6
+			PMD_INIT_LOG(INFO,
2c1bf6
+				"virtio: using packed ring mergeable buffer Rx path on port %u",
2c1bf6
+				eth_dev->data->port_id);
2c1bf6
+			eth_dev->rx_pkt_burst =
2c1bf6
+				&virtio_recv_mergeable_pkts_packed;
2c1bf6
+		} else {
2c1bf6
+			PMD_INIT_LOG(INFO,
2c1bf6
+				"virtio: using packed ring standard Rx path on port %u",
2c1bf6
+				eth_dev->data->port_id);
2c1bf6
+			eth_dev->rx_pkt_burst = &virtio_recv_pkts_packed;
2c1bf6
+		}
2c1bf6
 	} else {
2c1bf6
-		PMD_INIT_LOG(INFO, "virtio: using standard Rx path on port %u",
2c1bf6
-			eth_dev->data->port_id);
2c1bf6
-		eth_dev->rx_pkt_burst = &virtio_recv_pkts;
2c1bf6
+		if (hw->use_simple_rx) {
2c1bf6
+			PMD_INIT_LOG(INFO, "virtio: using simple Rx path on port %u",
2c1bf6
+				eth_dev->data->port_id);
2c1bf6
+			eth_dev->rx_pkt_burst = virtio_recv_pkts_vec;
2c1bf6
+		} else if (hw->use_inorder_rx) {
2c1bf6
+			PMD_INIT_LOG(INFO,
2c1bf6
+				"virtio: using inorder mergeable buffer Rx path on port %u",
2c1bf6
+				eth_dev->data->port_id);
2c1bf6
+			eth_dev->rx_pkt_burst =
2c1bf6
+				&virtio_recv_mergeable_pkts_inorder;
2c1bf6
+		} else if (vtpci_with_feature(hw, VIRTIO_NET_F_MRG_RXBUF)) {
2c1bf6
+			PMD_INIT_LOG(INFO,
2c1bf6
+				"virtio: using mergeable buffer Rx path on port %u",
2c1bf6
+				eth_dev->data->port_id);
2c1bf6
+			eth_dev->rx_pkt_burst = &virtio_recv_mergeable_pkts;
2c1bf6
+		} else {
2c1bf6
+			PMD_INIT_LOG(INFO, "virtio: using standard Rx path on port %u",
2c1bf6
+				eth_dev->data->port_id);
2c1bf6
+			eth_dev->rx_pkt_burst = &virtio_recv_pkts;
2c1bf6
+		}
2c1bf6
 	}
2c1bf6
 
2c1bf6
 }
2c1bf6
@@ -1944,6 +1960,12 @@ virtio_dev_configure(struct rte_eth_dev *dev)
2c1bf6
 		}
2c1bf6
 	}
2c1bf6
 
2c1bf6
+	if (vtpci_packed_queue(hw)) {
2c1bf6
+		hw->use_simple_rx = 0;
2c1bf6
+		hw->use_inorder_rx = 0;
2c1bf6
+		hw->use_inorder_tx = 0;
2c1bf6
+	}
2c1bf6
+
2c1bf6
 #if defined RTE_ARCH_ARM64 || defined RTE_ARCH_ARM
2c1bf6
 	if (!rte_cpu_get_flag_enabled(RTE_CPUFLAG_NEON)) {
2c1bf6
 		hw->use_simple_rx = 0;
2c1bf6
diff --git a/drivers/net/virtio/virtio_ethdev.h b/drivers/net/virtio/virtio_ethdev.h
2c1bf6
index 05d355180..88b8c42a3 100644
2c1bf6
--- a/drivers/net/virtio/virtio_ethdev.h
2c1bf6
+++ b/drivers/net/virtio/virtio_ethdev.h
2c1bf6
@@ -73,10 +73,15 @@ int virtio_dev_tx_queue_setup_finish(struct rte_eth_dev *dev,
2c1bf6
 
2c1bf6
 uint16_t virtio_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts,
2c1bf6
 		uint16_t nb_pkts);
2c1bf6
+uint16_t virtio_recv_pkts_packed(void *rx_queue, struct rte_mbuf **rx_pkts,
2c1bf6
+		uint16_t nb_pkts);
2c1bf6
 
2c1bf6
 uint16_t virtio_recv_mergeable_pkts(void *rx_queue, struct rte_mbuf **rx_pkts,
2c1bf6
 		uint16_t nb_pkts);
2c1bf6
 
2c1bf6
+uint16_t virtio_recv_mergeable_pkts_packed(void *rx_queue,
2c1bf6
+		struct rte_mbuf **rx_pkts, uint16_t nb_pkts);
2c1bf6
+
2c1bf6
 uint16_t virtio_recv_mergeable_pkts_inorder(void *rx_queue,
2c1bf6
 		struct rte_mbuf **rx_pkts, uint16_t nb_pkts);
2c1bf6
 
2c1bf6
diff --git a/drivers/net/virtio/virtio_rxtx.c b/drivers/net/virtio/virtio_rxtx.c
2c1bf6
index ab74917a8..0bcf3b08a 100644
2c1bf6
--- a/drivers/net/virtio/virtio_rxtx.c
2c1bf6
+++ b/drivers/net/virtio/virtio_rxtx.c
2c1bf6
@@ -31,6 +31,7 @@
2c1bf6
 #include "virtqueue.h"
2c1bf6
 #include "virtio_rxtx.h"
2c1bf6
 #include "virtio_rxtx_simple.h"
2c1bf6
+#include "virtio_ring.h"
2c1bf6
 
2c1bf6
 #ifdef RTE_LIBRTE_VIRTIO_DEBUG_DUMP
2c1bf6
 #define VIRTIO_DUMP_PACKET(m, len) rte_pktmbuf_dump(stdout, m, len)
2c1bf6
@@ -105,6 +106,47 @@ vq_ring_free_id_packed(struct virtqueue *vq, uint16_t id)
2c1bf6
 	dxp->next = VQ_RING_DESC_CHAIN_END;
2c1bf6
 }
2c1bf6
 
2c1bf6
+static uint16_t
2c1bf6
+virtqueue_dequeue_burst_rx_packed(struct virtqueue *vq,
2c1bf6
+				  struct rte_mbuf **rx_pkts,
2c1bf6
+				  uint32_t *len,
2c1bf6
+				  uint16_t num)
2c1bf6
+{
2c1bf6
+	struct rte_mbuf *cookie;
2c1bf6
+	uint16_t used_idx;
2c1bf6
+	uint16_t id;
2c1bf6
+	struct vring_packed_desc *desc;
2c1bf6
+	uint16_t i;
2c1bf6
+
2c1bf6
+	desc = vq->ring_packed.desc_packed;
2c1bf6
+
2c1bf6
+	for (i = 0; i < num; i++) {
2c1bf6
+		used_idx = vq->vq_used_cons_idx;
2c1bf6
+		if (!desc_is_used(&desc[used_idx], vq))
2c1bf6
+			return i;
2c1bf6
+		len[i] = desc[used_idx].len;
2c1bf6
+		id = desc[used_idx].id;
2c1bf6
+		cookie = (struct rte_mbuf *)vq->vq_descx[id].cookie;
2c1bf6
+		if (unlikely(cookie == NULL)) {
2c1bf6
+			PMD_DRV_LOG(ERR, "vring descriptor with no mbuf cookie at %u",
2c1bf6
+				vq->vq_used_cons_idx);
2c1bf6
+			break;
2c1bf6
+		}
2c1bf6
+		rte_prefetch0(cookie);
2c1bf6
+		rte_packet_prefetch(rte_pktmbuf_mtod(cookie, void *));
2c1bf6
+		rx_pkts[i] = cookie;
2c1bf6
+
2c1bf6
+		vq->vq_free_cnt++;
2c1bf6
+		vq->vq_used_cons_idx++;
2c1bf6
+		if (vq->vq_used_cons_idx >= vq->vq_nentries) {
2c1bf6
+			vq->vq_used_cons_idx -= vq->vq_nentries;
2c1bf6
+			vq->used_wrap_counter ^= 1;
2c1bf6
+		}
2c1bf6
+	}
2c1bf6
+
2c1bf6
+	return i;
2c1bf6
+}
2c1bf6
+
2c1bf6
 static uint16_t
2c1bf6
 virtqueue_dequeue_burst_rx(struct virtqueue *vq, struct rte_mbuf **rx_pkts,
2c1bf6
 			   uint32_t *len, uint16_t num)
2c1bf6
@@ -350,6 +392,51 @@ virtqueue_enqueue_recv_refill(struct virtqueue *vq, struct rte_mbuf *cookie)
2c1bf6
 	return 0;
2c1bf6
 }
2c1bf6
 
2c1bf6
+static inline int
2c1bf6
+virtqueue_enqueue_recv_refill_packed(struct virtqueue *vq,
2c1bf6
+				     struct rte_mbuf **cookie, uint16_t num)
2c1bf6
+{
2c1bf6
+	struct vring_packed_desc *start_dp = vq->ring_packed.desc_packed;
2c1bf6
+	uint16_t flags = VRING_DESC_F_WRITE | vq->avail_used_flags;
2c1bf6
+	struct virtio_hw *hw = vq->hw;
2c1bf6
+	struct vq_desc_extra *dxp;
2c1bf6
+	uint16_t idx;
2c1bf6
+	int i;
2c1bf6
+
2c1bf6
+	if (unlikely(vq->vq_free_cnt == 0))
2c1bf6
+		return -ENOSPC;
2c1bf6
+	if (unlikely(vq->vq_free_cnt < num))
2c1bf6
+		return -EMSGSIZE;
2c1bf6
+
2c1bf6
+	for (i = 0; i < num; i++) {
2c1bf6
+		idx = vq->vq_avail_idx;
2c1bf6
+		dxp = &vq->vq_descx[idx];
2c1bf6
+		dxp->cookie = (void *)cookie[i];
2c1bf6
+		dxp->ndescs = 1;
2c1bf6
+
2c1bf6
+		start_dp[idx].addr = VIRTIO_MBUF_ADDR(cookie[i], vq) +
2c1bf6
+				RTE_PKTMBUF_HEADROOM - hw->vtnet_hdr_size;
2c1bf6
+		start_dp[idx].len = cookie[i]->buf_len - RTE_PKTMBUF_HEADROOM
2c1bf6
+					+ hw->vtnet_hdr_size;
2c1bf6
+
2c1bf6
+		vq->vq_desc_head_idx = dxp->next;
2c1bf6
+		if (vq->vq_desc_head_idx == VQ_RING_DESC_CHAIN_END)
2c1bf6
+			vq->vq_desc_tail_idx = vq->vq_desc_head_idx;
2c1bf6
+		rte_smp_wmb();
2c1bf6
+		start_dp[idx].flags = flags;
2c1bf6
+		if (++vq->vq_avail_idx >= vq->vq_nentries) {
2c1bf6
+			vq->vq_avail_idx -= vq->vq_nentries;
2c1bf6
+			vq->avail_wrap_counter ^= 1;
2c1bf6
+			vq->avail_used_flags =
2c1bf6
+				VRING_DESC_F_AVAIL(vq->avail_wrap_counter) |
2c1bf6
+				VRING_DESC_F_USED(!vq->avail_wrap_counter);
2c1bf6
+			flags = VRING_DESC_F_WRITE | vq->avail_used_flags;
2c1bf6
+		}
2c1bf6
+	}
2c1bf6
+	vq->vq_free_cnt = (uint16_t)(vq->vq_free_cnt - num);
2c1bf6
+	return 0;
2c1bf6
+}
2c1bf6
+
2c1bf6
 /* When doing TSO, the IP length is not included in the pseudo header
2c1bf6
  * checksum of the packet given to the PMD, but for virtio it is
2c1bf6
  * expected.
2c1bf6
@@ -801,7 +888,11 @@ virtio_dev_rx_queue_setup_finish(struct rte_eth_dev *dev, uint16_t queue_idx)
2c1bf6
 				break;
2c1bf6
 
2c1bf6
 			/* Enqueue allocated buffers */
2c1bf6
-			error = virtqueue_enqueue_recv_refill(vq, m);
2c1bf6
+			if (vtpci_packed_queue(vq->hw))
2c1bf6
+				error = virtqueue_enqueue_recv_refill_packed(vq,
2c1bf6
+						&m, 1);
2c1bf6
+			else
2c1bf6
+				error = virtqueue_enqueue_recv_refill(vq, m);
2c1bf6
 			if (error) {
2c1bf6
 				rte_pktmbuf_free(m);
2c1bf6
 				break;
2c1bf6
@@ -809,7 +900,8 @@ virtio_dev_rx_queue_setup_finish(struct rte_eth_dev *dev, uint16_t queue_idx)
2c1bf6
 			nbufs++;
2c1bf6
 		}
2c1bf6
 
2c1bf6
-		vq_update_avail_idx(vq);
2c1bf6
+		if (!vtpci_packed_queue(vq->hw))
2c1bf6
+			vq_update_avail_idx(vq);
2c1bf6
 	}
2c1bf6
 
2c1bf6
 	PMD_INIT_LOG(DEBUG, "Allocated %d bufs", nbufs);
2c1bf6
@@ -896,7 +988,10 @@ virtio_discard_rxbuf(struct virtqueue *vq, struct rte_mbuf *m)
2c1bf6
 	 * Requeue the discarded mbuf. This should always be
2c1bf6
 	 * successful since it was just dequeued.
2c1bf6
 	 */
2c1bf6
-	error = virtqueue_enqueue_recv_refill(vq, m);
2c1bf6
+	if (vtpci_packed_queue(vq->hw))
2c1bf6
+		error = virtqueue_enqueue_recv_refill_packed(vq, &m, 1);
2c1bf6
+	else
2c1bf6
+		error = virtqueue_enqueue_recv_refill(vq, m);
2c1bf6
 
2c1bf6
 	if (unlikely(error)) {
2c1bf6
 		RTE_LOG(ERR, PMD, "cannot requeue discarded mbuf");
2c1bf6
@@ -1135,6 +1230,104 @@ virtio_recv_pkts(void *rx_queue, struct rte_mbuf **rx_pkts, uint16_t nb_pkts)
2c1bf6
 	return nb_rx;
2c1bf6
 }
2c1bf6
 
2c1bf6
+uint16_t
2c1bf6
+virtio_recv_pkts_packed(void *rx_queue, struct rte_mbuf **rx_pkts,
2c1bf6
+			uint16_t nb_pkts)
2c1bf6
+{
2c1bf6
+	struct virtnet_rx *rxvq = rx_queue;
2c1bf6
+	struct virtqueue *vq = rxvq->vq;
2c1bf6
+	struct virtio_hw *hw = vq->hw;
2c1bf6
+	struct rte_mbuf *rxm, *new_mbuf;
2c1bf6
+	uint16_t num, nb_rx;
2c1bf6
+	uint32_t len[VIRTIO_MBUF_BURST_SZ];
2c1bf6
+	struct rte_mbuf *rcv_pkts[VIRTIO_MBUF_BURST_SZ];
2c1bf6
+	int error;
2c1bf6
+	uint32_t i, nb_enqueued;
2c1bf6
+	uint32_t hdr_size;
2c1bf6
+	struct virtio_net_hdr *hdr;
2c1bf6
+
2c1bf6
+	nb_rx = 0;
2c1bf6
+	if (unlikely(hw->started == 0))
2c1bf6
+		return nb_rx;
2c1bf6
+
2c1bf6
+	num = RTE_MIN(VIRTIO_MBUF_BURST_SZ, nb_pkts);
2c1bf6
+	if (likely(num > DESC_PER_CACHELINE))
2c1bf6
+		num = num - ((vq->vq_used_cons_idx + num) % DESC_PER_CACHELINE);
2c1bf6
+
2c1bf6
+	num = virtqueue_dequeue_burst_rx_packed(vq, rcv_pkts, len, num);
2c1bf6
+	PMD_RX_LOG(DEBUG, "dequeue:%d", num);
2c1bf6
+
2c1bf6
+	nb_enqueued = 0;
2c1bf6
+	hdr_size = hw->vtnet_hdr_size;
2c1bf6
+
2c1bf6
+	for (i = 0; i < num; i++) {
2c1bf6
+		rxm = rcv_pkts[i];
2c1bf6
+
2c1bf6
+		PMD_RX_LOG(DEBUG, "packet len:%d", len[i]);
2c1bf6
+
2c1bf6
+		if (unlikely(len[i] < hdr_size + ETHER_HDR_LEN)) {
2c1bf6
+			PMD_RX_LOG(ERR, "Packet drop");
2c1bf6
+			nb_enqueued++;
2c1bf6
+			virtio_discard_rxbuf(vq, rxm);
2c1bf6
+			rxvq->stats.errors++;
2c1bf6
+			continue;
2c1bf6
+		}
2c1bf6
+
2c1bf6
+		rxm->port = rxvq->port_id;
2c1bf6
+		rxm->data_off = RTE_PKTMBUF_HEADROOM;
2c1bf6
+		rxm->ol_flags = 0;
2c1bf6
+		rxm->vlan_tci = 0;
2c1bf6
+
2c1bf6
+		rxm->pkt_len = (uint32_t)(len[i] - hdr_size);
2c1bf6
+		rxm->data_len = (uint16_t)(len[i] - hdr_size);
2c1bf6
+
2c1bf6
+		hdr = (struct virtio_net_hdr *)((char *)rxm->buf_addr +
2c1bf6
+			RTE_PKTMBUF_HEADROOM - hdr_size);
2c1bf6
+
2c1bf6
+		if (hw->vlan_strip)
2c1bf6
+			rte_vlan_strip(rxm);
2c1bf6
+
2c1bf6
+		if (hw->has_rx_offload && virtio_rx_offload(rxm, hdr) < 0) {
2c1bf6
+			virtio_discard_rxbuf(vq, rxm);
2c1bf6
+			rxvq->stats.errors++;
2c1bf6
+			continue;
2c1bf6
+		}
2c1bf6
+
2c1bf6
+		virtio_rx_stats_updated(rxvq, rxm);
2c1bf6
+
2c1bf6
+		rx_pkts[nb_rx++] = rxm;
2c1bf6
+	}
2c1bf6
+
2c1bf6
+	rxvq->stats.packets += nb_rx;
2c1bf6
+
2c1bf6
+	/* Allocate new mbuf for the used descriptor */
2c1bf6
+	while (likely(!virtqueue_full(vq))) {
2c1bf6
+		new_mbuf = rte_mbuf_raw_alloc(rxvq->mpool);
2c1bf6
+		if (unlikely(new_mbuf == NULL)) {
2c1bf6
+			struct rte_eth_dev *dev =
2c1bf6
+				&rte_eth_devices[rxvq->port_id];
2c1bf6
+			dev->data->rx_mbuf_alloc_failed++;
2c1bf6
+			break;
2c1bf6
+		}
2c1bf6
+		error = virtqueue_enqueue_recv_refill_packed(vq, &new_mbuf, 1);
2c1bf6
+		if (unlikely(error)) {
2c1bf6
+			rte_pktmbuf_free(new_mbuf);
2c1bf6
+			break;
2c1bf6
+		}
2c1bf6
+		nb_enqueued++;
2c1bf6
+	}
2c1bf6
+
2c1bf6
+	if (likely(nb_enqueued)) {
2c1bf6
+		if (unlikely(virtqueue_kick_prepare_packed(vq))) {
2c1bf6
+			virtqueue_notify(vq);
2c1bf6
+			PMD_RX_LOG(DEBUG, "Notified");
2c1bf6
+		}
2c1bf6
+	}
2c1bf6
+
2c1bf6
+	return nb_rx;
2c1bf6
+}
2c1bf6
+
2c1bf6
+
2c1bf6
 uint16_t
2c1bf6
 virtio_recv_mergeable_pkts_inorder(void *rx_queue,
2c1bf6
 			struct rte_mbuf **rx_pkts,
2c1bf6
@@ -1493,6 +1686,182 @@ virtio_recv_mergeable_pkts(void *rx_queue,
2c1bf6
 	return nb_rx;
2c1bf6
 }
2c1bf6
 
2c1bf6
+uint16_t
2c1bf6
+virtio_recv_mergeable_pkts_packed(void *rx_queue,
2c1bf6
+			struct rte_mbuf **rx_pkts,
2c1bf6
+			uint16_t nb_pkts)
2c1bf6
+{
2c1bf6
+	struct virtnet_rx *rxvq = rx_queue;
2c1bf6
+	struct virtqueue *vq = rxvq->vq;
2c1bf6
+	struct virtio_hw *hw = vq->hw;
2c1bf6
+	struct rte_mbuf *rxm;
2c1bf6
+	struct rte_mbuf *prev = NULL;
2c1bf6
+	uint16_t num, nb_rx = 0;
2c1bf6
+	uint32_t len[VIRTIO_MBUF_BURST_SZ];
2c1bf6
+	struct rte_mbuf *rcv_pkts[VIRTIO_MBUF_BURST_SZ];
2c1bf6
+	uint32_t nb_enqueued = 0;
2c1bf6
+	uint32_t seg_num = 0;
2c1bf6
+	uint32_t seg_res = 0;
2c1bf6
+	uint32_t hdr_size = hw->vtnet_hdr_size;
2c1bf6
+	int32_t i;
2c1bf6
+	int error;
2c1bf6
+
2c1bf6
+	if (unlikely(hw->started == 0))
2c1bf6
+		return nb_rx;
2c1bf6
+
2c1bf6
+
2c1bf6
+	num = nb_pkts;
2c1bf6
+	if (unlikely(num > VIRTIO_MBUF_BURST_SZ))
2c1bf6
+		num = VIRTIO_MBUF_BURST_SZ;
2c1bf6
+	if (likely(num > DESC_PER_CACHELINE))
2c1bf6
+		num = num - ((vq->vq_used_cons_idx + num) % DESC_PER_CACHELINE);
2c1bf6
+
2c1bf6
+	num = virtqueue_dequeue_burst_rx_packed(vq, rcv_pkts, len, num);
2c1bf6
+
2c1bf6
+	for (i = 0; i < num; i++) {
2c1bf6
+		struct virtio_net_hdr_mrg_rxbuf *header;
2c1bf6
+
2c1bf6
+		PMD_RX_LOG(DEBUG, "dequeue:%d", num);
2c1bf6
+		PMD_RX_LOG(DEBUG, "packet len:%d", len[i]);
2c1bf6
+
2c1bf6
+		rxm = rcv_pkts[i];
2c1bf6
+
2c1bf6
+		if (unlikely(len[i] < hdr_size + ETHER_HDR_LEN)) {
2c1bf6
+			PMD_RX_LOG(ERR, "Packet drop");
2c1bf6
+			nb_enqueued++;
2c1bf6
+			virtio_discard_rxbuf(vq, rxm);
2c1bf6
+			rxvq->stats.errors++;
2c1bf6
+			continue;
2c1bf6
+		}
2c1bf6
+
2c1bf6
+		header = (struct virtio_net_hdr_mrg_rxbuf *)((char *)
2c1bf6
+			  rxm->buf_addr + RTE_PKTMBUF_HEADROOM - hdr_size);
2c1bf6
+		seg_num = header->num_buffers;
2c1bf6
+
2c1bf6
+		if (seg_num == 0)
2c1bf6
+			seg_num = 1;
2c1bf6
+
2c1bf6
+		rxm->data_off = RTE_PKTMBUF_HEADROOM;
2c1bf6
+		rxm->nb_segs = seg_num;
2c1bf6
+		rxm->ol_flags = 0;
2c1bf6
+		rxm->vlan_tci = 0;
2c1bf6
+		rxm->pkt_len = (uint32_t)(len[i] - hdr_size);
2c1bf6
+		rxm->data_len = (uint16_t)(len[i] - hdr_size);
2c1bf6
+
2c1bf6
+		rxm->port = rxvq->port_id;
2c1bf6
+		rx_pkts[nb_rx] = rxm;
2c1bf6
+		prev = rxm;
2c1bf6
+
2c1bf6
+		if (hw->has_rx_offload &&
2c1bf6
+				virtio_rx_offload(rxm, &header->hdr) < 0) {
2c1bf6
+			virtio_discard_rxbuf(vq, rxm);
2c1bf6
+			rxvq->stats.errors++;
2c1bf6
+			continue;
2c1bf6
+		}
2c1bf6
+
2c1bf6
+		if (hw->vlan_strip)
2c1bf6
+			rte_vlan_strip(rx_pkts[nb_rx]);
2c1bf6
+
2c1bf6
+		seg_res = seg_num - 1;
2c1bf6
+
2c1bf6
+		/* Merge remaining segments */
2c1bf6
+		while (seg_res != 0 && i < (num - 1)) {
2c1bf6
+			i++;
2c1bf6
+
2c1bf6
+			rxm = rcv_pkts[i];
2c1bf6
+			rxm->data_off = RTE_PKTMBUF_HEADROOM - hdr_size;
2c1bf6
+			rxm->pkt_len = (uint32_t)(len[i]);
2c1bf6
+			rxm->data_len = (uint16_t)(len[i]);
2c1bf6
+
2c1bf6
+			rx_pkts[nb_rx]->pkt_len += (uint32_t)(len[i]);
2c1bf6
+			rx_pkts[nb_rx]->data_len += (uint16_t)(len[i]);
2c1bf6
+
2c1bf6
+			if (prev)
2c1bf6
+				prev->next = rxm;
2c1bf6
+
2c1bf6
+			prev = rxm;
2c1bf6
+			seg_res -= 1;
2c1bf6
+		}
2c1bf6
+
2c1bf6
+		if (!seg_res) {
2c1bf6
+			virtio_rx_stats_updated(rxvq, rx_pkts[nb_rx]);
2c1bf6
+			nb_rx++;
2c1bf6
+		}
2c1bf6
+	}
2c1bf6
+
2c1bf6
+	/* Last packet still need merge segments */
2c1bf6
+	while (seg_res != 0) {
2c1bf6
+		uint16_t rcv_cnt = RTE_MIN((uint16_t)seg_res,
2c1bf6
+					VIRTIO_MBUF_BURST_SZ);
2c1bf6
+		if (likely(vq->vq_free_cnt >= rcv_cnt)) {
2c1bf6
+			num = virtqueue_dequeue_burst_rx_packed(vq, rcv_pkts,
2c1bf6
+					len, rcv_cnt);
2c1bf6
+			uint16_t extra_idx = 0;
2c1bf6
+
2c1bf6
+			rcv_cnt = num;
2c1bf6
+
2c1bf6
+			while (extra_idx < rcv_cnt) {
2c1bf6
+				rxm = rcv_pkts[extra_idx];
2c1bf6
+
2c1bf6
+				rxm->data_off =
2c1bf6
+					RTE_PKTMBUF_HEADROOM - hdr_size;
2c1bf6
+				rxm->pkt_len = (uint32_t)(len[extra_idx]);
2c1bf6
+				rxm->data_len = (uint16_t)(len[extra_idx]);
2c1bf6
+
2c1bf6
+				prev->next = rxm;
2c1bf6
+				prev = rxm;
2c1bf6
+				rx_pkts[nb_rx]->pkt_len += len[extra_idx];
2c1bf6
+				rx_pkts[nb_rx]->data_len += len[extra_idx];
2c1bf6
+				extra_idx += 1;
2c1bf6
+			}
2c1bf6
+			seg_res -= rcv_cnt;
2c1bf6
+			if (!seg_res) {
2c1bf6
+				virtio_rx_stats_updated(rxvq, rx_pkts[nb_rx]);
2c1bf6
+				nb_rx++;
2c1bf6
+			}
2c1bf6
+		} else {
2c1bf6
+			PMD_RX_LOG(ERR,
2c1bf6
+					"No enough segments for packet.");
2c1bf6
+			if (prev)
2c1bf6
+				virtio_discard_rxbuf(vq, prev);
2c1bf6
+			rxvq->stats.errors++;
2c1bf6
+			break;
2c1bf6
+		}
2c1bf6
+	}
2c1bf6
+
2c1bf6
+	rxvq->stats.packets += nb_rx;
2c1bf6
+
2c1bf6
+	/* Allocate new mbuf for the used descriptor */
2c1bf6
+	if (likely(!virtqueue_full(vq))) {
2c1bf6
+		/* free_cnt may include mrg descs */
2c1bf6
+		uint16_t free_cnt = vq->vq_free_cnt;
2c1bf6
+		struct rte_mbuf *new_pkts[free_cnt];
2c1bf6
+
2c1bf6
+		if (!rte_pktmbuf_alloc_bulk(rxvq->mpool, new_pkts, free_cnt)) {
2c1bf6
+			error = virtqueue_enqueue_recv_refill_packed(vq,
2c1bf6
+					new_pkts, free_cnt);
2c1bf6
+			if (unlikely(error)) {
2c1bf6
+				for (i = 0; i < free_cnt; i++)
2c1bf6
+					rte_pktmbuf_free(new_pkts[i]);
2c1bf6
+			}
2c1bf6
+			nb_enqueued += free_cnt;
2c1bf6
+		} else {
2c1bf6
+			struct rte_eth_dev *dev =
2c1bf6
+				&rte_eth_devices[rxvq->port_id];
2c1bf6
+			dev->data->rx_mbuf_alloc_failed += free_cnt;
2c1bf6
+		}
2c1bf6
+	}
2c1bf6
+
2c1bf6
+	if (likely(nb_enqueued)) {
2c1bf6
+		if (unlikely(virtqueue_kick_prepare_packed(vq))) {
2c1bf6
+			virtqueue_notify(vq);
2c1bf6
+			PMD_RX_LOG(DEBUG, "Notified");
2c1bf6
+		}
2c1bf6
+	}
2c1bf6
+
2c1bf6
+	return nb_rx;
2c1bf6
+}
2c1bf6
+
2c1bf6
 uint16_t
2c1bf6
 virtio_xmit_pkts_packed(void *tx_queue, struct rte_mbuf **tx_pkts,
2c1bf6
 			uint16_t nb_pkts)
2c1bf6
diff --git a/drivers/net/virtio/virtqueue.c b/drivers/net/virtio/virtqueue.c
2c1bf6
index 56a77cc71..5b03f7a27 100644
2c1bf6
--- a/drivers/net/virtio/virtqueue.c
2c1bf6
+++ b/drivers/net/virtio/virtqueue.c
2c1bf6
@@ -54,9 +54,36 @@ virtqueue_detach_unused(struct virtqueue *vq)
2c1bf6
 	return NULL;
2c1bf6
 }
2c1bf6
 
2c1bf6
+/* Flush used descs */
2c1bf6
+static void
2c1bf6
+virtqueue_rxvq_flush_packed(struct virtqueue *vq)
2c1bf6
+{
2c1bf6
+	struct vq_desc_extra *dxp;
2c1bf6
+	uint16_t i;
2c1bf6
+
2c1bf6
+	struct vring_packed_desc *descs = vq->ring_packed.desc_packed;
2c1bf6
+	int cnt = 0;
2c1bf6
+
2c1bf6
+	i = vq->vq_used_cons_idx;
2c1bf6
+	while (desc_is_used(&descs[i], vq) && cnt++ < vq->vq_nentries) {
2c1bf6
+		dxp = &vq->vq_descx[descs[i].id];
2c1bf6
+		if (dxp->cookie != NULL) {
2c1bf6
+			rte_pktmbuf_free(dxp->cookie);
2c1bf6
+			dxp->cookie = NULL;
2c1bf6
+		}
2c1bf6
+		vq->vq_free_cnt++;
2c1bf6
+		vq->vq_used_cons_idx++;
2c1bf6
+		if (vq->vq_used_cons_idx >= vq->vq_nentries) {
2c1bf6
+			vq->vq_used_cons_idx -= vq->vq_nentries;
2c1bf6
+			vq->used_wrap_counter ^= 1;
2c1bf6
+		}
2c1bf6
+		i = vq->vq_used_cons_idx;
2c1bf6
+	}
2c1bf6
+}
2c1bf6
+
2c1bf6
 /* Flush the elements in the used ring. */
2c1bf6
-void
2c1bf6
-virtqueue_rxvq_flush(struct virtqueue *vq)
2c1bf6
+static void
2c1bf6
+virtqueue_rxvq_flush_split(struct virtqueue *vq)
2c1bf6
 {
2c1bf6
 	struct virtnet_rx *rxq = &vq->rxq;
2c1bf6
 	struct virtio_hw *hw = vq->hw;
2c1bf6
@@ -102,3 +129,15 @@ virtqueue_rxvq_flush(struct virtqueue *vq)
2c1bf6
 		}
2c1bf6
 	}
2c1bf6
 }
2c1bf6
+
2c1bf6
+/* Flush the elements in the used ring. */
2c1bf6
+void
2c1bf6
+virtqueue_rxvq_flush(struct virtqueue *vq)
2c1bf6
+{
2c1bf6
+	struct virtio_hw *hw = vq->hw;
2c1bf6
+
2c1bf6
+	if (vtpci_packed_queue(hw))
2c1bf6
+		virtqueue_rxvq_flush_packed(vq);
2c1bf6
+	else
2c1bf6
+		virtqueue_rxvq_flush_split(vq);
2c1bf6
+}
2c1bf6
-- 
2c1bf6
2.21.0
2c1bf6