[v3] vhost: allocate and free packets in bulk
Checks
Commit Message
Move allocation out further and perform all allocation in bulk. The same
goes for freeing packets. In the process, also rename
virtio_dev_pktmbuf_alloc to virtio_dev_pktmbuf_prep. This
function now receives an already allocated mbuf pointer.
Signed-off-by: Balazs Nemeth <bnemeth@redhat.com>
---
lib/librte_vhost/virtio_net.c | 58 +++++++++++++++++++++++------------
1 file changed, 38 insertions(+), 20 deletions(-)
Comments
On 4/16/21 10:18 AM, Balazs Nemeth wrote:
> Move allocation out further and perform all allocation in bulk. The same
> goes for freeing packets. In the process, also rename
> virtio_dev_pktmbuf_alloc to virtio_dev_pktmbuf_prep. This
> function now receives an already allocated mbuf pointer.
>
> Signed-off-by: Balazs Nemeth <bnemeth@redhat.com>
> ---
> lib/librte_vhost/virtio_net.c | 58 +++++++++++++++++++++++------------
> 1 file changed, 38 insertions(+), 20 deletions(-)
>
Reviewed-by: Maxime Coquelin <maxime.coquelin@redhat.com>
Thanks,
Maxime
On Fri, Apr 16, 2021 at 10:18 AM Balazs Nemeth <bnemeth@redhat.com> wrote:
>
> Move allocation out further and perform all allocation in bulk. The same
> goes for freeing packets. In the process, also rename
> virtio_dev_pktmbuf_alloc to virtio_dev_pktmbuf_prep. This
> function now receives an already allocated mbuf pointer.
>
> Signed-off-by: Balazs Nemeth <bnemeth@redhat.com>
The title should indicate we are only touching the tx packed path.
What about tx split?
If it is too complex to rework, this can wait.
> ---
> lib/librte_vhost/virtio_net.c | 58 +++++++++++++++++++++++------------
> 1 file changed, 38 insertions(+), 20 deletions(-)
>
> diff --git a/lib/librte_vhost/virtio_net.c b/lib/librte_vhost/virtio_net.c
> index ff39878609..d6d5636e0f 100644
> --- a/lib/librte_vhost/virtio_net.c
> +++ b/lib/librte_vhost/virtio_net.c
> @@ -2168,6 +2168,24 @@ virtio_dev_pktmbuf_alloc(struct virtio_net *dev, struct rte_mempool *mp,
> return NULL;
> }
>
> +static __rte_always_inline int
> +virtio_dev_pktmbuf_prep(struct virtio_net *dev, struct rte_mbuf *pkt,
> + uint32_t data_len)
> +{
> + if (rte_pktmbuf_tailroom(pkt) >= data_len)
> + return 0;
> +
> + /* attach an external buffer if supported */
> + if (dev->extbuf && !virtio_dev_extbuf_alloc(pkt, data_len))
> + return 0;
> +
> + /* check if chained buffers are allowed */
> + if (!dev->linearbuf)
> + return 0;
> +
> + return -1;
> +}
> +
If virtio_dev_pktmbuf_alloc() uses this new helper, we avoid
duplicating the logic.
> static __rte_noinline uint16_t
> virtio_dev_tx_split(struct virtio_net *dev, struct vhost_virtqueue *vq,
> struct rte_mempool *mbuf_pool, struct rte_mbuf **pkts, uint16_t count)
[snip]
> @@ -2429,7 +2440,7 @@ static __rte_always_inline int
> virtio_dev_tx_single_packed(struct virtio_net *dev,
> struct vhost_virtqueue *vq,
> struct rte_mempool *mbuf_pool,
> - struct rte_mbuf **pkts)
> + struct rte_mbuf *pkts)
> {
>
> uint16_t buf_id, desc_count = 0;
> @@ -2462,26 +2473,33 @@ virtio_dev_tx_packed(struct virtio_net *dev,
> uint32_t pkt_idx = 0;
> uint32_t remained = count;
>
> + if (rte_pktmbuf_alloc_bulk(mbuf_pool, pkts, count))
> + return 0;
> +
> do {
> rte_prefetch0(&vq->desc_packed[vq->last_avail_idx]);
>
> if (remained >= PACKED_BATCH_SIZE) {
> - if (!virtio_dev_tx_batch_packed(dev, vq, mbuf_pool,
> + if (!virtio_dev_tx_batch_packed(dev, vq,
> &pkts[pkt_idx])) {
> pkt_idx += PACKED_BATCH_SIZE;
> remained -= PACKED_BATCH_SIZE;
> +
No need for the extra line.
> continue;
> }
> }
>
> if (virtio_dev_tx_single_packed(dev, vq, mbuf_pool,
> - &pkts[pkt_idx]))
> + pkts[pkt_idx]))
> break;
> pkt_idx++;
> remained--;
>
> } while (remained);
>
> + if (pkt_idx != count)
> + rte_pktmbuf_free_bulk(&pkts[pkt_idx], count - pkt_idx);
> +
> if (vq->shadow_used_idx) {
> do_data_copy_dequeue(vq);
>
With those comments addressed,
Reviewed-by: David Marchand <david.marchand@redhat.com>
Thanks Balazs!
Hi David,
I was also thinking about using the same idea for tx split so that
virtio_dev_pktmbuf_alloc can be removed completely. I don't have those
patches yet. However, I can make virtio_dev_pktmbuf_alloc use
virtio_dev_pktmbuf_prep for this patch that addresses the packed
version and submit other patches for tx split later. Would that work for
now?
Regards,
Balazs
On Fri, Apr 16, 2021 at 11:05 AM David Marchand <david.marchand@redhat.com>
wrote:
> On Fri, Apr 16, 2021 at 10:18 AM Balazs Nemeth <bnemeth@redhat.com> wrote:
> >
> > Move allocation out further and perform all allocation in bulk. The same
> > goes for freeing packets. In the process, also rename
> > virtio_dev_pktmbuf_alloc to virtio_dev_pktmbuf_prep. This
> > function now receives an already allocated mbuf pointer.
> >
> > Signed-off-by: Balazs Nemeth <bnemeth@redhat.com>
>
> The title should indicate we are only touching the tx packed path.
>
> What about tx split?
> If it is too complex to rework, this can wait.
>
>
> > ---
> > lib/librte_vhost/virtio_net.c | 58 +++++++++++++++++++++++------------
> > 1 file changed, 38 insertions(+), 20 deletions(-)
> >
> > diff --git a/lib/librte_vhost/virtio_net.c
> b/lib/librte_vhost/virtio_net.c
> > index ff39878609..d6d5636e0f 100644
> > --- a/lib/librte_vhost/virtio_net.c
> > +++ b/lib/librte_vhost/virtio_net.c
> > @@ -2168,6 +2168,24 @@ virtio_dev_pktmbuf_alloc(struct virtio_net *dev,
> struct rte_mempool *mp,
> > return NULL;
> > }
> >
> > +static __rte_always_inline int
> > +virtio_dev_pktmbuf_prep(struct virtio_net *dev, struct rte_mbuf *pkt,
> > + uint32_t data_len)
> > +{
> > + if (rte_pktmbuf_tailroom(pkt) >= data_len)
> > + return 0;
> > +
> > + /* attach an external buffer if supported */
> > + if (dev->extbuf && !virtio_dev_extbuf_alloc(pkt, data_len))
> > + return 0;
> > +
> > + /* check if chained buffers are allowed */
> > + if (!dev->linearbuf)
> > + return 0;
> > +
> > + return -1;
> > +}
> > +
>
> If virtio_dev_pktmbuf_alloc() uses this new helper, we avoid
> duplicating the logic.
>
>
> > static __rte_noinline uint16_t
> > virtio_dev_tx_split(struct virtio_net *dev, struct vhost_virtqueue *vq,
> > struct rte_mempool *mbuf_pool, struct rte_mbuf **pkts, uint16_t
> count)
>
> [snip]
>
> > @@ -2429,7 +2440,7 @@ static __rte_always_inline int
> > virtio_dev_tx_single_packed(struct virtio_net *dev,
> > struct vhost_virtqueue *vq,
> > struct rte_mempool *mbuf_pool,
> > - struct rte_mbuf **pkts)
> > + struct rte_mbuf *pkts)
> > {
> >
> > uint16_t buf_id, desc_count = 0;
> > @@ -2462,26 +2473,33 @@ virtio_dev_tx_packed(struct virtio_net *dev,
> > uint32_t pkt_idx = 0;
> > uint32_t remained = count;
> >
> > + if (rte_pktmbuf_alloc_bulk(mbuf_pool, pkts, count))
> > + return 0;
> > +
> > do {
> > rte_prefetch0(&vq->desc_packed[vq->last_avail_idx]);
> >
> > if (remained >= PACKED_BATCH_SIZE) {
> > - if (!virtio_dev_tx_batch_packed(dev, vq,
> mbuf_pool,
> > + if (!virtio_dev_tx_batch_packed(dev, vq,
> > &pkts[pkt_idx]))
> {
> > pkt_idx += PACKED_BATCH_SIZE;
> > remained -= PACKED_BATCH_SIZE;
> > +
>
> No need for the extra line.
>
>
> > continue;
> > }
> > }
> >
> > if (virtio_dev_tx_single_packed(dev, vq, mbuf_pool,
> > - &pkts[pkt_idx]))
> > + pkts[pkt_idx]))
> > break;
> > pkt_idx++;
> > remained--;
> >
> > } while (remained);
> >
> > + if (pkt_idx != count)
> > + rte_pktmbuf_free_bulk(&pkts[pkt_idx], count - pkt_idx);
> > +
> > if (vq->shadow_used_idx) {
> > do_data_copy_dequeue(vq);
> >
>
> With those comments addressed,
> Reviewed-by: David Marchand <david.marchand@redhat.com>
>
> Thanks Balazs!
>
>
> --
> David Marchand
>
>
Hi Balazs,
On 4/16/21 11:12 AM, Balazs Nemeth wrote:
> Hi David,
>
> I was also thinking about using the same idea for tx split so that
> virtio_dev_pktmbuf_alloc can be removed completely. I don't have those
> patches yet. However, I can make virtio_dev_pktmbuf_alloc use
> virtio_dev_pktmbuf_prep for this patch that addresses the packed
> version and submit other patches for tx split later. Would that work for
> now?
I think so.
That would be great to have the same for split ring, but more rework may
be necessary than for packed ring. So I'm fine if the split ring part is
done after this release.
Thanks,
Maxime
> Regards,
> Balazs
>
> On Fri, Apr 16, 2021 at 11:05 AM David Marchand
> <david.marchand@redhat.com <mailto:david.marchand@redhat.com>> wrote:
>
> On Fri, Apr 16, 2021 at 10:18 AM Balazs Nemeth <bnemeth@redhat.com
> <mailto:bnemeth@redhat.com>> wrote:
> >
> > Move allocation out further and perform all allocation in bulk.
> The same
> > goes for freeing packets. In the process, also rename
> > virtio_dev_pktmbuf_alloc to virtio_dev_pktmbuf_prep. This
> > function now receives an already allocated mbuf pointer.
> >
> > Signed-off-by: Balazs Nemeth <bnemeth@redhat.com
> <mailto:bnemeth@redhat.com>>
>
> The title should indicate we are only touching the tx packed path.
>
> What about tx split?
> If it is too complex to rework, this can wait.
>
>
> > ---
> > lib/librte_vhost/virtio_net.c | 58
> +++++++++++++++++++++++------------
> > 1 file changed, 38 insertions(+), 20 deletions(-)
> >
> > diff --git a/lib/librte_vhost/virtio_net.c
> b/lib/librte_vhost/virtio_net.c
> > index ff39878609..d6d5636e0f 100644
> > --- a/lib/librte_vhost/virtio_net.c
> > +++ b/lib/librte_vhost/virtio_net.c
> > @@ -2168,6 +2168,24 @@ virtio_dev_pktmbuf_alloc(struct virtio_net
> *dev, struct rte_mempool *mp,
> > return NULL;
> > }
> >
> > +static __rte_always_inline int
> > +virtio_dev_pktmbuf_prep(struct virtio_net *dev, struct rte_mbuf *pkt,
> > + uint32_t data_len)
> > +{
> > + if (rte_pktmbuf_tailroom(pkt) >= data_len)
> > + return 0;
> > +
> > + /* attach an external buffer if supported */
> > + if (dev->extbuf && !virtio_dev_extbuf_alloc(pkt, data_len))
> > + return 0;
> > +
> > + /* check if chained buffers are allowed */
> > + if (!dev->linearbuf)
> > + return 0;
> > +
> > + return -1;
> > +}
> > +
>
> If virtio_dev_pktmbuf_alloc() uses this new helper, we avoid
> duplicating the logic.
>
>
> > static __rte_noinline uint16_t
> > virtio_dev_tx_split(struct virtio_net *dev, struct
> vhost_virtqueue *vq,
> > struct rte_mempool *mbuf_pool, struct rte_mbuf **pkts,
> uint16_t count)
>
> [snip]
>
> > @@ -2429,7 +2440,7 @@ static __rte_always_inline int
> > virtio_dev_tx_single_packed(struct virtio_net *dev,
> > struct vhost_virtqueue *vq,
> > struct rte_mempool *mbuf_pool,
> > - struct rte_mbuf **pkts)
> > + struct rte_mbuf *pkts)
> > {
> >
> > uint16_t buf_id, desc_count = 0;
> > @@ -2462,26 +2473,33 @@ virtio_dev_tx_packed(struct virtio_net *dev,
> > uint32_t pkt_idx = 0;
> > uint32_t remained = count;
> >
> > + if (rte_pktmbuf_alloc_bulk(mbuf_pool, pkts, count))
> > + return 0;
> > +
> > do {
> > rte_prefetch0(&vq->desc_packed[vq->last_avail_idx]);
> >
> > if (remained >= PACKED_BATCH_SIZE) {
> > - if (!virtio_dev_tx_batch_packed(dev, vq,
> mbuf_pool,
> > + if (!virtio_dev_tx_batch_packed(dev, vq,
> >
> &pkts[pkt_idx])) {
> > pkt_idx += PACKED_BATCH_SIZE;
> > remained -= PACKED_BATCH_SIZE;
> > +
>
> No need for the extra line.
>
>
> > continue;
> > }
> > }
> >
> > if (virtio_dev_tx_single_packed(dev, vq, mbuf_pool,
> > - &pkts[pkt_idx]))
> > + pkts[pkt_idx]))
> > break;
> > pkt_idx++;
> > remained--;
> >
> > } while (remained);
> >
> > + if (pkt_idx != count)
> > + rte_pktmbuf_free_bulk(&pkts[pkt_idx], count -
> pkt_idx);
> > +
> > if (vq->shadow_used_idx) {
> > do_data_copy_dequeue(vq);
> >
>
> With those comments addressed,
> Reviewed-by: David Marchand <david.marchand@redhat.com
> <mailto:david.marchand@redhat.com>>
>
> Thanks Balazs!
>
>
> --
> David Marchand
>
On Fri, Apr 16, 2021 at 11:12 AM Balazs Nemeth <bnemeth@redhat.com> wrote:
> I was also thinking about using the same idea for tx split so that virtio_dev_pktmbuf_alloc can be removed completely. I don't have those patches yet. However, I can make virtio_dev_pktmbuf_alloc use virtio_dev_pktmbuf_prep for this patch that addresses the packed version and submit other patches for tx split later. Would that work for now?
Ok for me.
And revisit the tx split part in 21.08 :-).
@@ -2168,6 +2168,24 @@ virtio_dev_pktmbuf_alloc(struct virtio_net *dev, struct rte_mempool *mp,
return NULL;
}
+static __rte_always_inline int
+virtio_dev_pktmbuf_prep(struct virtio_net *dev, struct rte_mbuf *pkt,
+ uint32_t data_len)
+{
+ if (rte_pktmbuf_tailroom(pkt) >= data_len)
+ return 0;
+
+ /* attach an external buffer if supported */
+ if (dev->extbuf && !virtio_dev_extbuf_alloc(pkt, data_len))
+ return 0;
+
+ /* check if chained buffers are allowed */
+ if (!dev->linearbuf)
+ return 0;
+
+ return -1;
+}
+
static __rte_noinline uint16_t
virtio_dev_tx_split(struct virtio_net *dev, struct vhost_virtqueue *vq,
struct rte_mempool *mbuf_pool, struct rte_mbuf **pkts, uint16_t count)
@@ -2261,7 +2279,6 @@ virtio_dev_tx_split(struct virtio_net *dev, struct vhost_virtqueue *vq,
static __rte_always_inline int
vhost_reserve_avail_batch_packed(struct virtio_net *dev,
struct vhost_virtqueue *vq,
- struct rte_mempool *mbuf_pool,
struct rte_mbuf **pkts,
uint16_t avail_idx,
uintptr_t *desc_addrs,
@@ -2306,9 +2323,8 @@ vhost_reserve_avail_batch_packed(struct virtio_net *dev,
}
vhost_for_each_try_unroll(i, 0, PACKED_BATCH_SIZE) {
- pkts[i] = virtio_dev_pktmbuf_alloc(dev, mbuf_pool, lens[i]);
- if (!pkts[i])
- goto free_buf;
+ if (virtio_dev_pktmbuf_prep(dev, pkts[i], lens[i]))
+ goto err;
}
vhost_for_each_try_unroll(i, 0, PACKED_BATCH_SIZE)
@@ -2316,7 +2332,7 @@ vhost_reserve_avail_batch_packed(struct virtio_net *dev,
vhost_for_each_try_unroll(i, 0, PACKED_BATCH_SIZE) {
if (unlikely(buf_lens[i] < (lens[i] - buf_offset)))
- goto free_buf;
+ goto err;
}
vhost_for_each_try_unroll(i, 0, PACKED_BATCH_SIZE) {
@@ -2327,17 +2343,13 @@ vhost_reserve_avail_batch_packed(struct virtio_net *dev,
return 0;
-free_buf:
- for (i = 0; i < PACKED_BATCH_SIZE; i++)
- rte_pktmbuf_free(pkts[i]);
-
+err:
return -1;
}
static __rte_always_inline int
virtio_dev_tx_batch_packed(struct virtio_net *dev,
struct vhost_virtqueue *vq,
- struct rte_mempool *mbuf_pool,
struct rte_mbuf **pkts)
{
uint16_t avail_idx = vq->last_avail_idx;
@@ -2347,8 +2359,8 @@ virtio_dev_tx_batch_packed(struct virtio_net *dev,
uint16_t ids[PACKED_BATCH_SIZE];
uint16_t i;
- if (vhost_reserve_avail_batch_packed(dev, vq, mbuf_pool, pkts,
- avail_idx, desc_addrs, ids))
+ if (vhost_reserve_avail_batch_packed(dev, vq, pkts, avail_idx,
+ desc_addrs, ids))
return -1;
vhost_for_each_try_unroll(i, 0, PACKED_BATCH_SIZE)
@@ -2381,7 +2393,7 @@ static __rte_always_inline int
vhost_dequeue_single_packed(struct virtio_net *dev,
struct vhost_virtqueue *vq,
struct rte_mempool *mbuf_pool,
- struct rte_mbuf **pkts,
+ struct rte_mbuf *pkts,
uint16_t *buf_id,
uint16_t *desc_count)
{
@@ -2398,8 +2410,8 @@ vhost_dequeue_single_packed(struct virtio_net *dev,
VHOST_ACCESS_RO) < 0))
return -1;
- *pkts = virtio_dev_pktmbuf_alloc(dev, mbuf_pool, buf_len);
- if (unlikely(*pkts == NULL)) {
+
+ if (unlikely(virtio_dev_pktmbuf_prep(dev, pkts, buf_len))) {
if (!allocerr_warned) {
VHOST_LOG_DATA(ERR,
"Failed mbuf alloc of size %d from %s on %s.\n",
@@ -2409,7 +2421,7 @@ vhost_dequeue_single_packed(struct virtio_net *dev,
return -1;
}
- err = copy_desc_to_mbuf(dev, vq, buf_vec, nr_vec, *pkts,
+ err = copy_desc_to_mbuf(dev, vq, buf_vec, nr_vec, pkts,
mbuf_pool);
if (unlikely(err)) {
if (!allocerr_warned) {
@@ -2418,7 +2430,6 @@ vhost_dequeue_single_packed(struct virtio_net *dev,
dev->ifname);
allocerr_warned = true;
}
- rte_pktmbuf_free(*pkts);
return -1;
}
@@ -2429,7 +2440,7 @@ static __rte_always_inline int
virtio_dev_tx_single_packed(struct virtio_net *dev,
struct vhost_virtqueue *vq,
struct rte_mempool *mbuf_pool,
- struct rte_mbuf **pkts)
+ struct rte_mbuf *pkts)
{
uint16_t buf_id, desc_count = 0;
@@ -2462,26 +2473,33 @@ virtio_dev_tx_packed(struct virtio_net *dev,
uint32_t pkt_idx = 0;
uint32_t remained = count;
+ if (rte_pktmbuf_alloc_bulk(mbuf_pool, pkts, count))
+ return 0;
+
do {
rte_prefetch0(&vq->desc_packed[vq->last_avail_idx]);
if (remained >= PACKED_BATCH_SIZE) {
- if (!virtio_dev_tx_batch_packed(dev, vq, mbuf_pool,
+ if (!virtio_dev_tx_batch_packed(dev, vq,
&pkts[pkt_idx])) {
pkt_idx += PACKED_BATCH_SIZE;
remained -= PACKED_BATCH_SIZE;
+
continue;
}
}
if (virtio_dev_tx_single_packed(dev, vq, mbuf_pool,
- &pkts[pkt_idx]))
+ pkts[pkt_idx]))
break;
pkt_idx++;
remained--;
} while (remained);
+ if (pkt_idx != count)
+ rte_pktmbuf_free_bulk(&pkts[pkt_idx], count - pkt_idx);
+
if (vq->shadow_used_idx) {
do_data_copy_dequeue(vq);