From: David Gibson <david@gibson.dropbear.id.au>
To: Laurent Vivier <lvivier@redhat.com>
Cc: passt-dev@passt.top
Subject: Re: [PATCH v8 04/30] tap: Use iov_tail with tap_add_packet()
Date: Wed, 6 Aug 2025 11:56:56 +1000 [thread overview]
Message-ID: <aJK2aGTa0R0rE5EZ@zatzit> (raw)
In-Reply-To: <20250805154628.301343-5-lvivier@redhat.com>
[-- Attachment #1: Type: text/plain, Size: 8105 bytes --]
On Tue, Aug 05, 2025 at 05:46:02PM +0200, Laurent Vivier wrote:
> Use IOV_PEEK_HEADER() to get the ethernet header from the iovec.
>
> Move the workaround about multiple iovec array from vu_handle_tx() to
> tap_add_packet(). Removing the offset out of the iovec array should
> reduce the iovec count to 1.
>
> Signed-off-by: Laurent Vivier <lvivier@redhat.com>
> Reviewed-by: David Gibson <david@gibson.dropbear.id.au>
> ---
> iov.c | 1 -
> pcap.c | 1 +
> tap.c | 30 +++++++++++++++++++++---------
> tap.h | 3 +--
> vu_common.c | 26 +++++---------------------
> 5 files changed, 28 insertions(+), 33 deletions(-)
>
> diff --git a/iov.c b/iov.c
> index d39bb099fa69..97e4ea733540 100644
> --- a/iov.c
> +++ b/iov.c
> @@ -200,7 +200,6 @@ size_t iov_tail_size(struct iov_tail *tail)
> *
> * Return: true if the item still contains any bytes, otherwise false
> */
> -/* cppcheck-suppress unusedFunction */
> bool iov_tail_drop(struct iov_tail *tail, size_t len)
> {
> tail->off = tail->off + len;
> diff --git a/pcap.c b/pcap.c
> index 46d11a2a6daa..03adc4c55f4b 100644
> --- a/pcap.c
> +++ b/pcap.c
> @@ -74,6 +74,7 @@ static void pcap_frame(const struct iovec *iov, size_t iovcnt,
> * @pkt: Pointer to data buffer, including L2 headers
> * @l2len: L2 frame length
> */
> +/* cppcheck-suppress unusedFunction */
Are we going to get any new users of this? Maybe we can just remove
it now.
> void pcap(const char *pkt, size_t l2len)
> {
> struct iovec iov = { (char *)pkt, l2len };
> diff --git a/tap.c b/tap.c
> index 6db5d88b1760..c5520bf3bc76 100644
> --- a/tap.c
> +++ b/tap.c
> @@ -1070,24 +1070,29 @@ void tap_handler(struct ctx *c, const struct timespec *now)
> /**
> * tap_add_packet() - Queue/capture packet, update notion of guest MAC address
> * @c: Execution context
> - * @l2len: Total L2 packet length
> - * @p: Packet buffer
> + * @data: Packet to add to the pool
> * @now: Current timestamp
> */
> -void tap_add_packet(struct ctx *c, ssize_t l2len, char *p,
> +void tap_add_packet(struct ctx *c, struct iov_tail *data,
> const struct timespec *now)
> {
> + struct ethhdr eh_storage;
> const struct ethhdr *eh;
>
> - pcap(p, l2len);
> + pcap_iov(data->iov, data->cnt, data->off);
>
> - eh = (struct ethhdr *)p;
> + eh = IOV_PEEK_HEADER(data, eh_storage);
> + if (!eh)
> + return;
>
> if (memcmp(c->guest_mac, eh->h_source, ETH_ALEN)) {
> memcpy(c->guest_mac, eh->h_source, ETH_ALEN);
> proto_update_l2_buf(c->guest_mac, NULL);
> }
>
> + iov_tail_prune(data);
> + ASSERT(data->cnt == 1); /* packet_add() doesn't support iovec */
So... IOV_PEEK_HEADER() will have already pruned the iov_tail, but I
think it would be a layering violation to assume that here.
I'm wondering if we should change the invariants for the iov_tail
structure and say that an iov_tail must *always* be pruned, outside of
the innards of the iov_tail handling. That would mean pruning in all
"constructors" of an iov_tail. It would also mean moving the prune to
the end of iov_tail_drop() instead of the beginning. It would have
the nice bonus that peek_header could take the iov_tail as a const *.
> switch (ntohs(eh->h_proto)) {
> case ETH_P_ARP:
> case ETH_P_IP:
> @@ -1095,14 +1100,16 @@ void tap_add_packet(struct ctx *c, ssize_t l2len, char *p,
> tap4_handler(c, pool_tap4, now);
> pool_flush(pool_tap4);
> }
> - packet_add(pool_tap4, l2len, p);
> + packet_add(pool_tap4, data->iov[0].iov_len - data->off,
> + (char *)data->iov[0].iov_base + data->off);
> break;
> case ETH_P_IPV6:
> if (pool_full(pool_tap6)) {
> tap6_handler(c, pool_tap6, now);
> pool_flush(pool_tap6);
> }
> - packet_add(pool_tap6, l2len, p);
> + packet_add(pool_tap6, data->iov[0].iov_len - data->off,
> + (char *)data->iov[0].iov_base + data->off);
> break;
> default:
> break;
> @@ -1168,6 +1175,7 @@ static void tap_passt_input(struct ctx *c, const struct timespec *now)
>
> while (n >= (ssize_t)sizeof(uint32_t)) {
> uint32_t l2len = ntohl_unaligned(p);
> + struct iov_tail data;
>
> if (l2len < sizeof(struct ethhdr) || l2len > L2_MAX_LEN_PASST) {
> err("Bad frame size from guest, resetting connection");
> @@ -1182,7 +1190,8 @@ static void tap_passt_input(struct ctx *c, const struct timespec *now)
> p += sizeof(uint32_t);
> n -= sizeof(uint32_t);
>
> - tap_add_packet(c, l2len, p, now);
> + data = IOV_TAIL_FROM_BUF(p, l2len, 0);
> + tap_add_packet(c, &data, now);
>
> p += l2len;
> n -= l2len;
> @@ -1226,6 +1235,8 @@ static void tap_pasta_input(struct ctx *c, const struct timespec *now)
> for (n = 0;
> n <= (ssize_t)(sizeof(pkt_buf) - L2_MAX_LEN_PASTA);
> n += len) {
> + struct iov_tail data;
> +
> len = read(c->fd_tap, pkt_buf + n, L2_MAX_LEN_PASTA);
>
> if (len == 0) {
> @@ -1247,7 +1258,8 @@ static void tap_pasta_input(struct ctx *c, const struct timespec *now)
> len > (ssize_t)L2_MAX_LEN_PASTA)
> continue;
>
> - tap_add_packet(c, len, pkt_buf + n, now);
> + data = IOV_TAIL_FROM_BUF(pkt_buf + n, len, 0);
> + tap_add_packet(c, &data, now);
> }
>
> tap_handler(c, now);
> diff --git a/tap.h b/tap.h
> index 936ae9371fd6..ce5510882d5d 100644
> --- a/tap.h
> +++ b/tap.h
> @@ -119,7 +119,6 @@ void tap_sock_update_pool(void *base, size_t size);
> void tap_backend_init(struct ctx *c);
> void tap_flush_pools(void);
> void tap_handler(struct ctx *c, const struct timespec *now);
> -void tap_add_packet(struct ctx *c, ssize_t l2len, char *p,
> +void tap_add_packet(struct ctx *c, struct iov_tail *data,
> const struct timespec *now);
> -
> #endif /* TAP_H */
> diff --git a/vu_common.c b/vu_common.c
> index 5e6fd4a8261f..b77b21420c57 100644
> --- a/vu_common.c
> +++ b/vu_common.c
> @@ -163,7 +163,6 @@ static void vu_handle_tx(struct vu_dev *vdev, int index,
> struct vu_virtq_element elem[VIRTQUEUE_MAX_SIZE];
> struct iovec out_sg[VIRTQUEUE_MAX_SIZE];
> struct vu_virtq *vq = &vdev->vq[index];
> - int hdrlen = sizeof(struct virtio_net_hdr_mrg_rxbuf);
> int out_sg_count;
> int count;
>
> @@ -176,6 +175,7 @@ static void vu_handle_tx(struct vu_dev *vdev, int index,
> while (count < VIRTQUEUE_MAX_SIZE &&
> out_sg_count + VU_MAX_TX_BUFFER_NB <= VIRTQUEUE_MAX_SIZE) {
> int ret;
> + struct iov_tail data;
>
> elem[count].out_num = VU_MAX_TX_BUFFER_NB;
> elem[count].out_sg = &out_sg[out_sg_count];
> @@ -191,26 +191,10 @@ static void vu_handle_tx(struct vu_dev *vdev, int index,
> warn("virtio-net transmit queue contains no out buffers");
> break;
> }
> - if (elem[count].out_num == 1) {
> - tap_add_packet(vdev->context,
> - elem[count].out_sg[0].iov_len - hdrlen,
> - (char *)elem[count].out_sg[0].iov_base +
> - hdrlen, now);
> - } else {
> - /* vnet header can be in a separate iovec */
> - if (elem[count].out_num != 2) {
> - debug("virtio-net transmit queue contains more than one buffer ([%d]: %u)",
> - count, elem[count].out_num);
> - } else if (elem[count].out_sg[0].iov_len != (size_t)hdrlen) {
> - debug("virtio-net transmit queue entry not aligned on hdrlen ([%d]: %d != %zu)",
> - count, hdrlen, elem[count].out_sg[0].iov_len);
> - } else {
> - tap_add_packet(vdev->context,
> - elem[count].out_sg[1].iov_len,
> - (char *)elem[count].out_sg[1].iov_base,
> - now);
> - }
> - }
> +
> + data = IOV_TAIL(elem[count].out_sg, elem[count].out_num, 0);
> + if (IOV_DROP_HEADER(&data, struct virtio_net_hdr_mrg_rxbuf))
> + tap_add_packet(vdev->context, &data, now);
Nice simplification here.
>
> count++;
> }
--
David Gibson (he or they) | I'll have my music baroque, and my code
david AT gibson.dropbear.id.au | minimalist, thank you, not the other way
| around.
http://www.ozlabs.org/~dgibson
[-- Attachment #2: signature.asc --]
[-- Type: application/pgp-signature, Size: 833 bytes --]
next prev parent reply other threads:[~2025-08-06 1:58 UTC|newest]
Thread overview: 66+ messages / expand[flat|nested] mbox.gz Atom feed top
2025-08-05 15:45 [PATCH v8 00/30] Introduce discontiguous frames management Laurent Vivier
2025-08-05 15:45 ` [PATCH v8 01/30] arp: Don't mix incoming and outgoing buffers Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 02/30] iov: Introduce iov_tail_clone() and iov_tail_drop() Laurent Vivier
2025-08-06 1:32 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 03/30] iov: Update IOV_REMOVE_HEADER() and IOV_PEEK_HEADER() Laurent Vivier
2025-08-06 1:45 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 04/30] tap: Use iov_tail with tap_add_packet() Laurent Vivier
2025-08-06 1:56 ` David Gibson [this message]
2025-08-05 15:46 ` [PATCH v8 05/30] packet: Use iov_tail with packet_add() Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 06/30] packet: Add packet_data() Laurent Vivier
2025-08-06 2:14 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 07/30] arp: Convert to iov_tail Laurent Vivier
2025-08-06 2:17 ` David Gibson
2025-08-07 12:58 ` Laurent Vivier
2025-08-07 13:11 ` Stefano Brivio
2025-08-13 2:21 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 08/30] ndp: " Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 09/30] icmp: " Laurent Vivier
2025-08-06 2:20 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 10/30] udp: " Laurent Vivier
2025-08-06 2:23 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 11/30] tcp: Convert tcp_tap_handler() to use iov_tail Laurent Vivier
2025-08-06 2:35 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 12/30] tcp: Convert tcp_data_from_tap() " Laurent Vivier
2025-08-06 2:37 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 13/30] dhcpv6: move offset initialization out of dhcpv6_opt() Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 14/30] dhcpv6: Extract sending of NotOnLink status Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 15/30] dhcpv6: Convert to iov_tail Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 16/30] dhcpv6: Use iov_tail in dhcpv6_opt() Laurent Vivier
2025-08-06 4:14 ` David Gibson
2025-08-08 13:59 ` Laurent Vivier
2025-08-13 2:29 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 17/30] dhcp: Convert to iov_tail Laurent Vivier
2025-08-06 4:38 ` David Gibson
2025-08-08 9:33 ` Laurent Vivier
2025-08-13 2:27 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 18/30] ip: Use iov_tail in ipv6_l4hdr() Laurent Vivier
2025-08-06 5:12 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 19/30] tap: Convert tap4_handler() to iov_tail Laurent Vivier
2025-08-06 5:17 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 20/30] tap: Convert tap6_handler() " Laurent Vivier
2025-08-06 6:21 ` David Gibson
2025-08-08 13:57 ` Laurent Vivier
2025-08-13 3:22 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 21/30] packet: rename packet_data() to packet_get() Laurent Vivier
2025-08-06 6:22 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 22/30] arp: use iov_tail rather than pool Laurent Vivier
2025-08-06 6:24 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 23/30] dhcp: " Laurent Vivier
2025-08-06 6:26 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 24/30] dhcpv6: " Laurent Vivier
2025-08-06 6:27 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 25/30] icmp: " Laurent Vivier
2025-08-06 6:29 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 26/30] ndp: " Laurent Vivier
2025-08-06 6:31 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 27/30] packet: remove PACKET_POOL() and PACKET_POOL_P() Laurent Vivier
2025-08-06 6:32 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 28/30] packet: remove unused parameter from PACKET_POOL_DECL() Laurent Vivier
2025-08-06 6:33 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 29/30] packet: Refactor vhost-user memory region handling Laurent Vivier
2025-08-07 6:10 ` David Gibson
2025-08-07 9:05 ` Laurent Vivier
2025-08-07 11:44 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 30/30] packet: Add support for multi-vector packets Laurent Vivier
2025-08-07 6:17 ` David Gibson
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=aJK2aGTa0R0rE5EZ@zatzit \
--to=david@gibson.dropbear.id.au \
--cc=lvivier@redhat.com \
--cc=passt-dev@passt.top \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
Code repositories for project(s) associated with this public inbox
https://passt.top/passt
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for IMAP folder(s).