From: David Gibson <david@gibson.dropbear.id.au>
To: Laurent Vivier <lvivier@redhat.com>
Cc: passt-dev@passt.top
Subject: Re: [PATCH v8 25/30] icmp: use iov_tail rather than pool
Date: Wed, 6 Aug 2025 16:29:46 +1000 [thread overview]
Message-ID: <aJL2WvCFX2bJdFpp@zatzit> (raw)
In-Reply-To: <20250805154628.301343-26-lvivier@redhat.com>
[-- Attachment #1: Type: text/plain, Size: 6712 bytes --]
On Tue, Aug 05, 2025 at 05:46:23PM +0200, Laurent Vivier wrote:
> As the iov_tail has a non-zero offset (because of the presence of
> packet headers in the iov array), we must copy it to a new
> iov array (using iov_tail_clone()) to pass it to sendmsg().
>
> We can no longer use iov_tail_msghdr(), so remove it.
Right, as I mentioned on that patch, it was always kind of a footgun.
Was this the only user? If so, maybe just open-code it earlier in the
series rather than introducing and then removing the helper.
>
> Signed-off-by: Laurent Vivier <lvivier@redhat.com>
Reviewed-by: David Gibson <david@gibson.dropbear.id.au>
> ---
> icmp.c | 30 +++++++++++++++++++-----------
> icmp.h | 2 +-
> iov.c | 23 -----------------------
> iov.h | 2 --
> tap.c | 7 ++-----
> 5 files changed, 22 insertions(+), 42 deletions(-)
>
> diff --git a/icmp.c b/icmp.c
> index 71c496540310..be800e30c369 100644
> --- a/icmp.c
> +++ b/icmp.c
> @@ -44,6 +44,7 @@
>
> #define ICMP_ECHO_TIMEOUT 60 /* s, timeout for ICMP socket activity */
> #define ICMP_NUM_IDS (1U << 16)
> +#define MAX_IOV_ICMP 16 /* Arbitrary, should be enough */
>
> /**
> * ping_at_sidx() - Get ping specific flow at given sidx
> @@ -229,36 +230,33 @@ cancel:
> * @af: Address family, AF_INET or AF_INET6
> * @saddr: Source address
> * @daddr: Destination address
> - * @p: Packet pool, single packet with ICMP/ICMPv6 header
> + * @data: Single packet with ICMP/ICMPv6 header
> * @now: Current timestamp
> *
> * Return: count of consumed packets (always 1, even if malformed)
> */
> int icmp_tap_handler(const struct ctx *c, uint8_t pif, sa_family_t af,
> const void *saddr, const void *daddr,
> - const struct pool *p, const struct timespec *now)
> + struct iov_tail *data, const struct timespec *now)
> {
> + struct iovec iov[MAX_IOV_ICMP];
> struct icmp_ping_flow *pingf;
> const struct flowside *tgt;
> union sockaddr_inany sa;
> - struct iov_tail data;
> struct msghdr msh;
> uint16_t id, seq;
> union flow *flow;
> uint8_t proto;
> - socklen_t sl;
> + int cnt;
>
> (void)saddr;
> ASSERT(pif == PIF_TAP);
>
> - if (!packet_get(p, 0, &data))
> - return -1;
> -
> if (af == AF_INET) {
> struct icmphdr ih_storage;
> const struct icmphdr *ih;
>
> - ih = IOV_PEEK_HEADER(&data, ih_storage);
> + ih = IOV_PEEK_HEADER(data, ih_storage);
> if (!ih)
> return 1;
>
> @@ -272,7 +270,7 @@ int icmp_tap_handler(const struct ctx *c, uint8_t pif, sa_family_t af,
> struct icmp6hdr ih_storage;
> const struct icmp6hdr *ih;
>
> - ih = IOV_PEEK_HEADER(&data, ih_storage);
> + ih = IOV_PEEK_HEADER(data, ih_storage);
> if (!ih)
> return 1;
>
> @@ -286,6 +284,10 @@ int icmp_tap_handler(const struct ctx *c, uint8_t pif, sa_family_t af,
> ASSERT(0);
> }
>
> + cnt = iov_tail_clone(&iov[0], MAX_IOV_ICMP, data);
> + if (cnt < 0)
> + return 1;
> +
> flow = flow_at_sidx(flow_lookup_af(c, proto, PIF_TAP,
> af, saddr, daddr, id, id));
>
> @@ -300,8 +302,14 @@ int icmp_tap_handler(const struct ctx *c, uint8_t pif, sa_family_t af,
> pingf->ts = now->tv_sec;
>
>
> - pif_sockaddr(c, &sa, &sl, PIF_HOST, &tgt->eaddr, 0);
> - iov_tail_msghdr(&msh, &data, &sa, sl);
> + pif_sockaddr(c, &sa, &msh.msg_namelen, PIF_HOST, &tgt->eaddr, 0);
> + msh.msg_name = &sa;
> + msh.msg_iov = iov;
> + msh.msg_iovlen = cnt;
> + msh.msg_control = NULL;
> + msh.msg_controllen = 0;
> + msh.msg_flags = 0;
> +
> if (sendmsg(pingf->sock, &msh, MSG_NOSIGNAL) < 0) {
> flow_dbg_perror(pingf, "failed to relay request to socket");
> } else {
> diff --git a/icmp.h b/icmp.h
> index 5ce22b5eca1f..d1cecb20e29d 100644
> --- a/icmp.h
> +++ b/icmp.h
> @@ -14,7 +14,7 @@ struct icmp_ping_flow;
> void icmp_sock_handler(const struct ctx *c, union epoll_ref ref);
> int icmp_tap_handler(const struct ctx *c, uint8_t pif, sa_family_t af,
> const void *saddr, const void *daddr,
> - const struct pool *p, const struct timespec *now);
> + struct iov_tail *data, const struct timespec *now);
> void icmp_init(void);
>
> /**
> diff --git a/iov.c b/iov.c
> index d17d4dd3da09..1d734acdfea6 100644
> --- a/iov.c
> +++ b/iov.c
> @@ -157,29 +157,6 @@ size_t iov_size(const struct iovec *iov, size_t iov_cnt)
> return len;
> }
>
> -/**
> - * iov_tail_msghdr - Initialize a msghdr from an IOV tail structure
> - * @msh: msghdr to initialize
> - * @tail: iov_tail to use to set msg_iov and msg_iovlen
> - * @msg_name: Pointer to set to msg_name
> - * @msg_namelen: Size of @msg_name
> - */
> -void iov_tail_msghdr(struct msghdr *msh, struct iov_tail *tail,
> - void *msg_name, socklen_t msg_namelen)
> -{
> - iov_tail_prune(tail);
> -
> - ASSERT(tail->off == 0);
> -
> - msh->msg_name = msg_name;
> - msh->msg_namelen = msg_namelen;
> - msh->msg_iov = (struct iovec *)tail->iov;
> - msh->msg_iovlen = tail->cnt;
> - msh->msg_control = NULL;
> - msh->msg_controllen = 0;
> - msh->msg_flags = 0;
> -}
> -
> /**
> * iov_tail_prune() - Remove any unneeded buffers from an IOV tail
> * @tail: IO vector tail (modified)
> diff --git a/iov.h b/iov.h
> index 75c3b07a87e3..ccdb690ef3f1 100644
> --- a/iov.h
> +++ b/iov.h
> @@ -82,8 +82,6 @@ struct iov_tail {
> 1, \
> (off_))
>
> -void iov_tail_msghdr(struct msghdr *msh, struct iov_tail *tail,
> - void *msg_name, socklen_t msg_namelen);
> bool iov_tail_prune(struct iov_tail *tail);
> size_t iov_tail_size(struct iov_tail *tail);
> bool iov_tail_drop(struct iov_tail *tail, size_t len);
> diff --git a/tap.c b/tap.c
> index 3262b44c4287..48152a84674c 100644
> --- a/tap.c
> +++ b/tap.c
> @@ -764,17 +764,14 @@ resume:
> continue;
>
> if (iph->protocol == IPPROTO_ICMP) {
> - PACKET_POOL_P(pkt, 1, in->buf, in->buf_size);
> -
> if (c->no_icmp)
> continue;
>
> tap_packet_debug(iph, NULL, NULL, 0, NULL, 1);
>
> - packet_add(pkt, &data);
> icmp_tap_handler(c, PIF_TAP, AF_INET,
> &iph->saddr, &iph->daddr,
> - pkt, now);
> + &data, now);
> continue;
> }
>
> @@ -964,7 +961,7 @@ resume:
> tap_packet_debug(NULL, ip6h, NULL, proto, NULL, 1);
>
> icmp_tap_handler(c, PIF_TAP, AF_INET6,
> - saddr, daddr, pkt, now);
> + saddr, daddr, &data, now);
> continue;
> }
>
--
David Gibson (he or they) | I'll have my music baroque, and my code
david AT gibson.dropbear.id.au | minimalist, thank you, not the other way
| around.
http://www.ozlabs.org/~dgibson
[-- Attachment #2: signature.asc --]
[-- Type: application/pgp-signature, Size: 833 bytes --]
next prev parent reply other threads:[~2025-08-06 6:35 UTC|newest]
Thread overview: 66+ messages / expand[flat|nested] mbox.gz Atom feed top
2025-08-05 15:45 [PATCH v8 00/30] Introduce discontiguous frames management Laurent Vivier
2025-08-05 15:45 ` [PATCH v8 01/30] arp: Don't mix incoming and outgoing buffers Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 02/30] iov: Introduce iov_tail_clone() and iov_tail_drop() Laurent Vivier
2025-08-06 1:32 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 03/30] iov: Update IOV_REMOVE_HEADER() and IOV_PEEK_HEADER() Laurent Vivier
2025-08-06 1:45 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 04/30] tap: Use iov_tail with tap_add_packet() Laurent Vivier
2025-08-06 1:56 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 05/30] packet: Use iov_tail with packet_add() Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 06/30] packet: Add packet_data() Laurent Vivier
2025-08-06 2:14 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 07/30] arp: Convert to iov_tail Laurent Vivier
2025-08-06 2:17 ` David Gibson
2025-08-07 12:58 ` Laurent Vivier
2025-08-07 13:11 ` Stefano Brivio
2025-08-13 2:21 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 08/30] ndp: " Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 09/30] icmp: " Laurent Vivier
2025-08-06 2:20 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 10/30] udp: " Laurent Vivier
2025-08-06 2:23 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 11/30] tcp: Convert tcp_tap_handler() to use iov_tail Laurent Vivier
2025-08-06 2:35 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 12/30] tcp: Convert tcp_data_from_tap() " Laurent Vivier
2025-08-06 2:37 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 13/30] dhcpv6: move offset initialization out of dhcpv6_opt() Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 14/30] dhcpv6: Extract sending of NotOnLink status Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 15/30] dhcpv6: Convert to iov_tail Laurent Vivier
2025-08-05 15:46 ` [PATCH v8 16/30] dhcpv6: Use iov_tail in dhcpv6_opt() Laurent Vivier
2025-08-06 4:14 ` David Gibson
2025-08-08 13:59 ` Laurent Vivier
2025-08-13 2:29 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 17/30] dhcp: Convert to iov_tail Laurent Vivier
2025-08-06 4:38 ` David Gibson
2025-08-08 9:33 ` Laurent Vivier
2025-08-13 2:27 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 18/30] ip: Use iov_tail in ipv6_l4hdr() Laurent Vivier
2025-08-06 5:12 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 19/30] tap: Convert tap4_handler() to iov_tail Laurent Vivier
2025-08-06 5:17 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 20/30] tap: Convert tap6_handler() " Laurent Vivier
2025-08-06 6:21 ` David Gibson
2025-08-08 13:57 ` Laurent Vivier
2025-08-13 3:22 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 21/30] packet: rename packet_data() to packet_get() Laurent Vivier
2025-08-06 6:22 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 22/30] arp: use iov_tail rather than pool Laurent Vivier
2025-08-06 6:24 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 23/30] dhcp: " Laurent Vivier
2025-08-06 6:26 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 24/30] dhcpv6: " Laurent Vivier
2025-08-06 6:27 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 25/30] icmp: " Laurent Vivier
2025-08-06 6:29 ` David Gibson [this message]
2025-08-05 15:46 ` [PATCH v8 26/30] ndp: " Laurent Vivier
2025-08-06 6:31 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 27/30] packet: remove PACKET_POOL() and PACKET_POOL_P() Laurent Vivier
2025-08-06 6:32 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 28/30] packet: remove unused parameter from PACKET_POOL_DECL() Laurent Vivier
2025-08-06 6:33 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 29/30] packet: Refactor vhost-user memory region handling Laurent Vivier
2025-08-07 6:10 ` David Gibson
2025-08-07 9:05 ` Laurent Vivier
2025-08-07 11:44 ` David Gibson
2025-08-05 15:46 ` [PATCH v8 30/30] packet: Add support for multi-vector packets Laurent Vivier
2025-08-07 6:17 ` David Gibson
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=aJL2WvCFX2bJdFpp@zatzit \
--to=david@gibson.dropbear.id.au \
--cc=lvivier@redhat.com \
--cc=passt-dev@passt.top \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
Code repositories for project(s) associated with this public inbox
https://passt.top/passt
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for IMAP folder(s).