From: David Gibson <david@gibson.dropbear.id.au>
To: Stefano Brivio <sbrivio@redhat.com>, passt-dev@passt.top
Subject: Re: [PATCH 7/9] epoll: Split handling of listening TCP sockets into their own handler
Date: Wed, 9 Aug 2023 16:29:54 +1000 [thread overview]
Message-ID: <ZNMyYplt2izWSudj@zatzit> (raw)
In-Reply-To: <20230807134631.1400119-8-david@gibson.dropbear.id.au>
[-- Attachment #1: Type: text/plain, Size: 6834 bytes --]
On Mon, Aug 07, 2023 at 11:46:29PM +1000, David Gibson wrote:
> tcp_sock_handler() handles both listening TCP sockets and connected TCP
> sockets, but what it needs to do in those cases has essentially nothing in
> common. Therefore, give listening sockets their own epoll_type value and
> dispatch directly to their own handler from the top level. This also lets
> us remove the listen field from tcp_epoll_ref, since the information it
> carries is implicit in the epoll_type.
>
> Signed-off-by: David Gibson <david@gibson.dropbear.id.au>
Stefano,
I've realized an additional change that belongs with this patch, so
I'll be making a second spin. Go ahead and review, but don't apply
just yet.
> ---
> passt.c | 8 ++++++--
> passt.h | 4 +++-
> tcp.c | 31 +++++++++----------------------
> tcp.h | 8 ++++----
> util.c | 2 +-
> 5 files changed, 23 insertions(+), 30 deletions(-)
>
> diff --git a/passt.c b/passt.c
> index c750fad..c32981d 100644
> --- a/passt.c
> +++ b/passt.c
> @@ -56,7 +56,8 @@
> char pkt_buf[PKT_BUF_BYTES] __attribute__ ((aligned(PAGE_SIZE)));
>
> char *epoll_type_str[EPOLL_TYPE_MAX+1] = {
> - [EPOLL_TYPE_TCP] = "TCP socket",
> + [EPOLL_TYPE_TCP] = "connected TCP socket",
> + [EPOLL_TYPE_TCP_LISTEN] = "listening TCP socket",
> [EPOLL_TYPE_TCP_TIMER] = "TCP timer",
> [EPOLL_TYPE_UDP] = "UDP socket",
> [EPOLL_TYPE_ICMP] = "ICMP socket",
> @@ -323,7 +324,10 @@ loop:
> break;
> case EPOLL_TYPE_TCP:
> if (!c.no_tcp)
> - tcp_sock_handler(&c, ref, eventmask, &now);
> + tcp_sock_handler(&c, ref, eventmask);
> + break;
> + case EPOLL_TYPE_TCP_LISTEN:
> + tcp_listen_handler(&c, ref, &now);
> break;
> case EPOLL_TYPE_TCP_TIMER:
> tcp_timer_handler(&c, ref);
> diff --git a/passt.h b/passt.h
> index fc1efdb..176bc85 100644
> --- a/passt.h
> +++ b/passt.h
> @@ -47,8 +47,10 @@ union epoll_ref;
> enum epoll_type {
> /* Special value to indicate an invalid type */
> EPOLL_TYPE_NONE = 0,
> - /* TCP sockets */
> + /* Connected TCP sockets */
> EPOLL_TYPE_TCP,
> + /* Listening TCP sockets */
> + EPOLL_TYPE_TCP_LISTEN,
> /* timerfds used for TCP timers */
> EPOLL_TYPE_TCP_TIMER,
> /* UDP sockets */
> diff --git a/tcp.c b/tcp.c
> index 98761a2..c237393 100644
> --- a/tcp.c
> +++ b/tcp.c
> @@ -2765,22 +2765,20 @@ static void tcp_tap_conn_from_sock(struct ctx *c, union epoll_ref ref,
> }
>
> /**
> - * tcp_conn_from_sock() - Handle new connection request from listening socket
> + * tcp_listen_handler() - Handle new connection request from listening socket
> * @c: Execution context
> * @ref: epoll reference of listening socket
> * @now: Current timestamp
> */
> -static void tcp_conn_from_sock(struct ctx *c, union epoll_ref ref,
> - const struct timespec *now)
> +void tcp_listen_handler(struct ctx *c, union epoll_ref ref,
> + const struct timespec *now)
> {
> struct sockaddr_storage sa;
> union tcp_conn *conn;
> socklen_t sl;
> int s;
>
> - ASSERT(ref.tcp.listen);
> -
> - if (c->tcp.conn_count >= TCP_MAX_CONNS)
> + if (c->no_tcp || c->tcp.conn_count >= TCP_MAX_CONNS)
> return;
>
> sl = sizeof(sa);
> @@ -2926,19 +2924,10 @@ static void tcp_tap_sock_handler(struct ctx *c, struct tcp_tap_conn *conn,
> * @c: Execution context
> * @ref: epoll reference
> * @events: epoll events bitmap
> - * @now: Current timestamp
> */
> -void tcp_sock_handler(struct ctx *c, union epoll_ref ref, uint32_t events,
> - const struct timespec *now)
> +void tcp_sock_handler(struct ctx *c, union epoll_ref ref, uint32_t events)
> {
> - union tcp_conn *conn;
> -
> - if (ref.tcp.listen) {
> - tcp_conn_from_sock(c, ref, now);
> - return;
> - }
> -
> - conn = tc + ref.tcp.index;
> + union tcp_conn *conn = tc + ref.tcp.index;
>
> if (conn->c.spliced)
> tcp_splice_sock_handler(c, &conn->splice, ref.fd, events);
> @@ -2960,7 +2949,7 @@ static int tcp_sock_init_af(const struct ctx *c, int af, in_port_t port,
> const struct in_addr *addr, const char *ifname)
> {
> in_port_t idx = port + c->tcp.fwd_in.delta[port];
> - union tcp_epoll_ref tref = { .listen = 1, .index = idx };
> + union tcp_epoll_ref tref = { .index = idx };
> int s;
>
> s = sock_l4(c, af, IPPROTO_TCP, addr, ifname, port, tref.u32);
> @@ -3020,8 +3009,7 @@ int tcp_sock_init(const struct ctx *c, sa_family_t af, const void *addr,
> static void tcp_ns_sock_init4(const struct ctx *c, in_port_t port)
> {
> in_port_t idx = port + c->tcp.fwd_out.delta[port];
> - union tcp_epoll_ref tref = { .listen = 1, .outbound = 1,
> - .index = idx };
> + union tcp_epoll_ref tref = { .outbound = 1, .index = idx };
> struct in_addr loopback = { htonl(INADDR_LOOPBACK) };
> int s;
>
> @@ -3045,8 +3033,7 @@ static void tcp_ns_sock_init4(const struct ctx *c, in_port_t port)
> static void tcp_ns_sock_init6(const struct ctx *c, in_port_t port)
> {
> in_port_t idx = port + c->tcp.fwd_out.delta[port];
> - union tcp_epoll_ref tref = { .listen = 1, .outbound = 1,
> - .index = idx };
> + union tcp_epoll_ref tref = { .outbound = 1, .index = idx };
> int s;
>
> ASSERT(c->mode == MODE_PASTA);
> diff --git a/tcp.h b/tcp.h
> index 8eb7782..8189ac0 100644
> --- a/tcp.h
> +++ b/tcp.h
> @@ -14,8 +14,9 @@
> struct ctx;
>
> void tcp_timer_handler(struct ctx *c, union epoll_ref ref);
> -void tcp_sock_handler(struct ctx *c, union epoll_ref ref, uint32_t events,
> - const struct timespec *now);
> +void tcp_listen_handler(struct ctx *c, union epoll_ref ref,
> + const struct timespec *now);
> +void tcp_sock_handler(struct ctx *c, union epoll_ref ref, uint32_t events);
> int tcp_tap_handler(struct ctx *c, int af, const void *addr,
> const struct pool *p, const struct timespec *now);
> int tcp_sock_init(const struct ctx *c, sa_family_t af, const void *addr,
> @@ -37,8 +38,7 @@ void tcp_update_l2_buf(const unsigned char *eth_d, const unsigned char *eth_s,
> */
> union tcp_epoll_ref {
> struct {
> - uint32_t listen:1,
> - outbound:1,
> + uint32_t outbound:1,
> index:20;
> };
> uint32_t u32;
> diff --git a/util.c b/util.c
> index 2cac7ba..d965f48 100644
> --- a/util.c
> +++ b/util.c
> @@ -120,7 +120,7 @@ int sock_l4(const struct ctx *c, int af, uint8_t proto,
>
> switch (proto) {
> case IPPROTO_TCP:
> - ref.type = EPOLL_TYPE_TCP;
> + ref.type = EPOLL_TYPE_TCP_LISTEN;
> break;
> case IPPROTO_UDP:
> ref.type = EPOLL_TYPE_UDP;
--
David Gibson | I'll have my music baroque, and my code
david AT gibson.dropbear.id.au | minimalist, thank you. NOT _the_ _other_
| _way_ _around_!
http://www.ozlabs.org/~dgibson
[-- Attachment #2: signature.asc --]
[-- Type: application/pgp-signature, Size: 833 bytes --]
next prev parent reply other threads:[~2023-08-09 6:30 UTC|newest]
Thread overview: 17+ messages / expand[flat|nested] mbox.gz Atom feed top
2023-08-07 13:46 [PATCH 0/9] Clean up to epoll dispatch David Gibson
2023-08-07 13:46 ` [PATCH 1/9] epoll: Generalize epoll_ref to cover things other than sockets David Gibson
2023-08-09 19:59 ` Stefano Brivio
2023-08-10 0:23 ` David Gibson
2023-08-07 13:46 ` [PATCH 2/9] epoll: Always use epoll_ref for the epoll data variable David Gibson
2023-08-07 13:46 ` [PATCH 3/9] epoll: Fold sock_handler into general switch on epoll event fd David Gibson
2023-08-07 13:46 ` [PATCH 4/9] epoll: Split handling of ICMP and ICMPv6 sockets David Gibson
2023-08-07 13:46 ` [PATCH 5/9] epoll: Tiny cleanup to udp_sock_handler() David Gibson
2023-08-07 13:46 ` [PATCH 6/9] epoll: Split handling of TCP timerfds into its own handler function David Gibson
2023-08-07 13:46 ` [PATCH 7/9] epoll: Split handling of listening TCP sockets into their own handler David Gibson
2023-08-09 6:29 ` David Gibson [this message]
2023-08-07 13:46 ` [PATCH 8/9] epoll: Split listening Unix domain socket into its own type David Gibson
2023-08-09 19:59 ` Stefano Brivio
2023-08-10 1:08 ` David Gibson
2023-08-10 7:50 ` Stefano Brivio
2023-08-11 3:17 ` David Gibson
2023-08-07 13:46 ` [PATCH 9/9] epoll: Use different epoll types for passt and pasta tap fds David Gibson
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=ZNMyYplt2izWSudj@zatzit \
--to=david@gibson.dropbear.id.au \
--cc=passt-dev@passt.top \
--cc=sbrivio@redhat.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
Code repositories for project(s) associated with this public inbox
https://passt.top/passt
This is a public inbox; see the mirroring instructions
for how to clone and mirror all data and code used for this inbox,
as well as URLs for IMAP folder(s).