* [PATCH v2 1/3] tcp: Merge tcp_ns_sock_init[46]() into tcp_sock_init_one()
2025-10-22 3:15 [PATCH v2 0/3] Reduce differences between inbound and outbound socket binding David Gibson
@ 2025-10-22 3:15 ` David Gibson
2025-10-22 3:15 ` [PATCH v2 2/3] udp: Unify some more inbound/outbound parts of udp_sock_init() David Gibson
2025-10-22 3:15 ` [PATCH v2 3/3] tcp, udp: Bind outbound listening sockets by interface instead of address David Gibson
2 siblings, 0 replies; 6+ messages in thread
From: David Gibson @ 2025-10-22 3:15 UTC (permalink / raw)
To: passt-dev, Stefano Brivio; +Cc: David Gibson
Surprisingly little logic is shared between the path for creating a
listen()ing socket in the guest namespace versus in the host namespace.
Improve this, by extending tcp_sock_init_one() to take a pif parameter
indicating where it should open the socket. This allows
tcp_ns_sock_init[46]() to be removed entirely.
We generalise tcp_sock_init() in the same way, although we don't use it
yet, due to some subtle differences in how we bind for -t versus -T.
Signed-off-by: David Gibson <david@gibson.dropbear.id.au>
---
conf.c | 2 +-
tcp.c | 100 +++++++++++++++++++--------------------------------------
tcp.h | 5 +--
3 files changed, 37 insertions(+), 70 deletions(-)
diff --git a/conf.c b/conf.c
index 66b9e634..26f1bcc0 100644
--- a/conf.c
+++ b/conf.c
@@ -169,7 +169,7 @@ static void conf_ports_range_except(const struct ctx *c, char optname,
fwd->delta[i] = to - first;
if (optname == 't')
- ret = tcp_sock_init(c, addr, ifname, i);
+ ret = tcp_sock_init(c, PIF_HOST, addr, ifname, i);
else if (optname == 'u')
ret = udp_sock_init(c, 0, addr, ifname, i);
else
diff --git a/tcp.c b/tcp.c
index 0f9e9b3f..a62c8df1 100644
--- a/tcp.c
+++ b/tcp.c
@@ -2515,29 +2515,42 @@ void tcp_sock_handler(const struct ctx *c, union epoll_ref ref,
/**
* tcp_sock_init_one() - Initialise listening socket for address and port
* @c: Execution context
+ * @pif: Interface to open the socket for (PIF_HOST or PIF_SPLICE)
* @addr: Pointer to address for binding, NULL for dual stack any
* @ifname: Name of interface to bind to, NULL if not configured
* @port: Port, host order
*
* Return: fd for the new listening socket, negative error code on failure
+ *
+ * If pif == PIF_SPLICE, the caller must have already entered the guest ns.
*/
-static int tcp_sock_init_one(const struct ctx *c, const union inany_addr *addr,
- const char *ifname, in_port_t port)
+static int tcp_sock_init_one(const struct ctx *c, uint8_t pif,
+ const union inany_addr *addr, const char *ifname,
+ in_port_t port)
{
union tcp_listen_epoll_ref tref = {
.port = port,
- .pif = PIF_HOST,
+ .pif = pif,
};
+ const struct fwd_ports *fwd;
int s;
- s = pif_sock_l4(c, EPOLL_TYPE_TCP_LISTEN, PIF_HOST, addr,
- ifname, port, tref.u32);
+ if (pif == PIF_HOST)
+ fwd = &c->tcp.fwd_in;
+ else
+ fwd = &c->tcp.fwd_out;
+
+ s = pif_sock_l4(c, EPOLL_TYPE_TCP_LISTEN, pif, addr, ifname,
+ port, tref.u32);
+
+ if (fwd->mode == FWD_AUTO) {
+ int (*socks)[IP_VERSIONS] = pif == PIF_SPLICE ?
+ tcp_sock_ns : tcp_sock_init_ext;
- if (c->tcp.fwd_in.mode == FWD_AUTO) {
if (!addr || inany_v4(addr))
- tcp_sock_init_ext[port][V4] = s < 0 ? -1 : s;
+ socks[port][V4] = s < 0 ? -1 : s;
if (!addr || !inany_v4(addr))
- tcp_sock_init_ext[port][V6] = s < 0 ? -1 : s;
+ socks[port][V6] = s < 0 ? -1 : s;
}
if (s < 0)
@@ -2549,14 +2562,16 @@ static int tcp_sock_init_one(const struct ctx *c, const union inany_addr *addr,
/**
* tcp_sock_init() - Create listening sockets for a given host ("inbound") port
* @c: Execution context
+ * @pif: Interface to open the socket for (PIF_HOST or PIF_SPLICE)
* @addr: Pointer to address for binding, NULL if not configured
* @ifname: Name of interface to bind to, NULL if not configured
* @port: Port, host order
*
* Return: 0 on (partial) success, negative error code on (complete) failure
*/
-int tcp_sock_init(const struct ctx *c, const union inany_addr *addr,
- const char *ifname, in_port_t port)
+int tcp_sock_init(const struct ctx *c, uint8_t pif,
+ const union inany_addr *addr, const char *ifname,
+ in_port_t port)
{
int r4 = FD_REF_MAX + 1, r6 = FD_REF_MAX + 1;
@@ -2564,72 +2579,23 @@ int tcp_sock_init(const struct ctx *c, const union inany_addr *addr,
if (!addr && c->ifi4 && c->ifi6)
/* Attempt to get a dual stack socket */
- if (tcp_sock_init_one(c, NULL, ifname, port) >= 0)
+ if (tcp_sock_init_one(c, pif, NULL, ifname, port) >= 0)
return 0;
/* Otherwise create a socket per IP version */
if ((!addr || inany_v4(addr)) && c->ifi4)
- r4 = tcp_sock_init_one(c, addr ? addr : &inany_any4,
- ifname, port);
+ r4 = tcp_sock_init_one(c, pif,
+ addr ? addr : &inany_any4, ifname, port);
if ((!addr || !inany_v4(addr)) && c->ifi6)
- r6 = tcp_sock_init_one(c, addr ? addr : &inany_any6,
- ifname, port);
+ r6 = tcp_sock_init_one(c, pif,
+ addr ? addr : &inany_any6, ifname, port);
if (IN_INTERVAL(0, FD_REF_MAX, r4) || IN_INTERVAL(0, FD_REF_MAX, r6))
return 0;
return r4 < 0 ? r4 : r6;
}
-
-/**
- * tcp_ns_sock_init4() - Init socket to listen for outbound IPv4 connections
- * @c: Execution context
- * @port: Port, host order
- */
-static void tcp_ns_sock_init4(const struct ctx *c, in_port_t port)
-{
- union tcp_listen_epoll_ref tref = {
- .port = port,
- .pif = PIF_SPLICE,
- };
- int s;
-
- ASSERT(c->mode == MODE_PASTA);
-
- s = pif_sock_l4(c, EPOLL_TYPE_TCP_LISTEN, PIF_SPLICE, &inany_loopback4,
- NULL, port, tref.u32);
- if (s < 0)
- s = -1;
-
- if (c->tcp.fwd_out.mode == FWD_AUTO)
- tcp_sock_ns[port][V4] = s;
-}
-
-/**
- * tcp_ns_sock_init6() - Init socket to listen for outbound IPv6 connections
- * @c: Execution context
- * @port: Port, host order
- */
-static void tcp_ns_sock_init6(const struct ctx *c, in_port_t port)
-{
- union tcp_listen_epoll_ref tref = {
- .port = port,
- .pif = PIF_SPLICE,
- };
- int s;
-
- ASSERT(c->mode == MODE_PASTA);
-
- s = pif_sock_l4(c, EPOLL_TYPE_TCP_LISTEN, PIF_SPLICE, &inany_loopback6,
- NULL, port, tref.u32);
- if (s < 0)
- s = -1;
-
- if (c->tcp.fwd_out.mode == FWD_AUTO)
- tcp_sock_ns[port][V6] = s;
-}
-
/**
* tcp_ns_sock_init() - Init socket to listen for spliced outbound connections
* @c: Execution context
@@ -2640,9 +2606,9 @@ static void tcp_ns_sock_init(const struct ctx *c, in_port_t port)
ASSERT(!c->no_tcp);
if (c->ifi4)
- tcp_ns_sock_init4(c, port);
+ tcp_sock_init_one(c, PIF_SPLICE, &inany_loopback4, NULL, port);
if (c->ifi6)
- tcp_ns_sock_init6(c, port);
+ tcp_sock_init_one(c, PIF_SPLICE, &inany_loopback6, NULL, port);
}
/**
@@ -2845,7 +2811,7 @@ static void tcp_port_rebind(struct ctx *c, bool outbound)
if (outbound)
tcp_ns_sock_init(c, port);
else
- tcp_sock_init(c, NULL, NULL, port);
+ tcp_sock_init(c, PIF_HOST, NULL, NULL, port);
}
}
}
diff --git a/tcp.h b/tcp.h
index 234a8033..fb22bac0 100644
--- a/tcp.h
+++ b/tcp.h
@@ -18,8 +18,9 @@ void tcp_sock_handler(const struct ctx *c, union epoll_ref ref,
int tcp_tap_handler(const struct ctx *c, uint8_t pif, sa_family_t af,
const void *saddr, const void *daddr, uint32_t flow_lbl,
const struct pool *p, int idx, const struct timespec *now);
-int tcp_sock_init(const struct ctx *c, const union inany_addr *addr,
- const char *ifname, in_port_t port);
+int tcp_sock_init(const struct ctx *c, uint8_t pif,
+ const union inany_addr *addr, const char *ifname,
+ in_port_t port);
int tcp_init(struct ctx *c);
void tcp_timer(struct ctx *c, const struct timespec *now);
void tcp_defer_handler(struct ctx *c);
--
2.51.0
^ permalink raw reply [flat|nested] 6+ messages in thread* [PATCH v2 2/3] udp: Unify some more inbound/outbound parts of udp_sock_init()
2025-10-22 3:15 [PATCH v2 0/3] Reduce differences between inbound and outbound socket binding David Gibson
2025-10-22 3:15 ` [PATCH v2 1/3] tcp: Merge tcp_ns_sock_init[46]() into tcp_sock_init_one() David Gibson
@ 2025-10-22 3:15 ` David Gibson
2025-10-28 23:13 ` Stefano Brivio
2025-10-22 3:15 ` [PATCH v2 3/3] tcp, udp: Bind outbound listening sockets by interface instead of address David Gibson
2 siblings, 1 reply; 6+ messages in thread
From: David Gibson @ 2025-10-22 3:15 UTC (permalink / raw)
To: passt-dev, Stefano Brivio; +Cc: David Gibson
udp_sock_init() takes an 'ns' parameter determining if it creates a socket
in the guest namespace or host namespace. Alter it to take a pif
parameter instead, like tcp_sock_init(), and use that change to slightly
reduce code duplication between the HOST and SPLICE cases.
Signed-off-by: David Gibson <david@gibson.dropbear.id.au>
---
conf.c | 2 +-
udp.c | 65 +++++++++++++++++++++++++++++++---------------------------
udp.h | 5 +++--
3 files changed, 39 insertions(+), 33 deletions(-)
diff --git a/conf.c b/conf.c
index 26f1bcc0..08cb50aa 100644
--- a/conf.c
+++ b/conf.c
@@ -171,7 +171,7 @@ static void conf_ports_range_except(const struct ctx *c, char optname,
if (optname == 't')
ret = tcp_sock_init(c, PIF_HOST, addr, ifname, i);
else if (optname == 'u')
- ret = udp_sock_init(c, 0, addr, ifname, i);
+ ret = udp_sock_init(c, PIF_HOST, addr, ifname, i);
else
/* No way to check in advance for -T and -U */
ret = 0;
diff --git a/udp.c b/udp.c
index 86585b7e..7f5faf20 100644
--- a/udp.c
+++ b/udp.c
@@ -1093,64 +1093,68 @@ int udp_tap_handler(const struct ctx *c, uint8_t pif,
/**
* udp_sock_init() - Initialise listening sockets for a given port
* @c: Execution context
- * @ns: In pasta mode, if set, bind with loopback address in namespace
+ * @pif: Interface to open the socket for (PIF_HOST or PIF_SPLICE)
* @addr: Pointer to address for binding, NULL if not configured
* @ifname: Name of interface to bind to, NULL if not configured
* @port: Port, host order
*
* Return: 0 on (partial) success, negative error code on (complete) failure
*/
-int udp_sock_init(const struct ctx *c, int ns, const union inany_addr *addr,
- const char *ifname, in_port_t port)
+int udp_sock_init(const struct ctx *c, uint8_t pif,
+ const union inany_addr *addr, const char *ifname,
+ in_port_t port)
{
union udp_listen_epoll_ref uref = {
- .pif = ns ? PIF_SPLICE : PIF_HOST,
+ .pif = pif,
.port = port,
};
int r4 = FD_REF_MAX + 1, r6 = FD_REF_MAX + 1;
+ int (*socks)[NUM_PORTS];
ASSERT(!c->no_udp);
+ ASSERT(pif_is_socket(pif))
- if (!addr && c->ifi4 && c->ifi6 && !ns) {
+ if (pif == PIF_HOST)
+ socks = udp_splice_init;
+ else
+ socks = udp_splice_ns;
+
+ if (!addr && c->ifi4 && c->ifi6 && pif == PIF_HOST) {
int s;
/* Attempt to get a dual stack socket */
s = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, PIF_HOST,
NULL, ifname, port, uref.u32);
- udp_splice_init[V4][port] = s < 0 ? -1 : s;
- udp_splice_init[V6][port] = s < 0 ? -1 : s;
+ socks[V4][port] = s < 0 ? -1 : s;
+ socks[V6][port] = s < 0 ? -1 : s;
if (IN_INTERVAL(0, FD_REF_MAX, s))
return 0;
}
if ((!addr || inany_v4(addr)) && c->ifi4) {
- if (!ns) {
- r4 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, PIF_HOST,
- addr ? addr : &inany_any4, ifname,
- port, uref.u32);
+ const union inany_addr *a = addr ?
+ addr : &inany_any4;
- udp_splice_init[V4][port] = r4 < 0 ? -1 : r4;
- } else {
- r4 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, PIF_SPLICE,
- &inany_loopback4, ifname,
- port, uref.u32);
- udp_splice_ns[V4][port] = r4 < 0 ? -1 : r4;
- }
+ if (pif == PIF_SPLICE)
+ a = &inany_loopback4;
+
+ r4 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, pif, a, ifname,
+ port, uref.u32);
+
+ socks[V4][port] = r4 < 0 ? -1 : r4;
}
if ((!addr || !inany_v4(addr)) && c->ifi6) {
- if (!ns) {
- r6 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, PIF_HOST,
- addr ? addr : &inany_any6, ifname,
- port, uref.u32);
+ const union inany_addr *a = addr ?
+ addr : &inany_any6;
- udp_splice_init[V6][port] = r6 < 0 ? -1 : r6;
- } else {
- r6 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, PIF_SPLICE,
- &inany_loopback6, ifname,
- port, uref.u32);
- udp_splice_ns[V6][port] = r6 < 0 ? -1 : r6;
- }
+ if (pif == PIF_SPLICE)
+ a = &inany_loopback6;
+
+ r6 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, pif, a, ifname,
+ port, uref.u32);
+
+ socks[V6][port] = r6 < 0 ? -1 : r6;
}
if (IN_INTERVAL(0, FD_REF_MAX, r4) || IN_INTERVAL(0, FD_REF_MAX, r6))
@@ -1216,7 +1220,8 @@ static void udp_port_rebind(struct ctx *c, bool outbound)
if ((c->ifi4 && socks[V4][port] == -1) ||
(c->ifi6 && socks[V6][port] == -1))
- udp_sock_init(c, outbound, NULL, NULL, port);
+ udp_sock_init(c, outbound ? PIF_SPLICE : PIF_HOST,
+ NULL, NULL, port);
}
}
diff --git a/udp.h b/udp.h
index 8f8531ad..f78dc528 100644
--- a/udp.h
+++ b/udp.h
@@ -17,8 +17,9 @@ int udp_tap_handler(const struct ctx *c, uint8_t pif,
sa_family_t af, const void *saddr, const void *daddr,
uint8_t ttl, const struct pool *p, int idx,
const struct timespec *now);
-int udp_sock_init(const struct ctx *c, int ns, const union inany_addr *addr,
- const char *ifname, in_port_t port);
+int udp_sock_init(const struct ctx *c, uint8_t pif,
+ const union inany_addr *addr, const char *ifname,
+ in_port_t port);
int udp_init(struct ctx *c);
void udp_timer(struct ctx *c, const struct timespec *now);
void udp_update_l2_buf(const unsigned char *eth_d, const unsigned char *eth_s);
--
2.51.0
^ permalink raw reply [flat|nested] 6+ messages in thread* Re: [PATCH v2 2/3] udp: Unify some more inbound/outbound parts of udp_sock_init()
2025-10-22 3:15 ` [PATCH v2 2/3] udp: Unify some more inbound/outbound parts of udp_sock_init() David Gibson
@ 2025-10-28 23:13 ` Stefano Brivio
2025-10-29 0:22 ` David Gibson
0 siblings, 1 reply; 6+ messages in thread
From: Stefano Brivio @ 2025-10-28 23:13 UTC (permalink / raw)
To: David Gibson; +Cc: passt-dev
Sorry for the delay but...
On Wed, 22 Oct 2025 14:15:26 +1100
David Gibson <david@gibson.dropbear.id.au> wrote:
> udp_sock_init() takes an 'ns' parameter determining if it creates a socket
> in the guest namespace or host namespace. Alter it to take a pif
> parameter instead, like tcp_sock_init(), and use that change to slightly
> reduce code duplication between the HOST and SPLICE cases.
>
> Signed-off-by: David Gibson <david@gibson.dropbear.id.au>
> ---
> conf.c | 2 +-
> udp.c | 65 +++++++++++++++++++++++++++++++---------------------------
> udp.h | 5 +++--
> 3 files changed, 39 insertions(+), 33 deletions(-)
>
> diff --git a/conf.c b/conf.c
> index 26f1bcc0..08cb50aa 100644
> --- a/conf.c
> +++ b/conf.c
> @@ -171,7 +171,7 @@ static void conf_ports_range_except(const struct ctx *c, char optname,
> if (optname == 't')
> ret = tcp_sock_init(c, PIF_HOST, addr, ifname, i);
> else if (optname == 'u')
> - ret = udp_sock_init(c, 0, addr, ifname, i);
> + ret = udp_sock_init(c, PIF_HOST, addr, ifname, i);
> else
> /* No way to check in advance for -T and -U */
> ret = 0;
> diff --git a/udp.c b/udp.c
> index 86585b7e..7f5faf20 100644
> --- a/udp.c
> +++ b/udp.c
> @@ -1093,64 +1093,68 @@ int udp_tap_handler(const struct ctx *c, uint8_t pif,
> /**
> * udp_sock_init() - Initialise listening sockets for a given port
> * @c: Execution context
> - * @ns: In pasta mode, if set, bind with loopback address in namespace
> + * @pif: Interface to open the socket for (PIF_HOST or PIF_SPLICE)
> * @addr: Pointer to address for binding, NULL if not configured
> * @ifname: Name of interface to bind to, NULL if not configured
> * @port: Port, host order
> *
> * Return: 0 on (partial) success, negative error code on (complete) failure
> */
> -int udp_sock_init(const struct ctx *c, int ns, const union inany_addr *addr,
> - const char *ifname, in_port_t port)
> +int udp_sock_init(const struct ctx *c, uint8_t pif,
> + const union inany_addr *addr, const char *ifname,
> + in_port_t port)
> {
> union udp_listen_epoll_ref uref = {
> - .pif = ns ? PIF_SPLICE : PIF_HOST,
> + .pif = pif,
> .port = port,
> };
> int r4 = FD_REF_MAX + 1, r6 = FD_REF_MAX + 1;
> + int (*socks)[NUM_PORTS];
>
> ASSERT(!c->no_udp);
> + ASSERT(pif_is_socket(pif))
...this doesn't build. If I add the missing semicolon everything is
fine. Should I? Worth double checking on your side?
The series looks otherwise good to me.
>
> - if (!addr && c->ifi4 && c->ifi6 && !ns) {
> + if (pif == PIF_HOST)
> + socks = udp_splice_init;
> + else
> + socks = udp_splice_ns;
> +
> + if (!addr && c->ifi4 && c->ifi6 && pif == PIF_HOST) {
> int s;
>
> /* Attempt to get a dual stack socket */
> s = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, PIF_HOST,
> NULL, ifname, port, uref.u32);
> - udp_splice_init[V4][port] = s < 0 ? -1 : s;
> - udp_splice_init[V6][port] = s < 0 ? -1 : s;
> + socks[V4][port] = s < 0 ? -1 : s;
> + socks[V6][port] = s < 0 ? -1 : s;
> if (IN_INTERVAL(0, FD_REF_MAX, s))
> return 0;
> }
>
> if ((!addr || inany_v4(addr)) && c->ifi4) {
> - if (!ns) {
> - r4 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, PIF_HOST,
> - addr ? addr : &inany_any4, ifname,
> - port, uref.u32);
> + const union inany_addr *a = addr ?
> + addr : &inany_any4;
>
> - udp_splice_init[V4][port] = r4 < 0 ? -1 : r4;
> - } else {
> - r4 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, PIF_SPLICE,
> - &inany_loopback4, ifname,
> - port, uref.u32);
> - udp_splice_ns[V4][port] = r4 < 0 ? -1 : r4;
> - }
> + if (pif == PIF_SPLICE)
> + a = &inany_loopback4;
> +
> + r4 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, pif, a, ifname,
> + port, uref.u32);
> +
> + socks[V4][port] = r4 < 0 ? -1 : r4;
> }
>
> if ((!addr || !inany_v4(addr)) && c->ifi6) {
> - if (!ns) {
> - r6 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, PIF_HOST,
> - addr ? addr : &inany_any6, ifname,
> - port, uref.u32);
> + const union inany_addr *a = addr ?
> + addr : &inany_any6;
>
> - udp_splice_init[V6][port] = r6 < 0 ? -1 : r6;
> - } else {
> - r6 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, PIF_SPLICE,
> - &inany_loopback6, ifname,
> - port, uref.u32);
> - udp_splice_ns[V6][port] = r6 < 0 ? -1 : r6;
> - }
> + if (pif == PIF_SPLICE)
> + a = &inany_loopback6;
> +
> + r6 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, pif, a, ifname,
> + port, uref.u32);
> +
> + socks[V6][port] = r6 < 0 ? -1 : r6;
> }
>
> if (IN_INTERVAL(0, FD_REF_MAX, r4) || IN_INTERVAL(0, FD_REF_MAX, r6))
> @@ -1216,7 +1220,8 @@ static void udp_port_rebind(struct ctx *c, bool outbound)
>
> if ((c->ifi4 && socks[V4][port] == -1) ||
> (c->ifi6 && socks[V6][port] == -1))
> - udp_sock_init(c, outbound, NULL, NULL, port);
> + udp_sock_init(c, outbound ? PIF_SPLICE : PIF_HOST,
> + NULL, NULL, port);
> }
> }
>
> diff --git a/udp.h b/udp.h
> index 8f8531ad..f78dc528 100644
> --- a/udp.h
> +++ b/udp.h
> @@ -17,8 +17,9 @@ int udp_tap_handler(const struct ctx *c, uint8_t pif,
> sa_family_t af, const void *saddr, const void *daddr,
> uint8_t ttl, const struct pool *p, int idx,
> const struct timespec *now);
> -int udp_sock_init(const struct ctx *c, int ns, const union inany_addr *addr,
> - const char *ifname, in_port_t port);
> +int udp_sock_init(const struct ctx *c, uint8_t pif,
> + const union inany_addr *addr, const char *ifname,
> + in_port_t port);
> int udp_init(struct ctx *c);
> void udp_timer(struct ctx *c, const struct timespec *now);
> void udp_update_l2_buf(const unsigned char *eth_d, const unsigned char *eth_s);
--
Stefano
^ permalink raw reply [flat|nested] 6+ messages in thread* Re: [PATCH v2 2/3] udp: Unify some more inbound/outbound parts of udp_sock_init()
2025-10-28 23:13 ` Stefano Brivio
@ 2025-10-29 0:22 ` David Gibson
0 siblings, 0 replies; 6+ messages in thread
From: David Gibson @ 2025-10-29 0:22 UTC (permalink / raw)
To: Stefano Brivio; +Cc: passt-dev
[-- Attachment #1: Type: text/plain, Size: 3041 bytes --]
On Wed, Oct 29, 2025 at 12:13:38AM +0100, Stefano Brivio wrote:
> Sorry for the delay but...
>
> On Wed, 22 Oct 2025 14:15:26 +1100
> David Gibson <david@gibson.dropbear.id.au> wrote:
>
> > udp_sock_init() takes an 'ns' parameter determining if it creates a socket
> > in the guest namespace or host namespace. Alter it to take a pif
> > parameter instead, like tcp_sock_init(), and use that change to slightly
> > reduce code duplication between the HOST and SPLICE cases.
> >
> > Signed-off-by: David Gibson <david@gibson.dropbear.id.au>
> > ---
> > conf.c | 2 +-
> > udp.c | 65 +++++++++++++++++++++++++++++++---------------------------
> > udp.h | 5 +++--
> > 3 files changed, 39 insertions(+), 33 deletions(-)
> >
> > diff --git a/conf.c b/conf.c
> > index 26f1bcc0..08cb50aa 100644
> > --- a/conf.c
> > +++ b/conf.c
> > @@ -171,7 +171,7 @@ static void conf_ports_range_except(const struct ctx *c, char optname,
> > if (optname == 't')
> > ret = tcp_sock_init(c, PIF_HOST, addr, ifname, i);
> > else if (optname == 'u')
> > - ret = udp_sock_init(c, 0, addr, ifname, i);
> > + ret = udp_sock_init(c, PIF_HOST, addr, ifname, i);
> > else
> > /* No way to check in advance for -T and -U */
> > ret = 0;
> > diff --git a/udp.c b/udp.c
> > index 86585b7e..7f5faf20 100644
> > --- a/udp.c
> > +++ b/udp.c
> > @@ -1093,64 +1093,68 @@ int udp_tap_handler(const struct ctx *c, uint8_t pif,
> > /**
> > * udp_sock_init() - Initialise listening sockets for a given port
> > * @c: Execution context
> > - * @ns: In pasta mode, if set, bind with loopback address in namespace
> > + * @pif: Interface to open the socket for (PIF_HOST or PIF_SPLICE)
> > * @addr: Pointer to address for binding, NULL if not configured
> > * @ifname: Name of interface to bind to, NULL if not configured
> > * @port: Port, host order
> > *
> > * Return: 0 on (partial) success, negative error code on (complete) failure
> > */
> > -int udp_sock_init(const struct ctx *c, int ns, const union inany_addr *addr,
> > - const char *ifname, in_port_t port)
> > +int udp_sock_init(const struct ctx *c, uint8_t pif,
> > + const union inany_addr *addr, const char *ifname,
> > + in_port_t port)
> > {
> > union udp_listen_epoll_ref uref = {
> > - .pif = ns ? PIF_SPLICE : PIF_HOST,
> > + .pif = pif,
> > .port = port,
> > };
> > int r4 = FD_REF_MAX + 1, r6 = FD_REF_MAX + 1;
> > + int (*socks)[NUM_PORTS];
> >
> > ASSERT(!c->no_udp);
> > + ASSERT(pif_is_socket(pif))
>
> ...this doesn't build. If I add the missing semicolon everything is
> fine. Should I? Worth double checking on your side?
Oh. Wow. Don't know how I missed that. I'll fix it. I need to
respin to add the fallback for kernels without BINDTODEVICE anyway.
--
David Gibson (he or they) | I'll have my music baroque, and my code
david AT gibson.dropbear.id.au | minimalist, thank you, not the other way
| around.
http://www.ozlabs.org/~dgibson
[-- Attachment #2: signature.asc --]
[-- Type: application/pgp-signature, Size: 833 bytes --]
^ permalink raw reply [flat|nested] 6+ messages in thread
* [PATCH v2 3/3] tcp, udp: Bind outbound listening sockets by interface instead of address
2025-10-22 3:15 [PATCH v2 0/3] Reduce differences between inbound and outbound socket binding David Gibson
2025-10-22 3:15 ` [PATCH v2 1/3] tcp: Merge tcp_ns_sock_init[46]() into tcp_sock_init_one() David Gibson
2025-10-22 3:15 ` [PATCH v2 2/3] udp: Unify some more inbound/outbound parts of udp_sock_init() David Gibson
@ 2025-10-22 3:15 ` David Gibson
2 siblings, 0 replies; 6+ messages in thread
From: David Gibson @ 2025-10-22 3:15 UTC (permalink / raw)
To: passt-dev, Stefano Brivio; +Cc: David Gibson
Currently, outbound forwards (-T, -U) are handled by sockets bound to the
loopback address. Typically we create two sockets, one for 127.0.0.1 and
one for ::1.
This has some disadvantages:
* The guest can't connect to these services using its global IP address,
it must explicitly use 127.0.0.1 or ::1 (bug 100)
* The guest can't even connect via 127.0.0.0/8 addresses other than
127.0.0.1
* We can't use dual-stack sockets, we have to have separate sockets for
IPv4 and IPv6.
The restriction exist for a reason though. If the guest has any interfaces
other than pasta (e.g. a VPN tunnel) external hosts could reach the host
via the forwards. Especially combined with -T auto / -U auto this would
make it very easy to make a mistake with nasty security implications.
We can achieve both goals, however, if we don't bind the outbound listening
sockets to a particular address, but _do_ use SO_BINDTODEVICE to restrict
them to the "lo" interface.
Link: https://bugs.passt.top/show_bug.cgi?id=100
Signed-off-by: David Gibson <david@gibson.dropbear.id.au>
---
pif.c | 6 ------
tcp.c | 18 ++----------------
udp.c | 27 ++++++++++-----------------
3 files changed, 12 insertions(+), 39 deletions(-)
diff --git a/pif.c b/pif.c
index 592fafaa..84e3ceae 100644
--- a/pif.c
+++ b/pif.c
@@ -87,12 +87,6 @@ int pif_sock_l4(const struct ctx *c, enum epoll_type type, uint8_t pif,
ASSERT(pif_is_socket(pif));
- if (pif == PIF_SPLICE) {
- /* Sanity checks */
- ASSERT(!ifname);
- ASSERT(addr && inany_is_loopback(addr));
- }
-
if (!addr)
return sock_l4_sa(c, type, &sa, sizeof(sa.sa6),
ifname, false, data);
diff --git a/tcp.c b/tcp.c
index a62c8df1..c3500f5e 100644
--- a/tcp.c
+++ b/tcp.c
@@ -2596,20 +2596,6 @@ int tcp_sock_init(const struct ctx *c, uint8_t pif,
return r4 < 0 ? r4 : r6;
}
-/**
- * tcp_ns_sock_init() - Init socket to listen for spliced outbound connections
- * @c: Execution context
- * @port: Port, host order
- */
-static void tcp_ns_sock_init(const struct ctx *c, in_port_t port)
-{
- ASSERT(!c->no_tcp);
-
- if (c->ifi4)
- tcp_sock_init_one(c, PIF_SPLICE, &inany_loopback4, NULL, port);
- if (c->ifi6)
- tcp_sock_init_one(c, PIF_SPLICE, &inany_loopback6, NULL, port);
-}
/**
* tcp_ns_socks_init() - Bind sockets in namespace for outbound connections
@@ -2629,7 +2615,7 @@ static int tcp_ns_socks_init(void *arg)
if (!bitmap_isset(c->tcp.fwd_out.map, port))
continue;
- tcp_ns_sock_init(c, port);
+ tcp_sock_init(c, PIF_SPLICE, NULL, "lo", port);
}
return 0;
@@ -2809,7 +2795,7 @@ static void tcp_port_rebind(struct ctx *c, bool outbound)
if ((c->ifi4 && socks[port][V4] == -1) ||
(c->ifi6 && socks[port][V6] == -1)) {
if (outbound)
- tcp_ns_sock_init(c, port);
+ tcp_sock_init(c, PIF_SPLICE, NULL, "lo", port);
else
tcp_sock_init(c, PIF_HOST, NULL, NULL, port);
}
diff --git a/udp.c b/udp.c
index 7f5faf20..1984bb80 100644
--- a/udp.c
+++ b/udp.c
@@ -1132,26 +1132,16 @@ int udp_sock_init(const struct ctx *c, uint8_t pif,
}
if ((!addr || inany_v4(addr)) && c->ifi4) {
- const union inany_addr *a = addr ?
- addr : &inany_any4;
-
- if (pif == PIF_SPLICE)
- a = &inany_loopback4;
-
- r4 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, pif, a, ifname,
+ r4 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, pif,
+ addr ? addr : &inany_any4, ifname,
port, uref.u32);
socks[V4][port] = r4 < 0 ? -1 : r4;
}
if ((!addr || !inany_v4(addr)) && c->ifi6) {
- const union inany_addr *a = addr ?
- addr : &inany_any6;
-
- if (pif == PIF_SPLICE)
- a = &inany_loopback6;
-
- r6 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, pif, a, ifname,
+ r6 = pif_sock_l4(c, EPOLL_TYPE_UDP_LISTEN, pif,
+ addr ? addr : &inany_any6, ifname,
port, uref.u32);
socks[V6][port] = r6 < 0 ? -1 : r6;
@@ -1219,9 +1209,12 @@ static void udp_port_rebind(struct ctx *c, bool outbound)
continue;
if ((c->ifi4 && socks[V4][port] == -1) ||
- (c->ifi6 && socks[V6][port] == -1))
- udp_sock_init(c, outbound ? PIF_SPLICE : PIF_HOST,
- NULL, NULL, port);
+ (c->ifi6 && socks[V6][port] == -1)) {
+ if (outbound)
+ udp_sock_init(c, PIF_SPLICE, NULL, "lo", port);
+ else
+ udp_sock_init(c, PIF_HOST, NULL, NULL, port);
+ }
}
}
--
2.51.0
^ permalink raw reply [flat|nested] 6+ messages in thread